aboutsummaryrefslogtreecommitdiffstats
path: root/tools
diff options
context:
space:
mode:
Diffstat (limited to 'tools')
-rw-r--r--tools/firewire/Makefile19
-rw-r--r--tools/firewire/decode-fcp.c213
-rw-r--r--tools/firewire/list.h62
-rw-r--r--tools/firewire/nosy-dump.c1031
-rw-r--r--tools/firewire/nosy-dump.h173
-rw-r--r--tools/perf/.gitignore1
-rw-r--r--tools/perf/Documentation/Makefile4
-rw-r--r--tools/perf/Documentation/perf-annotate.txt2
-rw-r--r--tools/perf/Documentation/perf-archive.txt22
-rw-r--r--tools/perf/Documentation/perf-bench.txt8
-rw-r--r--tools/perf/Documentation/perf-buildid-cache.txt33
-rw-r--r--tools/perf/Documentation/perf-diff.txt2
-rw-r--r--tools/perf/Documentation/perf-inject.txt35
-rw-r--r--tools/perf/Documentation/perf-kmem.txt2
-rw-r--r--tools/perf/Documentation/perf-kvm.txt68
-rw-r--r--tools/perf/Documentation/perf-list.txt33
-rw-r--r--tools/perf/Documentation/perf-lock.txt29
-rw-r--r--tools/perf/Documentation/perf-probe.txt95
-rw-r--r--tools/perf/Documentation/perf-record.txt8
-rw-r--r--tools/perf/Documentation/perf-sched.txt4
-rw-r--r--tools/perf/Documentation/perf-stat.txt7
-rw-r--r--tools/perf/Documentation/perf-test.txt22
-rw-r--r--tools/perf/Documentation/perf-top.txt2
-rw-r--r--tools/perf/Documentation/perf-trace-perl.txt8
-rw-r--r--tools/perf/Documentation/perf-trace-python.txt623
-rw-r--r--tools/perf/Documentation/perf-trace.txt17
-rw-r--r--tools/perf/Documentation/perf.txt2
-rw-r--r--tools/perf/Makefile453
-rw-r--r--tools/perf/arch/powerpc/Makefile4
-rw-r--r--tools/perf/arch/powerpc/util/dwarf-regs.c88
-rw-r--r--tools/perf/arch/sparc/Makefile4
-rw-r--r--tools/perf/arch/sparc/util/dwarf-regs.c43
-rw-r--r--tools/perf/arch/x86/Makefile4
-rw-r--r--tools/perf/arch/x86/util/dwarf-regs.c75
-rw-r--r--tools/perf/bench/mem-memcpy.c3
-rw-r--r--tools/perf/bench/sched-messaging.c10
-rw-r--r--tools/perf/bench/sched-pipe.c2
-rw-r--r--tools/perf/builtin-annotate.c352
-rw-r--r--tools/perf/builtin-bench.c4
-rw-r--r--tools/perf/builtin-buildid-cache.c133
-rw-r--r--tools/perf/builtin-buildid-list.c39
-rw-r--r--tools/perf/builtin-diff.c127
-rw-r--r--tools/perf/builtin-help.c13
-rw-r--r--tools/perf/builtin-inject.c228
-rw-r--r--tools/perf/builtin-kmem.c64
-rw-r--r--tools/perf/builtin-kvm.c144
-rw-r--r--tools/perf/builtin-lock.c1005
-rw-r--r--tools/perf/builtin-probe.c277
-rw-r--r--tools/perf/builtin-record.c623
-rw-r--r--tools/perf/builtin-report.c306
-rw-r--r--tools/perf/builtin-sched.c66
-rw-r--r--tools/perf/builtin-stat.c271
-rw-r--r--tools/perf/builtin-test.c281
-rw-r--r--tools/perf/builtin-timechart.c136
-rw-r--r--tools/perf/builtin-top.c423
-rw-r--r--tools/perf/builtin-trace.c133
-rw-r--r--tools/perf/builtin.h5
-rw-r--r--tools/perf/command-list.txt6
-rw-r--r--tools/perf/design.txt8
-rw-r--r--tools/perf/perf-archive.sh36
-rw-r--r--tools/perf/perf.c56
-rw-r--r--tools/perf/perf.h13
-rw-r--r--tools/perf/scripts/perl/Perf-Trace-Util/Context.c5
-rw-r--r--tools/perf/scripts/perl/Perf-Trace-Util/Context.xs3
-rw-r--r--tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm8
-rw-r--r--tools/perf/scripts/perl/bin/check-perf-trace-record7
-rw-r--r--tools/perf/scripts/perl/bin/check-perf-trace-report6
-rw-r--r--tools/perf/scripts/perl/bin/failed-syscalls-record2
-rw-r--r--tools/perf/scripts/perl/bin/failed-syscalls-report10
-rw-r--r--tools/perf/scripts/perl/bin/rw-by-file-record3
-rw-r--r--tools/perf/scripts/perl/bin/rw-by-file-report8
-rw-r--r--tools/perf/scripts/perl/bin/rw-by-pid-record2
-rw-r--r--tools/perf/scripts/perl/bin/rw-by-pid-report2
-rw-r--r--tools/perf/scripts/perl/bin/rwtop-record2
-rw-r--r--tools/perf/scripts/perl/bin/rwtop-report23
-rw-r--r--tools/perf/scripts/perl/bin/wakeup-latency-record2
-rw-r--r--tools/perf/scripts/perl/bin/wakeup-latency-report2
-rw-r--r--tools/perf/scripts/perl/bin/workqueue-stats-record2
-rw-r--r--tools/perf/scripts/perl/bin/workqueue-stats-report2
-rw-r--r--tools/perf/scripts/perl/failed-syscalls.pl42
-rw-r--r--tools/perf/scripts/perl/rw-by-pid.pl60
-rw-r--r--tools/perf/scripts/perl/rwtop.pl199
-rw-r--r--tools/perf/scripts/perl/wakeup-latency.pl12
-rw-r--r--tools/perf/scripts/perl/workqueue-stats.pl12
-rw-r--r--tools/perf/scripts/python/Perf-Trace-Util/Context.c88
-rw-r--r--tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Core.py91
-rw-r--r--tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py28
-rw-r--r--tools/perf/scripts/python/bin/failed-syscalls-by-pid-record2
-rw-r--r--tools/perf/scripts/python/bin/failed-syscalls-by-pid-report10
-rw-r--r--tools/perf/scripts/python/bin/sctop-record2
-rw-r--r--tools/perf/scripts/python/bin/sctop-report24
-rw-r--r--tools/perf/scripts/python/bin/syscall-counts-by-pid-record2
-rw-r--r--tools/perf/scripts/python/bin/syscall-counts-by-pid-report10
-rw-r--r--tools/perf/scripts/python/bin/syscall-counts-record2
-rw-r--r--tools/perf/scripts/python/bin/syscall-counts-report10
-rw-r--r--tools/perf/scripts/python/check-perf-trace.py82
-rw-r--r--tools/perf/scripts/python/failed-syscalls-by-pid.py68
-rw-r--r--tools/perf/scripts/python/sctop.py78
-rw-r--r--tools/perf/scripts/python/syscall-counts-by-pid.py64
-rw-r--r--tools/perf/scripts/python/syscall-counts.py58
-rwxr-xr-xtools/perf/util/PERF-VERSION-GEN23
-rw-r--r--tools/perf/util/abspath.c81
-rw-r--r--tools/perf/util/bitmap.c21
-rw-r--r--tools/perf/util/build-id.c61
-rw-r--r--tools/perf/util/build-id.h10
-rw-r--r--tools/perf/util/cache.h67
-rw-r--r--tools/perf/util/callchain.c131
-rw-r--r--tools/perf/util/callchain.h14
-rw-r--r--tools/perf/util/color.c48
-rw-r--r--tools/perf/util/color.h4
-rw-r--r--tools/perf/util/config.c461
-rw-r--r--tools/perf/util/cpumap.c59
-rw-r--r--tools/perf/util/cpumap.h7
-rw-r--r--tools/perf/util/data_map.c252
-rw-r--r--tools/perf/util/debug.c9
-rw-r--r--tools/perf/util/debug.h30
-rw-r--r--tools/perf/util/debugfs.c17
-rw-r--r--tools/perf/util/debugfs.h2
-rw-r--r--tools/perf/util/event.c475
-rw-r--r--tools/perf/util/event.h130
-rw-r--r--tools/perf/util/exec_cmd.c6
-rw-r--r--tools/perf/util/exec_cmd.h1
-rw-r--r--tools/perf/util/header.c745
-rw-r--r--tools/perf/util/header.h46
-rw-r--r--tools/perf/util/help.c30
-rw-r--r--tools/perf/util/hist.c660
-rw-r--r--tools/perf/util/hist.h122
-rw-r--r--tools/perf/util/hweight.c31
-rw-r--r--tools/perf/util/include/asm/bitops.h18
-rw-r--r--tools/perf/util/include/asm/hweight.h8
-rw-r--r--tools/perf/util/include/dwarf-regs.h8
-rw-r--r--tools/perf/util/include/linux/bitmap.h38
-rw-r--r--tools/perf/util/include/linux/bitops.h20
-rw-r--r--tools/perf/util/include/linux/compiler.h2
-rw-r--r--tools/perf/util/include/linux/hash.h5
-rw-r--r--tools/perf/util/include/linux/kernel.h12
-rw-r--r--tools/perf/util/map.c461
-rw-r--r--tools/perf/util/map.h217
-rw-r--r--tools/perf/util/newt.c1178
-rw-r--r--tools/perf/util/parse-events.c90
-rw-r--r--tools/perf/util/parse-events.h1
-rw-r--r--tools/perf/util/parse-options.c55
-rw-r--r--tools/perf/util/parse-options.h29
-rw-r--r--tools/perf/util/path.c204
-rw-r--r--tools/perf/util/probe-event.c1556
-rw-r--r--tools/perf/util/probe-event.h128
-rw-r--r--tools/perf/util/probe-finder.c1616
-rw-r--r--tools/perf/util/probe-finder.h81
-rw-r--r--tools/perf/util/pstack.c75
-rw-r--r--tools/perf/util/pstack.h12
-rw-r--r--tools/perf/util/quote.c433
-rw-r--r--tools/perf/util/quote.h39
-rw-r--r--tools/perf/util/run-command.c90
-rw-r--r--tools/perf/util/run-command.h30
-rw-r--r--tools/perf/util/scripting-engines/trace-event-perl.c (renamed from tools/perf/util/trace-event-perl.c)118
-rw-r--r--tools/perf/util/scripting-engines/trace-event-python.c594
-rw-r--r--tools/perf/util/session.c807
-rw-r--r--tools/perf/util/session.h130
-rw-r--r--tools/perf/util/sigchain.c2
-rw-r--r--tools/perf/util/sigchain.h1
-rw-r--r--tools/perf/util/sort.c153
-rw-r--r--tools/perf/util/sort.h35
-rw-r--r--tools/perf/util/strbuf.c229
-rw-r--r--tools/perf/util/strbuf.h45
-rw-r--r--tools/perf/util/string.c141
-rw-r--r--tools/perf/util/string.h17
-rw-r--r--tools/perf/util/symbol.c1030
-rw-r--r--tools/perf/util/symbol.h114
-rw-r--r--tools/perf/util/thread.c228
-rw-r--r--tools/perf/util/thread.h51
-rw-r--r--tools/perf/util/trace-event-info.c99
-rw-r--r--tools/perf/util/trace-event-parse.c142
-rw-r--r--tools/perf/util/trace-event-perl.h55
-rw-r--r--tools/perf/util/trace-event-read.c139
-rw-r--r--tools/perf/util/trace-event-scripting.c167
-rw-r--r--tools/perf/util/trace-event.h25
-rw-r--r--tools/perf/util/util.c116
-rw-r--r--tools/perf/util/util.h190
-rw-r--r--tools/perf/util/values.c1
-rw-r--r--tools/perf/util/wrapper.c110
-rw-r--r--tools/usb/ffs-test.c554
-rw-r--r--tools/usb/testusb.c547
182 files changed, 18642 insertions, 6140 deletions
diff --git a/tools/firewire/Makefile b/tools/firewire/Makefile
new file mode 100644
index 000000000000..81767adaae7d
--- /dev/null
+++ b/tools/firewire/Makefile
@@ -0,0 +1,19 @@
# Build rules for the nosy-dump tool.
prefix = /usr
nosy-dump-version = 0.4

CC = gcc

# None of these targets names a file produced by its rule.
.PHONY : all clean install

all : nosy-dump

nosy-dump : CFLAGS = -Wall -O2 -g
nosy-dump : CPPFLAGS = -DVERSION=\"$(nosy-dump-version)\" -I../../drivers/firewire
nosy-dump : LDFLAGS = -g
nosy-dump : LDLIBS = -lpopt

nosy-dump : nosy-dump.o decode-fcp.o

# Only regular files are removed, so no recursive delete is needed.
clean :
	rm -f *.o nosy-dump

# Depend on the binary so "make install" also works from a clean tree.
install : nosy-dump
	install nosy-dump $(prefix)/bin/nosy-dump
diff --git a/tools/firewire/decode-fcp.c b/tools/firewire/decode-fcp.c
new file mode 100644
index 000000000000..e41223b6a4c8
--- /dev/null
+++ b/tools/firewire/decode-fcp.c
@@ -0,0 +1,213 @@
1#include <linux/firewire-constants.h>
2#include <stdio.h>
3#include <stdlib.h>
4
5#include "list.h"
6#include "nosy-dump.h"
7
8#define CSR_FCP_COMMAND 0xfffff0000b00ull
9#define CSR_FCP_RESPONSE 0xfffff0000d00ull
10
/* Printable names for the 4-bit ctype field of an AV/C frame. */
static const char * const ctype_names[] = {
	[0x0] = "control",
	[0x1] = "status",
	[0x2] = "specific inquiry",
	[0x3] = "notify",
	[0x4] = "general inquiry",
	[0x5] = "(reserved 0x05)",
	[0x6] = "(reserved 0x06)",
	[0x7] = "(reserved 0x07)",
	[0x8] = "not implemented",
	[0x9] = "accepted",
	[0xa] = "rejected",
	[0xb] = "in transition",
	[0xc] = "stable",
	[0xd] = "changed",
	[0xe] = "(reserved 0x0e)",
	[0xf] = "interim",
};
21
/* Printable names for the 5-bit subunit_type field of an AV/C frame. */
static const char * const subunit_type_names[] = {
	[0x00] = "monitor",
	[0x01] = "audio",
	[0x02] = "printer",
	[0x03] = "disc",
	[0x04] = "tape recorder/player",
	[0x05] = "tuner",
	[0x06] = "ca",
	[0x07] = "camera",
	[0x08] = "(reserved 0x08)",
	[0x09] = "panel",
	[0x0a] = "bulletin board",
	[0x0b] = "camera storage",
	[0x0c] = "(reserved 0x0c)",
	[0x0d] = "(reserved 0x0d)",
	[0x0e] = "(reserved 0x0e)",
	[0x0f] = "(reserved 0x0f)",
	[0x10] = "(reserved 0x10)",
	[0x11] = "(reserved 0x11)",
	[0x12] = "(reserved 0x12)",
	[0x13] = "(reserved 0x13)",
	[0x14] = "(reserved 0x14)",
	[0x15] = "(reserved 0x15)",
	[0x16] = "(reserved 0x16)",
	[0x17] = "(reserved 0x17)",
	[0x18] = "(reserved 0x18)",
	[0x19] = "(reserved 0x19)",
	[0x1a] = "(reserved 0x1a)",
	[0x1b] = "(reserved 0x1b)",
	[0x1c] = "vendor unique",
	[0x1d] = "all subunit types",
	[0x1e] = "subunit_type extended to next byte",
	[0x1f] = "unit",
};
40
/* One symbolic value that an AV/C field may take. */
struct avc_enum {
	int value;
	const char *name;
};

/* Describes a single field of an AV/C command. */
struct avc_field {
	/* Short name for field. */
	const char *name;
	/*
	 * Location of field, specified in bits;
	 * negative means from end of packet.
	 */
	int offset;
	/* Width of field, 0 means use data_length. */
	int width;
	/* Optional table of symbolic values for this field. */
	struct avc_enum *names;
};

/* Name of an AV/C opcode together with up to eight of its fields. */
struct avc_opcode_info {
	const char *name;
	struct avc_field fields[8];
};
58
59struct avc_enum power_field_names[] = {
60 { 0x70, "on" },
61 { 0x60, "off" },
62 { }
63};
64
65static const struct avc_opcode_info opcode_info[256] = {
66
67 /* TA Document 1999026 */
68 /* AV/C Digital Interface Command Set General Specification 4.0 */
69 [0xb2] = { "power", {
70 { "state", 0, 8, power_field_names }
71 }
72 },
73 [0x30] = { "unit info", {
74 { "foo", 0, 8 },
75 { "unit_type", 8, 5 },
76 { "unit", 13, 3 },
77 { "company id", 16, 24 },
78 }
79 },
80 [0x31] = { "subunit info" },
81 [0x01] = { "reserve" },
82 [0xb0] = { "version" },
83 [0x00] = { "vendor dependent" },
84 [0x02] = { "plug info" },
85 [0x12] = { "channel usage" },
86 [0x24] = { "connect" },
87 [0x20] = { "connect av" },
88 [0x22] = { "connections" },
89 [0x11] = { "digital input" },
90 [0x10] = { "digital output" },
91 [0x25] = { "disconnect" },
92 [0x21] = { "disconnect av" },
93 [0x19] = { "input plug signal format" },
94 [0x18] = { "output plug signal format" },
95 [0x1f] = { "general bus setup" },
96
97 /* TA Document 1999025 */
98 /* AV/C Descriptor Mechanism Specification Version 1.0 */
99 [0x0c] = { "create descriptor" },
100 [0x08] = { "open descriptor" },
101 [0x09] = { "read descriptor" },
102 [0x0a] = { "write descriptor" },
103 [0x05] = { "open info block" },
104 [0x06] = { "read info block" },
105 [0x07] = { "write info block" },
106 [0x0b] = { "search descriptor" },
107 [0x0d] = { "object number select" },
108
109 /* TA Document 1999015 */
110 /* AV/C Command Set for Rate Control of Isochronous Data Flow 1.0 */
111 [0xb3] = { "rate", {
112 { "subfunction", 0, 8 },
113 { "result", 8, 8 },
114 { "plug_type", 16, 8 },
115 { "plug_id", 16, 8 },
116 }
117 },
118
119 /* TA Document 1999008 */
120 /* AV/C Audio Subunit Specification 1.0 */
121 [0xb8] = { "function block" },
122
123 /* TA Document 2001001 */
124 /* AV/C Panel Subunit Specification 1.1 */
125 [0x7d] = { "gui update" },
126 [0x7e] = { "push gui data" },
127 [0x7f] = { "user action" },
128 [0x7c] = { "pass through" },
129
130 /* */
131 [0x26] = { "asynchronous connection" },
132};
133
/*
 * Overlay for the first quadlet of an FCP frame's payload.
 * NOTE(review): bit-field placement depends on the compiler and host
 * byte order; this declaration order presumably targets little-endian
 * hosts -- confirm before relying on it elsewhere.
 */
struct avc_frame {
	uint32_t operand0     : 8;
	uint32_t opcode       : 8;
	uint32_t subunit_id   : 3;
	uint32_t subunit_type : 5;
	uint32_t ctype        : 4;
	uint32_t cts          : 4;
};
142
143static void
144decode_avc(struct link_transaction *t)
145{
146 struct avc_frame *frame =
147 (struct avc_frame *) t->request->packet.write_block.data;
148 const struct avc_opcode_info *info;
149 const char *name;
150 char buffer[32];
151 int i;
152
153 info = &opcode_info[frame->opcode];
154 if (info->name == NULL) {
155 snprintf(buffer, sizeof(buffer),
156 "(unknown opcode 0x%02x)", frame->opcode);
157 name = buffer;
158 } else {
159 name = info->name;
160 }
161
162 printf("av/c %s, subunit_type=%s, subunit_id=%d, opcode=%s",
163 ctype_names[frame->ctype], subunit_type_names[frame->subunit_type],
164 frame->subunit_id, name);
165
166 for (i = 0; info->fields[i].name != NULL; i++)
167 printf(", %s", info->fields[i].name);
168
169 printf("\n");
170}
171
172int
173decode_fcp(struct link_transaction *t)
174{
175 struct avc_frame *frame =
176 (struct avc_frame *) t->request->packet.write_block.data;
177 unsigned long long offset =
178 ((unsigned long long) t->request->packet.common.offset_high << 32) |
179 t->request->packet.common.offset_low;
180
181 if (t->request->packet.common.tcode != TCODE_WRITE_BLOCK_REQUEST)
182 return 0;
183
184 if (offset == CSR_FCP_COMMAND || offset == CSR_FCP_RESPONSE) {
185 switch (frame->cts) {
186 case 0x00:
187 decode_avc(t);
188 break;
189 case 0x01:
190 printf("cal fcp frame (cts=0x01)\n");
191 break;
192 case 0x02:
193 printf("ehs fcp frame (cts=0x02)\n");
194 break;
195 case 0x03:
196 printf("havi fcp frame (cts=0x03)\n");
197 break;
198 case 0x0e:
199 printf("vendor specific fcp frame (cts=0x0e)\n");
200 break;
201 case 0x0f:
202 printf("extended cts\n");
203 break;
204 default:
205 printf("reserved fcp frame (ctx=0x%02x)\n", frame->cts);
206 break;
207 }
208 return 1;
209 }
210
211 return 0;
212}
213
diff --git a/tools/firewire/list.h b/tools/firewire/list.h
new file mode 100644
index 000000000000..41f4bdadf634
--- /dev/null
+++ b/tools/firewire/list.h
@@ -0,0 +1,62 @@
/*
 * Minimal circular doubly-linked list.
 *
 * A struct list serves both as the list head and as the link embedded
 * in each element.  An empty list is a head whose next and prev point
 * back at itself.
 */
struct list {
	struct list *next, *prev;
};

/* Make @list an empty list. */
static inline void
list_init(struct list *list)
{
	list->next = list;
	list->prev = list;
}

/* Return non-zero when @list has no elements. */
static inline int
list_empty(const struct list *list)
{
	return list->next == list;
}

/* Insert @new_link immediately before @link. */
static inline void
list_insert(struct list *link, struct list *new_link)
{
	new_link->prev = link->prev;
	new_link->next = link;
	new_link->prev->next = new_link;
	new_link->next->prev = new_link;
}

/* Add @new_link as the last element of @list. */
static inline void
list_append(struct list *list, struct list *new_link)
{
	/* Inserting before the head places the link at the tail. */
	list_insert(list, new_link);
}

/* Add @new_link as the first element of @list. */
static inline void
list_prepend(struct list *list, struct list *new_link)
{
	list_insert(list->next, new_link);
}

/* Unlink @link from its list; @link's own pointers are left untouched. */
static inline void
list_remove(struct list *link)
{
	link->prev->next = link->next;
	link->next->prev = link->prev;
}

/* Map a pointer to the embedded @member link back to its container. */
#define list_entry(link, type, member) \
	((type *)((char *)(link)-(unsigned long)(&((type *)0)->member)))

/* First element of @list; only meaningful when the list is not empty. */
#define list_head(list, type, member) \
	list_entry((list)->next, type, member)

/* Last element of @list; only meaningful when the list is not empty. */
#define list_tail(list, type, member) \
	list_entry((list)->prev, type, member)

/*
 * Element following @elm.  __typeof__ is used instead of typeof so the
 * macro also compiles in strict ISO modes such as -std=c11.
 */
#define list_next(elm, member) \
	list_entry((elm)->member.next, __typeof__(*(elm)), member)

/* Visit every element of @list in order; do not remove @pos in the body. */
#define list_for_each_entry(pos, list, member) \
	for (pos = list_head(list, __typeof__(*(pos)), member); \
	     &(pos)->member != (list); \
	     pos = list_next(pos, member))
62
diff --git a/tools/firewire/nosy-dump.c b/tools/firewire/nosy-dump.c
new file mode 100644
index 000000000000..f93b776370b6
--- /dev/null
+++ b/tools/firewire/nosy-dump.c
@@ -0,0 +1,1031 @@
1/*
2 * nosy-dump - Interface to snoop mode driver for TI PCILynx 1394 controllers
3 * Copyright (C) 2002-2006 Kristian Høgsberg
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
16 * along with this program; if not, write to the Free Software Foundation,
17 * Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 */
19
20#include <byteswap.h>
21#include <endian.h>
22#include <fcntl.h>
23#include <linux/firewire-constants.h>
24#include <poll.h>
25#include <popt.h>
26#include <signal.h>
27#include <stdio.h>
28#include <stdlib.h>
29#include <string.h>
30#include <sys/ioctl.h>
31#include <sys/time.h>
32#include <termios.h>
33#include <unistd.h>
34
35#include "list.h"
36#include "nosy-dump.h"
37#include "nosy-user.h"
38
/* Flag bits used in the flags member of struct packet_field. */
enum {
	PACKET_FIELD_DETAIL		= 1 << 0,
	PACKET_FIELD_DATA_LENGTH	= 1 << 1,
	/* Marks the fields we print in transaction view. */
	PACKET_FIELD_TRANSACTION	= 1 << 2,
};
45
46static void print_packet(uint32_t *data, size_t length);
47static void decode_link_packet(struct link_packet *packet, size_t length,
48 int include_flags, int exclude_flags);
49static int run = 1;
50sig_t sys_sigint_handler;
51
52static char *option_nosy_device = "/dev/nosy";
53static char *option_view = "packet";
54static char *option_output;
55static char *option_input;
56static int option_hex;
57static int option_iso;
58static int option_cycle_start;
59static int option_version;
60static int option_verbose;
61
/* Identifiers for the three views named by the --view option. */
enum {
	VIEW_TRANSACTION = 0,
	VIEW_PACKET      = 1,
	VIEW_STATS       = 2,
};
67
68static const struct poptOption options[] = {
69 {
70 .longName = "device",
71 .shortName = 'd',
72 .argInfo = POPT_ARG_STRING,
73 .arg = &option_nosy_device,
74 .descrip = "Path to nosy device.",
75 .argDescrip = "DEVICE"
76 },
77 {
78 .longName = "view",
79 .argInfo = POPT_ARG_STRING,
80 .arg = &option_view,
81 .descrip = "Specify view of bus traffic: packet, transaction or stats.",
82 .argDescrip = "VIEW"
83 },
84 {
85 .longName = "hex",
86 .shortName = 'x',
87 .argInfo = POPT_ARG_NONE,
88 .arg = &option_hex,
89 .descrip = "Print each packet in hex.",
90 },
91 {
92 .longName = "iso",
93 .argInfo = POPT_ARG_NONE,
94 .arg = &option_iso,
95 .descrip = "Print iso packets.",
96 },
97 {
98 .longName = "cycle-start",
99 .argInfo = POPT_ARG_NONE,
100 .arg = &option_cycle_start,
101 .descrip = "Print cycle start packets.",
102 },
103 {
104 .longName = "verbose",
105 .shortName = 'v',
106 .argInfo = POPT_ARG_NONE,
107 .arg = &option_verbose,
108 .descrip = "Verbose packet view.",
109 },
110 {
111 .longName = "output",
112 .shortName = 'o',
113 .argInfo = POPT_ARG_STRING,
114 .arg = &option_output,
115 .descrip = "Log to output file.",
116 .argDescrip = "FILENAME"
117 },
118 {
119 .longName = "input",
120 .shortName = 'i',
121 .argInfo = POPT_ARG_STRING,
122 .arg = &option_input,
123 .descrip = "Decode log from file.",
124 .argDescrip = "FILENAME"
125 },
126 {
127 .longName = "version",
128 .argInfo = POPT_ARG_NONE,
129 .arg = &option_version,
130 .descrip = "Specify print version info.",
131 },
132 POPT_AUTOHELP
133 POPT_TABLEEND
134};
135
136/* Allow all ^C except the first to interrupt the program in the usual way. */
137static void
138sigint_handler(int signal_num)
139{
140 if (run == 1) {
141 run = 0;
142 signal(SIGINT, SIG_DFL);
143 }
144}
145
146static struct subaction *
147subaction_create(uint32_t *data, size_t length)
148{
149 struct subaction *sa;
150
151 /* we put the ack in the subaction struct for easy access. */
152 sa = malloc(sizeof *sa - sizeof sa->packet + length);
153 sa->ack = data[length / 4 - 1];
154 sa->length = length;
155 memcpy(&sa->packet, data, length);
156
157 return sa;
158}
159
/* Release a subaction obtained from subaction_create(). */
static void
subaction_destroy(struct subaction *sa)
{
	/* The packet copy lives in the same allocation as the struct. */
	free(sa);
}
165
166static struct list pending_transaction_list = {
167 &pending_transaction_list, &pending_transaction_list
168};
169
170static struct link_transaction *
171link_transaction_lookup(int request_node, int response_node, int tlabel)
172{
173 struct link_transaction *t;
174
175 list_for_each_entry(t, &pending_transaction_list, link) {
176 if (t->request_node == request_node &&
177 t->response_node == response_node &&
178 t->tlabel == tlabel)
179 return t;
180 }
181
182 t = malloc(sizeof *t);
183 t->request_node = request_node;
184 t->response_node = response_node;
185 t->tlabel = tlabel;
186 list_init(&t->request_list);
187 list_init(&t->response_list);
188
189 list_append(&pending_transaction_list, &t->link);
190
191 return t;
192}
193
194static void
195link_transaction_destroy(struct link_transaction *t)
196{
197 struct subaction *sa;
198
199 while (!list_empty(&t->request_list)) {
200 sa = list_head(&t->request_list, struct subaction, link);
201 list_remove(&sa->link);
202 subaction_destroy(sa);
203 }
204 while (!list_empty(&t->response_list)) {
205 sa = list_head(&t->response_list, struct subaction, link);
206 list_remove(&sa->link);
207 subaction_destroy(sa);
208 }
209 free(t);
210}
211
/* A higher-level protocol decoder that can be tried on a transaction. */
struct protocol_decoder {
	const char *name;
	/* Returns non-zero when it recognised the transaction. */
	int (*decode)(struct link_transaction *t);
};
216
217static const struct protocol_decoder protocol_decoders[] = {
218 { "FCP", decode_fcp }
219};
220
221static void
222handle_transaction(struct link_transaction *t)
223{
224 struct subaction *sa;
225 int i;
226
227 if (!t->request) {
228 printf("BUG in handle_transaction\n");
229 return;
230 }
231
232 for (i = 0; i < array_length(protocol_decoders); i++)
233 if (protocol_decoders[i].decode(t))
234 break;
235
236 /* HACK: decode only fcp right now. */
237 return;
238
239 decode_link_packet(&t->request->packet, t->request->length,
240 PACKET_FIELD_TRANSACTION, 0);
241 if (t->response)
242 decode_link_packet(&t->response->packet, t->request->length,
243 PACKET_FIELD_TRANSACTION, 0);
244 else
245 printf("[no response]");
246
247 if (option_verbose) {
248 list_for_each_entry(sa, &t->request_list, link)
249 print_packet((uint32_t *) &sa->packet, sa->length);
250 list_for_each_entry(sa, &t->response_list, link)
251 print_packet((uint32_t *) &sa->packet, sa->length);
252 }
253 printf("\r\n");
254
255 link_transaction_destroy(t);
256}
257
258static void
259clear_pending_transaction_list(void)
260{
261 struct link_transaction *t;
262
263 while (!list_empty(&pending_transaction_list)) {
264 t = list_head(&pending_transaction_list,
265 struct link_transaction, link);
266 list_remove(&t->link);
267 link_transaction_destroy(t);
268 /* print unfinished transactions */
269 }
270}
271
/*
 * Printable names for the tcode field.  The field is four bits wide,
 * so the table has sixteen entries; values above 0xb get placeholder
 * names so that any 4-bit value stays inside the array.
 */
static const char * const tcode_names[] = {
	[0x0] = "write_quadlet_request",
	[0x1] = "write_block_request",
	[0x2] = "write_response",
	[0x3] = "reserved",
	[0x4] = "read_quadlet_request",
	[0x5] = "read_block_request",
	[0x6] = "read_quadlet_response",
	[0x7] = "read_block_response",
	[0x8] = "cycle_start",
	[0x9] = "lock_request",
	[0xa] = "iso_data",
	[0xb] = "lock_response",
	[0xc] = "reserved (0x0c)",
	[0xd] = "reserved (0x0d)",
	[0xe] = "reserved (0x0e)",
	[0xf] = "reserved (0x0f)",
};
280
/* Printable names for the 4-bit ack code. */
static const char * const ack_names[] = {
	[0x0] = "no ack",
	[0x1] = "ack_complete",
	[0x2] = "ack_pending",
	[0x3] = "reserved (0x03)",
	[0x4] = "ack_busy_x",
	[0x5] = "ack_busy_a",
	[0x6] = "ack_busy_b",
	[0x7] = "reserved (0x07)",
	[0x8] = "reserved (0x08)",
	[0x9] = "reserved (0x09)",
	[0xa] = "reserved (0x0a)",
	[0xb] = "reserved (0x0b)",
	[0xc] = "reserved (0x0c)",
	[0xd] = "ack_data_error",
	[0xe] = "ack_type_error",
	[0xf] = "reserved (0x0f)",
};
291
/*
 * Printable names for the rcode field.  The field is four bits wide,
 * so the table has sixteen entries; values above 0x7 get placeholder
 * names so that any 4-bit value stays inside the array.
 */
static const char * const rcode_names[] = {
	[0x0] = "complete",
	[0x1] = "reserved (0x01)",
	[0x2] = "reserved (0x02)",
	[0x3] = "reserved (0x03)",
	[0x4] = "conflict_error",
	[0x5] = "data_error",
	[0x6] = "type_error",
	[0x7] = "address_error",
	[0x8] = "reserved (0x08)",
	[0x9] = "reserved (0x09)",
	[0xa] = "reserved (0x0a)",
	[0xb] = "reserved (0x0b)",
	[0xc] = "reserved (0x0c)",
	[0xd] = "reserved (0x0d)",
	[0xe] = "reserved (0x0e)",
	[0xf] = "reserved (0x0f)",
};
298
/* Printable names for the 2-bit rt (retry) field. */
static const char * const retry_names[] = {
	"retry_1",	/* 0x0 */
	"retry_x",	/* 0x1 */
	"retry_a",	/* 0x2 */
	"retry_b",	/* 0x3 */
};
305
/* Values for the type member of struct packet_info. */
enum {
	PACKET_RESERVED = 0,
	PACKET_REQUEST  = 1,
	PACKET_RESPONSE = 2,
	PACKET_OTHER    = 3,
};
312
/* Per-tcode description of a link packet. */
struct packet_info {
	const char *name;
	/* One of the PACKET_* values. */
	int type;
	/* For requests, the tcode of the matching response. */
	int response_tcode;
	/* Field layout table and its number of entries. */
	const struct packet_field *fields;
	int field_count;
};

/* Describes one field of a link packet. */
struct packet_field {
	/* Short name for field. */
	const char *name;
	/*
	 * Location of field, specified in bits;
	 * negative means from end of packet.
	 */
	int offset;
	/* Width of field, 0 means use data_length. */
	int width;
	/* Show options. */
	int flags;
	/* Optional table of printable names for the field's values. */
	const char * const *value_names;
};
329
/* Leading packet_field entries shared by every request field table. */
#define COMMON_REQUEST_FIELDS						\
	{ "dest",   0, 16, PACKET_FIELD_TRANSACTION },			\
	{ "tl",    16,  6, 0 },						\
	{ "rt",    22,  2, PACKET_FIELD_DETAIL, retry_names },		\
	{ "tcode", 24,  4, PACKET_FIELD_TRANSACTION, tcode_names },	\
	{ "pri",   28,  4, PACKET_FIELD_DETAIL },			\
	{ "src",   32, 16, PACKET_FIELD_TRANSACTION },			\
	{ "offs",  48, 48, PACKET_FIELD_TRANSACTION }

/* Leading packet_field entries shared by every response field table. */
#define COMMON_RESPONSE_FIELDS						\
	{ "dest",   0, 16, 0 },						\
	{ "tl",    16,  6, 0 },						\
	{ "rt",    22,  2, PACKET_FIELD_DETAIL, retry_names },		\
	{ "tcode", 24,  4, 0, tcode_names },				\
	{ "pri",   28,  4, PACKET_FIELD_DETAIL },			\
	{ "src",   32, 16, 0 },						\
	{ "rcode", 48,  4, PACKET_FIELD_TRANSACTION, rcode_names }
347
348static const struct packet_field read_quadlet_request_fields[] = {
349 COMMON_REQUEST_FIELDS,
350 { "crc", 96, 32, PACKET_FIELD_DETAIL },
351 { "ack", 156, 4, 0, ack_names },
352};
353
354static const struct packet_field read_quadlet_response_fields[] = {
355 COMMON_RESPONSE_FIELDS,
356 { "data", 96, 32, PACKET_FIELD_TRANSACTION },
357 { "crc", 128, 32, PACKET_FIELD_DETAIL },
358 { "ack", 188, 4, 0, ack_names },
359};
360
361static const struct packet_field read_block_request_fields[] = {
362 COMMON_REQUEST_FIELDS,
363 { "data_length", 96, 16, PACKET_FIELD_TRANSACTION },
364 { "extended_tcode", 112, 16 },
365 { "crc", 128, 32, PACKET_FIELD_DETAIL },
366 { "ack", 188, 4, 0, ack_names },
367};
368
369static const struct packet_field block_response_fields[] = {
370 COMMON_RESPONSE_FIELDS,
371 { "data_length", 96, 16, PACKET_FIELD_DATA_LENGTH },
372 { "extended_tcode", 112, 16 },
373 { "crc", 128, 32, PACKET_FIELD_DETAIL },
374 { "data", 160, 0, PACKET_FIELD_TRANSACTION },
375 { "crc", -64, 32, PACKET_FIELD_DETAIL },
376 { "ack", -4, 4, 0, ack_names },
377};
378
379static const struct packet_field write_quadlet_request_fields[] = {
380 COMMON_REQUEST_FIELDS,
381 { "data", 96, 32, PACKET_FIELD_TRANSACTION },
382 { "ack", -4, 4, 0, ack_names },
383};
384
385static const struct packet_field block_request_fields[] = {
386 COMMON_REQUEST_FIELDS,
387 { "data_length", 96, 16, PACKET_FIELD_DATA_LENGTH | PACKET_FIELD_TRANSACTION },
388 { "extended_tcode", 112, 16, PACKET_FIELD_TRANSACTION },
389 { "crc", 128, 32, PACKET_FIELD_DETAIL },
390 { "data", 160, 0, PACKET_FIELD_TRANSACTION },
391 { "crc", -64, 32, PACKET_FIELD_DETAIL },
392 { "ack", -4, 4, 0, ack_names },
393};
394
395static const struct packet_field write_response_fields[] = {
396 COMMON_RESPONSE_FIELDS,
397 { "reserved", 64, 32, PACKET_FIELD_DETAIL },
398 { "ack", -4, 4, 0, ack_names },
399};
400
401static const struct packet_field iso_data_fields[] = {
402 { "data_length", 0, 16, PACKET_FIELD_DATA_LENGTH },
403 { "tag", 16, 2 },
404 { "channel", 18, 6 },
405 { "tcode", 24, 4, 0, tcode_names },
406 { "sy", 28, 4 },
407 { "crc", 32, 32, PACKET_FIELD_DETAIL },
408 { "data", 64, 0 },
409 { "crc", -64, 32, PACKET_FIELD_DETAIL },
410 { "ack", -4, 4, 0, ack_names },
411};
412
413static const struct packet_info packet_info[] = {
414 {
415 .name = "write_quadlet_request",
416 .type = PACKET_REQUEST,
417 .response_tcode = TCODE_WRITE_RESPONSE,
418 .fields = write_quadlet_request_fields,
419 .field_count = array_length(write_quadlet_request_fields)
420 },
421 {
422 .name = "write_block_request",
423 .type = PACKET_REQUEST,
424 .response_tcode = TCODE_WRITE_RESPONSE,
425 .fields = block_request_fields,
426 .field_count = array_length(block_request_fields)
427 },
428 {
429 .name = "write_response",
430 .type = PACKET_RESPONSE,
431 .fields = write_response_fields,
432 .field_count = array_length(write_response_fields)
433 },
434 {
435 .name = "reserved",
436 .type = PACKET_RESERVED,
437 },
438 {
439 .name = "read_quadlet_request",
440 .type = PACKET_REQUEST,
441 .response_tcode = TCODE_READ_QUADLET_RESPONSE,
442 .fields = read_quadlet_request_fields,
443 .field_count = array_length(read_quadlet_request_fields)
444 },
445 {
446 .name = "read_block_request",
447 .type = PACKET_REQUEST,
448 .response_tcode = TCODE_READ_BLOCK_RESPONSE,
449 .fields = read_block_request_fields,
450 .field_count = array_length(read_block_request_fields)
451 },
452 {
453 .name = "read_quadlet_response",
454 .type = PACKET_RESPONSE,
455 .fields = read_quadlet_response_fields,
456 .field_count = array_length(read_quadlet_response_fields)
457 },
458 {
459 .name = "read_block_response",
460 .type = PACKET_RESPONSE,
461 .fields = block_response_fields,
462 .field_count = array_length(block_response_fields)
463 },
464 {
465 .name = "cycle_start",
466 .type = PACKET_OTHER,
467 .fields = write_quadlet_request_fields,
468 .field_count = array_length(write_quadlet_request_fields)
469 },
470 {
471 .name = "lock_request",
472 .type = PACKET_REQUEST,
473 .fields = block_request_fields,
474 .field_count = array_length(block_request_fields)
475 },
476 {
477 .name = "iso_data",
478 .type = PACKET_OTHER,
479 .fields = iso_data_fields,
480 .field_count = array_length(iso_data_fields)
481 },
482 {
483 .name = "lock_response",
484 .type = PACKET_RESPONSE,
485 .fields = block_response_fields,
486 .field_count = array_length(block_response_fields)
487 },
488};
489
490static int
491handle_request_packet(uint32_t *data, size_t length)
492{
493 struct link_packet *p = (struct link_packet *) data;
494 struct subaction *sa, *prev;
495 struct link_transaction *t;
496
497 t = link_transaction_lookup(p->common.source, p->common.destination,
498 p->common.tlabel);
499 sa = subaction_create(data, length);
500 t->request = sa;
501
502 if (!list_empty(&t->request_list)) {
503 prev = list_tail(&t->request_list,
504 struct subaction, link);
505
506 if (!ACK_BUSY(prev->ack)) {
507 /*
508 * error, we should only see ack_busy_* before the
509 * ack_pending/ack_complete -- this is an ack_pending
510 * instead (ack_complete would have finished the
511 * transaction).
512 */
513 }
514
515 if (prev->packet.common.tcode != sa->packet.common.tcode ||
516 prev->packet.common.tlabel != sa->packet.common.tlabel) {
517 /* memcmp() ? */
518 /* error, these should match for retries. */
519 }
520 }
521
522 list_append(&t->request_list, &sa->link);
523
524 switch (sa->ack) {
525 case ACK_COMPLETE:
526 if (p->common.tcode != TCODE_WRITE_QUADLET_REQUEST &&
527 p->common.tcode != TCODE_WRITE_BLOCK_REQUEST)
528 /* error, unified transactions only allowed for write */;
529 list_remove(&t->link);
530 handle_transaction(t);
531 break;
532
533 case ACK_NO_ACK:
534 case ACK_DATA_ERROR:
535 case ACK_TYPE_ERROR:
536 list_remove(&t->link);
537 handle_transaction(t);
538 break;
539
540 case ACK_PENDING:
541 /* request subaction phase over, wait for response. */
542 break;
543
544 case ACK_BUSY_X:
545 case ACK_BUSY_A:
546 case ACK_BUSY_B:
547 /* ok, wait for retry. */
548 /* check that retry protocol is respected. */
549 break;
550 }
551
552 return 1;
553}
554
555static int
556handle_response_packet(uint32_t *data, size_t length)
557{
558 struct link_packet *p = (struct link_packet *) data;
559 struct subaction *sa, *prev;
560 struct link_transaction *t;
561
562 t = link_transaction_lookup(p->common.destination, p->common.source,
563 p->common.tlabel);
564 if (list_empty(&t->request_list)) {
565 /* unsolicited response */
566 }
567
568 sa = subaction_create(data, length);
569 t->response = sa;
570
571 if (!list_empty(&t->response_list)) {
572 prev = list_tail(&t->response_list, struct subaction, link);
573
574 if (!ACK_BUSY(prev->ack)) {
575 /*
576 * error, we should only see ack_busy_* before the
577 * ack_pending/ack_complete
578 */
579 }
580
581 if (prev->packet.common.tcode != sa->packet.common.tcode ||
582 prev->packet.common.tlabel != sa->packet.common.tlabel) {
583 /* use memcmp() instead? */
584 /* error, these should match for retries. */
585 }
586 } else {
587 prev = list_tail(&t->request_list, struct subaction, link);
588 if (prev->ack != ACK_PENDING) {
589 /*
590 * error, should not get response unless last request got
591 * ack_pending.
592 */
593 }
594
595 if (packet_info[prev->packet.common.tcode].response_tcode !=
596 sa->packet.common.tcode) {
597 /* error, tcode mismatch */
598 }
599 }
600
601 list_append(&t->response_list, &sa->link);
602
603 switch (sa->ack) {
604 case ACK_COMPLETE:
605 case ACK_NO_ACK:
606 case ACK_DATA_ERROR:
607 case ACK_TYPE_ERROR:
608 list_remove(&t->link);
609 handle_transaction(t);
610 /* transaction complete, remove t from pending list. */
611 break;
612
613 case ACK_PENDING:
614 /* error for responses. */
615 break;
616
617 case ACK_BUSY_X:
618 case ACK_BUSY_A:
619 case ACK_BUSY_B:
620 /* no problem, wait for next retry */
621 break;
622 }
623
624 return 1;
625}
626
627static int
628handle_packet(uint32_t *data, size_t length)
629{
630 if (length == 0) {
631 printf("bus reset\r\n");
632 clear_pending_transaction_list();
633 } else if (length > sizeof(struct phy_packet)) {
634 struct link_packet *p = (struct link_packet *) data;
635
636 switch (packet_info[p->common.tcode].type) {
637 case PACKET_REQUEST:
638 return handle_request_packet(data, length);
639
640 case PACKET_RESPONSE:
641 return handle_response_packet(data, length);
642
643 case PACKET_OTHER:
644 case PACKET_RESERVED:
645 return 0;
646 }
647 }
648
649 return 1;
650}
651
/*
 * Extract a bit field from a packet.
 *
 * offset is the bit position of the field counted from the most
 * significant bit of the quadlet that follows the leading timestamp
 * quadlet (hence the "+ 1" on the quadlet index).  width is the field
 * size in bits; the field must not cross a quadlet boundary, callers
 * split wider fields themselves.
 *
 * Returns the field value right-aligned, or 0 for a non-positive width.
 */
static unsigned int
get_bits(struct link_packet *packet, int offset, int width)
{
	uint32_t *data = (uint32_t *) packet;
	uint32_t index, shift, mask;

	/* A zero width could otherwise produce a shift count of 32. */
	if (width <= 0)
		return 0;

	index = offset / 32 + 1;
	shift = 32 - (offset & 31) - width;
	/* Build the mask unsigned: 1 << 31 on a signed int is undefined. */
	mask = width == 32 ? ~(uint32_t) 0 : ((uint32_t) 1 << width) - 1;

	return (data[index] >> shift) & mask;
}
664
/*
 * byte_index() maps the position of a byte in the printed sequence to
 * its position in the buffer.  On little endian hosts the low two bits
 * of the index are flipped, which reverses the byte order inside every
 * group of four bytes; on big endian hosts the index is used unchanged.
 */
#if __BYTE_ORDER == __LITTLE_ENDIAN
#define byte_index(i) ((i) ^ 3)
#elif __BYTE_ORDER == __BIG_ENDIAN
#define byte_index(i) (i)
#else
#error unsupported byte order.
#endif

/*
 * Print up to 128 bytes of data as hex, with a space between groups of
 * four bytes.  If length exceeds 128 the number of omitted bytes is
 * appended.  Nothing is printed for a non-positive length.
 */
static void
dump_data(unsigned char *data, int length)
{
	int shown = length > 128 ? 128 : length;
	int pos = 0;

	while (pos < shown) {
		const char *separator = (pos % 4 == 0 && pos != 0) ? " " : "";

		printf("%s%02hhx", separator, data[byte_index(pos)]);
		pos++;
	}

	if (shown < length)
		printf(" (%d more bytes)", length - shown);
}
691
692static void
693decode_link_packet(struct link_packet *packet, size_t length,
694 int include_flags, int exclude_flags)
695{
696 const struct packet_info *pi;
697 int data_length = 0;
698 int i;
699
700 pi = &packet_info[packet->common.tcode];
701
702 for (i = 0; i < pi->field_count; i++) {
703 const struct packet_field *f = &pi->fields[i];
704 int offset;
705
706 if (f->flags & exclude_flags)
707 continue;
708 if (include_flags && !(f->flags & include_flags))
709 continue;
710
711 if (f->offset < 0)
712 offset = length * 8 + f->offset - 32;
713 else
714 offset = f->offset;
715
716 if (f->value_names != NULL) {
717 uint32_t bits;
718
719 bits = get_bits(packet, offset, f->width);
720 printf("%s", f->value_names[bits]);
721 } else if (f->width == 0) {
722 printf("%s=[", f->name);
723 dump_data((unsigned char *) packet + (offset / 8 + 4), data_length);
724 printf("]");
725 } else {
726 unsigned long long bits;
727 int high_width, low_width;
728
729 if ((offset & ~31) != ((offset + f->width - 1) & ~31)) {
730 /* Bit field spans quadlet boundary. */
731 high_width = ((offset + 31) & ~31) - offset;
732 low_width = f->width - high_width;
733
734 bits = get_bits(packet, offset, high_width);
735 bits = (bits << low_width) |
736 get_bits(packet, offset + high_width, low_width);
737 } else {
738 bits = get_bits(packet, offset, f->width);
739 }
740
741 printf("%s=0x%0*llx", f->name, (f->width + 3) / 4, bits);
742
743 if (f->flags & PACKET_FIELD_DATA_LENGTH)
744 data_length = bits;
745 }
746
747 if (i < pi->field_count - 1)
748 printf(", ");
749 }
750}
751
752static void
753print_packet(uint32_t *data, size_t length)
754{
755 int i;
756
757 printf("%6u ", data[0]);
758
759 if (length == 4) {
760 printf("bus reset");
761 } else if (length < sizeof(struct phy_packet)) {
762 printf("short packet: ");
763 for (i = 1; i < length / 4; i++)
764 printf("%s%08x", i == 0 ? "[" : " ", data[i]);
765 printf("]");
766
767 } else if (length == sizeof(struct phy_packet) && data[1] == ~data[2]) {
768 struct phy_packet *pp = (struct phy_packet *) data;
769
770 /* phy packet are 3 quadlets: the 1 quadlet payload,
771 * the bitwise inverse of the payload and the snoop
772 * mode ack */
773
774 switch (pp->common.identifier) {
775 case PHY_PACKET_CONFIGURATION:
776 if (!pp->phy_config.set_root && !pp->phy_config.set_gap_count) {
777 printf("ext phy config: phy_id=%02x", pp->phy_config.root_id);
778 } else {
779 printf("phy config:");
780 if (pp->phy_config.set_root)
781 printf(" set_root_id=%02x", pp->phy_config.root_id);
782 if (pp->phy_config.set_gap_count)
783 printf(" set_gap_count=%d", pp->phy_config.gap_count);
784 }
785 break;
786
787 case PHY_PACKET_LINK_ON:
788 printf("link-on packet, phy_id=%02x", pp->link_on.phy_id);
789 break;
790
791 case PHY_PACKET_SELF_ID:
792 if (pp->self_id.extended) {
793 printf("extended self id: phy_id=%02x, seq=%d",
794 pp->ext_self_id.phy_id, pp->ext_self_id.sequence);
795 } else {
796 static const char * const speed_names[] = {
797 "S100", "S200", "S400", "BETA"
798 };
799 printf("self id: phy_id=%02x, link %s, gap_count=%d, speed=%s%s%s",
800 pp->self_id.phy_id,
801 (pp->self_id.link_active ? "active" : "not active"),
802 pp->self_id.gap_count,
803 speed_names[pp->self_id.phy_speed],
804 (pp->self_id.contender ? ", irm contender" : ""),
805 (pp->self_id.initiated_reset ? ", initiator" : ""));
806 }
807 break;
808 default:
809 printf("unknown phy packet: ");
810 for (i = 1; i < length / 4; i++)
811 printf("%s%08x", i == 0 ? "[" : " ", data[i]);
812 printf("]");
813 break;
814 }
815 } else {
816 struct link_packet *packet = (struct link_packet *) data;
817
818 decode_link_packet(packet, length, 0,
819 option_verbose ? 0 : PACKET_FIELD_DETAIL);
820 }
821
822 if (option_hex) {
823 printf(" [");
824 dump_data((unsigned char *) data + 4, length - 4);
825 printf("]");
826 }
827
828 printf("\r\n");
829}
830
831#define HIDE_CURSOR "\033[?25l"
832#define SHOW_CURSOR "\033[?25h"
833#define CLEAR "\033[H\033[2J"
834
835static void
836print_stats(uint32_t *data, size_t length)
837{
838 static int bus_reset_count, short_packet_count, phy_packet_count;
839 static int tcode_count[16];
840 static struct timeval last_update;
841 struct timeval now;
842 int i;
843
844 if (length == 0)
845 bus_reset_count++;
846 else if (length < sizeof(struct phy_packet))
847 short_packet_count++;
848 else if (length == sizeof(struct phy_packet) && data[1] == ~data[2])
849 phy_packet_count++;
850 else {
851 struct link_packet *packet = (struct link_packet *) data;
852 tcode_count[packet->common.tcode]++;
853 }
854
855 gettimeofday(&now, NULL);
856 if (now.tv_sec <= last_update.tv_sec &&
857 now.tv_usec < last_update.tv_usec + 500000)
858 return;
859
860 last_update = now;
861 printf(CLEAR HIDE_CURSOR
862 " bus resets : %8d\n"
863 " short packets : %8d\n"
864 " phy packets : %8d\n",
865 bus_reset_count, short_packet_count, phy_packet_count);
866
867 for (i = 0; i < array_length(packet_info); i++)
868 if (packet_info[i].type != PACKET_RESERVED)
869 printf(" %-24s: %8d\n", packet_info[i].name, tcode_count[i]);
870 printf(SHOW_CURSOR "\n");
871}
872
/* Terminal settings of stdin as found at startup, restored at exit. */
static struct termios saved_attributes;

/* atexit() handler: put stdin back into the mode saved at startup. */
static void
reset_input_mode(void)
{
	tcsetattr(STDIN_FILENO, TCSANOW, &saved_attributes);
}

/*
 * Switch stdin to non-canonical mode without echo so that single key
 * presses can be read immediately.  The previous settings are saved and
 * restored automatically when the process exits.
 *
 * Exits with EXIT_FAILURE if stdin is not a terminal or its settings
 * cannot be read.
 */
static void
set_input_mode(void)
{
	struct termios tattr;

	/* Make sure stdin is a terminal. */
	if (!isatty(STDIN_FILENO)) {
		fprintf(stderr, "Not a terminal.\n");
		exit(EXIT_FAILURE);
	}

	/*
	 * Save the terminal attributes so we can restore them later.  Only
	 * register the restore handler once there is something valid to
	 * restore.
	 */
	if (tcgetattr(STDIN_FILENO, &saved_attributes) < 0) {
		fprintf(stderr, "Could not read terminal attributes, %m\n");
		exit(EXIT_FAILURE);
	}
	atexit(reset_input_mode);

	/* Set the funny terminal modes, starting from the saved ones. */
	tattr = saved_attributes;
	tattr.c_lflag &= ~(ICANON|ECHO); /* Clear ICANON and ECHO. */
	tattr.c_cc[VMIN] = 1;	/* read() returns after one byte ... */
	tattr.c_cc[VTIME] = 0;	/* ... without an inter-byte timeout */
	tcsetattr(STDIN_FILENO, TCSAFLUSH, &tattr);
}
903
904int main(int argc, const char *argv[])
905{
906 uint32_t buf[128 * 1024];
907 uint32_t filter;
908 int length, retval, view;
909 int fd = -1;
910 FILE *output = NULL, *input = NULL;
911 poptContext con;
912 char c;
913 struct pollfd pollfds[2];
914
915 sys_sigint_handler = signal(SIGINT, sigint_handler);
916
917 con = poptGetContext(NULL, argc, argv, options, 0);
918 retval = poptGetNextOpt(con);
919 if (retval < -1) {
920 poptPrintUsage(con, stdout, 0);
921 return -1;
922 }
923
924 if (option_version) {
925 printf("dump tool for nosy sniffer, version %s\n", VERSION);
926 return 0;
927 }
928
929 if (__BYTE_ORDER != __LITTLE_ENDIAN)
930 fprintf(stderr, "warning: nosy has only been tested on little "
931 "endian machines\n");
932
933 if (option_input != NULL) {
934 input = fopen(option_input, "r");
935 if (input == NULL) {
936 fprintf(stderr, "Could not open %s, %m\n", option_input);
937 return -1;
938 }
939 } else {
940 fd = open(option_nosy_device, O_RDWR);
941 if (fd < 0) {
942 fprintf(stderr, "Could not open %s, %m\n", option_nosy_device);
943 return -1;
944 }
945 set_input_mode();
946 }
947
948 if (strcmp(option_view, "transaction") == 0)
949 view = VIEW_TRANSACTION;
950 else if (strcmp(option_view, "stats") == 0)
951 view = VIEW_STATS;
952 else
953 view = VIEW_PACKET;
954
955 if (option_output) {
956 output = fopen(option_output, "w");
957 if (output == NULL) {
958 fprintf(stderr, "Could not open %s, %m\n", option_output);
959 return -1;
960 }
961 }
962
963 setvbuf(stdout, NULL, _IOLBF, BUFSIZ);
964
965 filter = ~0;
966 if (!option_iso)
967 filter &= ~(1 << TCODE_STREAM_DATA);
968 if (!option_cycle_start)
969 filter &= ~(1 << TCODE_CYCLE_START);
970 if (view == VIEW_STATS)
971 filter = ~(1 << TCODE_CYCLE_START);
972
973 ioctl(fd, NOSY_IOC_FILTER, filter);
974
975 ioctl(fd, NOSY_IOC_START);
976
977 pollfds[0].fd = fd;
978 pollfds[0].events = POLLIN;
979 pollfds[1].fd = STDIN_FILENO;
980 pollfds[1].events = POLLIN;
981
982 while (run) {
983 if (input != NULL) {
984 if (fread(&length, sizeof length, 1, input) != 1)
985 return 0;
986 fread(buf, 1, length, input);
987 } else {
988 poll(pollfds, 2, -1);
989 if (pollfds[1].revents) {
990 read(STDIN_FILENO, &c, sizeof c);
991 switch (c) {
992 case 'q':
993 if (output != NULL)
994 fclose(output);
995 return 0;
996 }
997 }
998
999 if (pollfds[0].revents)
1000 length = read(fd, buf, sizeof buf);
1001 else
1002 continue;
1003 }
1004
1005 if (output != NULL) {
1006 fwrite(&length, sizeof length, 1, output);
1007 fwrite(buf, 1, length, output);
1008 }
1009
1010 switch (view) {
1011 case VIEW_TRANSACTION:
1012 handle_packet(buf, length);
1013 break;
1014 case VIEW_PACKET:
1015 print_packet(buf, length);
1016 break;
1017 case VIEW_STATS:
1018 print_stats(buf, length);
1019 break;
1020 }
1021 }
1022
1023 if (output != NULL)
1024 fclose(output);
1025
1026 close(fd);
1027
1028 poptFreeContext(con);
1029
1030 return 0;
1031}
diff --git a/tools/firewire/nosy-dump.h b/tools/firewire/nosy-dump.h
new file mode 100644
index 000000000000..3a4b5b33ba5d
--- /dev/null
+++ b/tools/firewire/nosy-dump.h
@@ -0,0 +1,173 @@
1#ifndef __nosy_dump_h__
2#define __nosy_dump_h__
3
/* Number of elements of a true array (not of a pointer). */
#define array_length(array) (sizeof(array) / sizeof((array)[0]))

/*
 * Ack code helpers.  The ACK_DONE/ACK_BUSY/ACK_ERROR predicates classify
 * an ack code by the bits above its lowest two.  The argument is
 * parenthesized so that expressions such as (x | y) are classified as a
 * whole.
 */
#define ACK_NO_ACK 0x0
#define ACK_DONE(a) (((a) >> 2) == 0)
#define ACK_BUSY(a) (((a) >> 2) == 1)
#define ACK_ERROR(a) (((a) >> 2) == 3)

#include <stddef.h>	/* size_t, used by struct subaction */
#include <stdint.h>
12
/*
 * One captured PHY packet record: a timestamp quadlet, the payload
 * quadlet, a quadlet that print_packet()/print_stats() expect to be the
 * bitwise inverse of the payload, and the ack quadlet.
 *
 * The anonymous union gives several bit-field views of the same payload
 * quadlet; the identifier field, present in every view, selects which
 * view applies (see the PHY_PACKET_* values below).
 *
 * NOTE(review): the order in which a compiler allocates bit-fields is
 * implementation-defined, so these layouts are tied to the ABI the tool
 * is built for -- confirm before porting.
 */
13struct phy_packet {
14 uint32_t timestamp;
15 union {
/* Fields shared by all views; also the layout of a link-on packet. */
16 struct {
17 uint32_t zero:24;
18 uint32_t phy_id:6;
19 uint32_t identifier:2;
20 } common, link_on;
21
/* PHY configuration packet; set_root/set_gap_count flag which settings are present. */
22 struct {
23 uint32_t zero:16;
24 uint32_t gap_count:6;
25 uint32_t set_gap_count:1;
26 uint32_t set_root:1;
27 uint32_t root_id:6;
28 uint32_t identifier:2;
29 } phy_config;
30
/* Self-ID packet; extended == 0 in this view. */
31 struct {
32 uint32_t more_packets:1;
33 uint32_t initiated_reset:1;
34 uint32_t port2:2;
35 uint32_t port1:2;
36 uint32_t port0:2;
37 uint32_t power_class:3;
38 uint32_t contender:1;
39 uint32_t phy_delay:2;
40 uint32_t phy_speed:2;
41 uint32_t gap_count:6;
42 uint32_t link_active:1;
43 uint32_t extended:1;
44 uint32_t phy_id:6;
45 uint32_t identifier:2;
46 } self_id;
47
/* Extended self-ID packet (extended != 0), numbered by sequence. */
48 struct {
49 uint32_t more_packets:1;
50 uint32_t reserved1:1;
51 uint32_t porth:2;
52 uint32_t portg:2;
53 uint32_t portf:2;
54 uint32_t porte:2;
55 uint32_t portd:2;
56 uint32_t portc:2;
57 uint32_t portb:2;
58 uint32_t porta:2;
59 uint32_t reserved0:2;
60 uint32_t sequence:3;
61 uint32_t extended:1;
62 uint32_t phy_id:6;
63 uint32_t identifier:2;
64 } ext_self_id;
65 };
/* Expected to be the bitwise inverse of the payload quadlet above. */
66 uint32_t inverted;
67 uint32_t ack;
68};
69
/* Does not fit the 4-bit tcode field of link packets; presumably a pseudo tcode for PHY packets -- confirm at its users. */
70#define TCODE_PHY_PACKET 0x10
71
/* Values of the identifier field of a PHY packet. */
72#define PHY_PACKET_CONFIGURATION 0x00
73#define PHY_PACKET_LINK_ON 0x01
74#define PHY_PACKET_SELF_ID 0x02
75
/*
 * One captured link packet record: a timestamp quadlet followed by the
 * packet itself.  The anonymous union offers one view per packet type.
 * Every view except iso_data starts with three quadlets of common
 * header, declared as bit-fields in `common` and as an opaque
 * uint32_t[3] in the per-type views.
 *
 * NOTE(review): bit-field allocation order is implementation-defined;
 * the layouts below are tied to the ABI the tool is built for.
 */
76struct link_packet {
77 uint32_t timestamp;
78 union {
/* Header shared by all packet types except iso_data. */
79 struct {
80 uint32_t priority:4;
81 uint32_t tcode:4;
82 uint32_t rt:2;
83 uint32_t tlabel:6;
84 uint32_t destination:16;
85
86 uint32_t offset_high:16;
87 uint32_t source:16;
88
89 uint32_t offset_low;
90 } common;
91
92 struct {
93 uint32_t common[3];
94 uint32_t crc;
95 } read_quadlet;
96
97 struct {
98 uint32_t common[3];
99 uint32_t data;
100 uint32_t crc;
101 } read_quadlet_response;
102
103 struct {
104 uint32_t common[3];
105 uint32_t extended_tcode:16;
106 uint32_t data_length:16;
107 uint32_t crc;
108 } read_block;
109
/* Block packets carry a variable amount of data after the header crc. */
110 struct {
111 uint32_t common[3];
112 uint32_t extended_tcode:16;
113 uint32_t data_length:16;
114 uint32_t crc;
115 uint32_t data[0];
116 /* crc and ack follows. */
117 } read_block_response;
118
119 struct {
120 uint32_t common[3];
121 uint32_t data;
122 uint32_t crc;
123 } write_quadlet;
124
125 struct {
126 uint32_t common[3];
127 uint32_t extended_tcode:16;
128 uint32_t data_length:16;
129 uint32_t crc;
130 uint32_t data[0];
131 /* crc and ack follows. */
132 } write_block;
133
134 struct {
135 uint32_t common[3];
136 uint32_t crc;
137 } write_response;
138
139 struct {
140 uint32_t common[3];
141 uint32_t data;
142 uint32_t crc;
143 } cycle_start;
144
/* iso_data has its own one-quadlet header; tcode has the same width and position as in `common`. */
145 struct {
146 uint32_t sy:4;
147 uint32_t tcode:4;
148 uint32_t channel:6;
149 uint32_t tag:2;
150 uint32_t data_length:16;
151
152 uint32_t crc;
153 } iso_data;
154 };
155};
156
/*
 * One captured request or response packet of a transaction.
 * `link` chains the subaction into the request_list or response_list of
 * its transaction.  `packet` is the last member and ends in views with
 * zero-length data arrays; presumably subaction_create() allocates extra
 * room for the payload behind it -- confirm there.
 */
157struct subaction {
158 uint32_t ack;
159 size_t length;
160 struct list link;
161 struct link_packet packet;
162};
163
/*
 * A transaction as reassembled from captured packets.
 * request/response point at the most recently seen request and response
 * subaction; request_list/response_list hold every subaction seen,
 * including retries.  `link` chains the transaction into the list of
 * pending transactions, from which it is removed once it is complete.
 */
164struct link_transaction {
165 int request_node, response_node, tlabel;
166 struct subaction *request, *response;
167 struct list request_list, response_list;
168 struct list link;
169};
170
/* FCP decoder; declared only in this header, so the meaning of its return value is not visible here. */
171int decode_fcp(struct link_transaction *t);
172
173#endif /* __nosy_dump_h__ */
diff --git a/tools/perf/.gitignore b/tools/perf/.gitignore
index 124760bb37b5..e1d60d780784 100644
--- a/tools/perf/.gitignore
+++ b/tools/perf/.gitignore
@@ -14,6 +14,7 @@ perf*.html
14common-cmds.h 14common-cmds.h
15perf.data 15perf.data
16perf.data.old 16perf.data.old
17perf-archive
17tags 18tags
18TAGS 19TAGS
19cscope* 20cscope*
diff --git a/tools/perf/Documentation/Makefile b/tools/perf/Documentation/Makefile
index bdd3b7ecad0a..bd498d496952 100644
--- a/tools/perf/Documentation/Makefile
+++ b/tools/perf/Documentation/Makefile
@@ -24,7 +24,10 @@ DOC_MAN1=$(patsubst %.txt,%.1,$(MAN1_TXT))
24DOC_MAN5=$(patsubst %.txt,%.5,$(MAN5_TXT)) 24DOC_MAN5=$(patsubst %.txt,%.5,$(MAN5_TXT))
25DOC_MAN7=$(patsubst %.txt,%.7,$(MAN7_TXT)) 25DOC_MAN7=$(patsubst %.txt,%.7,$(MAN7_TXT))
26 26
27# Make the path relative to DESTDIR, not prefix
28ifndef DESTDIR
27prefix?=$(HOME) 29prefix?=$(HOME)
30endif
28bindir?=$(prefix)/bin 31bindir?=$(prefix)/bin
29htmldir?=$(prefix)/share/doc/perf-doc 32htmldir?=$(prefix)/share/doc/perf-doc
30pdfdir?=$(prefix)/share/doc/perf-doc 33pdfdir?=$(prefix)/share/doc/perf-doc
@@ -32,7 +35,6 @@ mandir?=$(prefix)/share/man
32man1dir=$(mandir)/man1 35man1dir=$(mandir)/man1
33man5dir=$(mandir)/man5 36man5dir=$(mandir)/man5
34man7dir=$(mandir)/man7 37man7dir=$(mandir)/man7
35# DESTDIR=
36 38
37ASCIIDOC=asciidoc 39ASCIIDOC=asciidoc
38ASCIIDOC_EXTRA = --unsafe 40ASCIIDOC_EXTRA = --unsafe
diff --git a/tools/perf/Documentation/perf-annotate.txt b/tools/perf/Documentation/perf-annotate.txt
index c9dcade06831..5164a655c39f 100644
--- a/tools/perf/Documentation/perf-annotate.txt
+++ b/tools/perf/Documentation/perf-annotate.txt
@@ -1,5 +1,5 @@
1perf-annotate(1) 1perf-annotate(1)
2============== 2================
3 3
4NAME 4NAME
5---- 5----
diff --git a/tools/perf/Documentation/perf-archive.txt b/tools/perf/Documentation/perf-archive.txt
new file mode 100644
index 000000000000..fae174dc7d01
--- /dev/null
+++ b/tools/perf/Documentation/perf-archive.txt
@@ -0,0 +1,22 @@
1perf-archive(1)
2===============
3
4NAME
5----
6perf-archive - Create archive with object files with build-ids found in perf.data file
7
8SYNOPSIS
9--------
10[verse]
11'perf archive' [file]
12
13DESCRIPTION
14-----------
15This command runs perf-buildid-list --with-hits, and collects the files
16with the buildids found so that analysis of perf.data contents can be possible
17on another machine.
18
19
20SEE ALSO
21--------
22linkperf:perf-record[1], linkperf:perf-buildid-list[1], linkperf:perf-report[1]
diff --git a/tools/perf/Documentation/perf-bench.txt b/tools/perf/Documentation/perf-bench.txt
index ae525ac5a2ce..a3dbadb26ef5 100644
--- a/tools/perf/Documentation/perf-bench.txt
+++ b/tools/perf/Documentation/perf-bench.txt
@@ -1,5 +1,5 @@
1perf-bench(1) 1perf-bench(1)
2============ 2=============
3 3
4NAME 4NAME
5---- 5----
@@ -19,12 +19,12 @@ COMMON OPTIONS
19-f:: 19-f::
20--format=:: 20--format=::
21Specify format style. 21Specify format style.
22Current available format styles are, 22Current available format styles are:
23 23
24'default':: 24'default'::
25Default style. This is mainly for human reading. 25Default style. This is mainly for human reading.
26--------------------- 26---------------------
27% perf bench sched pipe # with no style specify 27% perf bench sched pipe # with no style specified
28(executing 1000000 pipe operations between two tasks) 28(executing 1000000 pipe operations between two tasks)
29 Total time:5.855 sec 29 Total time:5.855 sec
30 5.855061 usecs/op 30 5.855061 usecs/op
@@ -79,7 +79,7 @@ options (20 sender and receiver processes per group)
79 79
80 Total time:0.308 sec 80 Total time:0.308 sec
81 81
82% perf bench sched messaging -t -g 20 # be multi-thread,with 20 groups 82% perf bench sched messaging -t -g 20 # be multi-thread, with 20 groups
83(20 sender and receiver threads per group) 83(20 sender and receiver threads per group)
84(20 groups == 800 threads run) 84(20 groups == 800 threads run)
85 85
diff --git a/tools/perf/Documentation/perf-buildid-cache.txt b/tools/perf/Documentation/perf-buildid-cache.txt
new file mode 100644
index 000000000000..5d1a9500277f
--- /dev/null
+++ b/tools/perf/Documentation/perf-buildid-cache.txt
@@ -0,0 +1,33 @@
1perf-buildid-cache(1)
2=====================
3
4NAME
5----
6perf-buildid-cache - Manage build-id cache.
7
8SYNOPSIS
9--------
10[verse]
11'perf buildid-cache <options>'
12
13DESCRIPTION
14-----------
15This command manages the build-id cache. It can add and remove files to the
16cache. In the future it should as well purge older entries, set upper limits
17for the space used by the cache, etc.
18
19OPTIONS
20-------
21-a::
22--add=::
23 Add specified file to the cache.
24-r::
25--remove=::
26 Remove specified file from the cache.
27-v::
28--verbose::
29 Be more verbose.
30
31SEE ALSO
32--------
33linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-buildid-list[1]
diff --git a/tools/perf/Documentation/perf-diff.txt b/tools/perf/Documentation/perf-diff.txt
index 8974e208cba6..20d97d84ea1c 100644
--- a/tools/perf/Documentation/perf-diff.txt
+++ b/tools/perf/Documentation/perf-diff.txt
@@ -1,5 +1,5 @@
1perf-diff(1) 1perf-diff(1)
2============== 2============
3 3
4NAME 4NAME
5---- 5----
diff --git a/tools/perf/Documentation/perf-inject.txt b/tools/perf/Documentation/perf-inject.txt
new file mode 100644
index 000000000000..025630d43cd2
--- /dev/null
+++ b/tools/perf/Documentation/perf-inject.txt
@@ -0,0 +1,35 @@
1perf-inject(1)
2==============
3
4NAME
5----
6perf-inject - Filter to augment the events stream with additional information
7
8SYNOPSIS
9--------
10[verse]
11'perf inject <options>'
12
13DESCRIPTION
14-----------
15perf-inject reads a perf-record event stream and repipes it to stdout. At any
16point the processing code can inject other events into the event stream - in
17this case build-ids (-b option) are read and injected as needed into the event
18stream.
19
20Build-ids are just the first user of perf-inject - potentially anything that
21needs userspace processing to augment the events stream with additional
22information could make use of this facility.
23
24OPTIONS
25-------
26-b::
27--build-ids=::
28 Inject build-ids into the output stream
29-v::
30--verbose::
31 Be more verbose.
32
33SEE ALSO
34--------
35linkperf:perf-record[1], linkperf:perf-report[1], linkperf:perf-archive[1]
diff --git a/tools/perf/Documentation/perf-kmem.txt b/tools/perf/Documentation/perf-kmem.txt
index eac4d852e7cd..a52fcde894c7 100644
--- a/tools/perf/Documentation/perf-kmem.txt
+++ b/tools/perf/Documentation/perf-kmem.txt
@@ -1,5 +1,5 @@
1perf-kmem(1) 1perf-kmem(1)
2============== 2============
3 3
4NAME 4NAME
5---- 5----
diff --git a/tools/perf/Documentation/perf-kvm.txt b/tools/perf/Documentation/perf-kvm.txt
new file mode 100644
index 000000000000..d004e19fe6d6
--- /dev/null
+++ b/tools/perf/Documentation/perf-kvm.txt
@@ -0,0 +1,68 @@
1perf-kvm(1)
2===========
3
4NAME
5----
6perf-kvm - Tool to trace/measure kvm guest os
7
8SYNOPSIS
9--------
10[verse]
11'perf kvm' [--host] [--guest] [--guestmount=<path>
12 [--guestkallsyms=<path> --guestmodules=<path> | --guestvmlinux=<path>]]
13 {top|record|report|diff|buildid-list}
14'perf kvm' [--host] [--guest] [--guestkallsyms=<path> --guestmodules=<path>
15 | --guestvmlinux=<path>] {top|record|report|diff|buildid-list}
16
17DESCRIPTION
18-----------
19There are a couple of variants of perf kvm:
20
21 'perf kvm [options] top <command>' to generate and display
22 a performance counter profile of guest os in realtime
23 of an arbitrary workload.
24
25 'perf kvm record <command>' to record the performance counter profile
26 of an arbitrary workload and save it into a perf data file. If both
27 --host and --guest are input, the perf data file name is perf.data.kvm.
28 If there is no --host but --guest, the file name is perf.data.guest.
29 If there is no --guest but --host, the file name is perf.data.host.
30
31 'perf kvm report' to display the performance counter profile information
32 recorded via perf kvm record.
33
34 'perf kvm diff' to display the performance difference between two perf.data
35 files captured via perf record.
36
37 'perf kvm buildid-list' to display the buildids found in a perf data file,
38 so that other tools can be used to fetch packages with matching symbol tables
39 for use by perf report.
40
41OPTIONS
42-------
43--host=::
44 Collect host side performance profile.
45--guest=::
46 Collect guest side performance profile.
47--guestmount=<path>::
48 Guest os root file system mount directory. Users mount guest os
49 root directories under <path> by a specific filesystem access method,
50 typically, sshfs. For example, start 2 guest os. The one's pid is 8888
51 and the other's is 9999.
52 #mkdir ~/guestmount; cd ~/guestmount
53 #sshfs -o allow_other,direct_io -p 5551 localhost:/ 8888/
54 #sshfs -o allow_other,direct_io -p 5552 localhost:/ 9999/
55 #perf kvm --host --guest --guestmount=~/guestmount top
56--guestkallsyms=<path>::
57 Guest os /proc/kallsyms file copy. 'perf' kvm' reads it to get guest
58 kernel symbols. Users copy it out from guest os.
59--guestmodules=<path>::
60 Guest os /proc/modules file copy. 'perf kvm' reads it to get guest
61 kernel module information. Users copy it out from guest os.
62--guestvmlinux=<path>::
63 Guest os kernel vmlinux.
64
65SEE ALSO
66--------
67linkperf:perf-top[1], linkperf:perf-record[1], linkperf:perf-report[1],
68linkperf:perf-diff[1], linkperf:perf-buildid-list[1]
diff --git a/tools/perf/Documentation/perf-list.txt b/tools/perf/Documentation/perf-list.txt
index 8290b9422668..43e3dd284b90 100644
--- a/tools/perf/Documentation/perf-list.txt
+++ b/tools/perf/Documentation/perf-list.txt
@@ -15,6 +15,35 @@ DESCRIPTION
15This command displays the symbolic event types which can be selected in the 15This command displays the symbolic event types which can be selected in the
16various perf commands with the -e option. 16various perf commands with the -e option.
17 17
18RAW HARDWARE EVENT DESCRIPTOR
19-----------------------------
20Even when an event is not available in a symbolic form within perf right now,
21it can be encoded in a per processor specific way.
22
23For instance, for x86 CPUs NNN represents the raw register encoding with the
24layout of IA32_PERFEVTSELx MSRs (see [Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide] Figure 30-1 Layout
25of IA32_PERFEVTSELx MSRs) or AMD's PerfEvtSeln (see [AMD64 Architecture Programmer’s Manual Volume 2: System Programming], Page 344,
26Figure 13-7 Performance Event-Select Register (PerfEvtSeln)).
27
28Example:
29
30If the Intel docs for a QM720 Core i7 describe an event as:
31
32 Event Umask Event Mask
33 Num. Value Mnemonic Description Comment
34
35 A8H 01H LSD.UOPS Counts the number of micro-ops Use cmask=1 and
36 delivered by loop stream detector invert to count
37 cycles
38
39raw encoding of 0x1A8 can be used:
40
41 perf stat -e r1a8 -a sleep 1
42 perf record -e r1a8 ...
43
44You should refer to the processor specific documentation for getting these
45details. Some of them are referenced in the SEE ALSO section below.
46
18OPTIONS 47OPTIONS
19------- 48-------
20None 49None
@@ -22,4 +51,6 @@ None
22SEE ALSO 51SEE ALSO
23-------- 52--------
24linkperf:perf-stat[1], linkperf:perf-top[1], 53linkperf:perf-stat[1], linkperf:perf-top[1],
25linkperf:perf-record[1] 54linkperf:perf-record[1],
55http://www.intel.com/Assets/PDF/manual/253669.pdf[Intel® 64 and IA-32 Architectures Software Developer's Manual Volume 3B: System Programming Guide],
56http://support.amd.com/us/Processor_TechDocs/24593.pdf[AMD64 Architecture Programmer’s Manual Volume 2: System Programming]
diff --git a/tools/perf/Documentation/perf-lock.txt b/tools/perf/Documentation/perf-lock.txt
new file mode 100644
index 000000000000..b317102138c8
--- /dev/null
+++ b/tools/perf/Documentation/perf-lock.txt
@@ -0,0 +1,29 @@
1perf-lock(1)
2============
3
4NAME
5----
6perf-lock - Analyze lock events
7
8SYNOPSIS
9--------
10[verse]
11'perf lock' {record|report|trace}
12
13DESCRIPTION
14-----------
15You can analyze various lock behaviours
16and statistics with this 'perf lock' command.
17
18 'perf lock record <command>' records lock events
19 between start and end <command>. And this command
20 produces the file "perf.data" which contains tracing
21 results of lock events.
22
23 'perf lock trace' shows raw lock events.
24
25 'perf lock report' reports statistical data.
26
27SEE ALSO
28--------
29linkperf:perf[1]
diff --git a/tools/perf/Documentation/perf-probe.txt b/tools/perf/Documentation/perf-probe.txt
index 250e391b4bc8..94a258c96a44 100644
--- a/tools/perf/Documentation/perf-probe.txt
+++ b/tools/perf/Documentation/perf-probe.txt
@@ -15,6 +15,8 @@ or
15'perf probe' [options] --del='[GROUP:]EVENT' [...] 15'perf probe' [options] --del='[GROUP:]EVENT' [...]
16or 16or
17'perf probe' --list 17'perf probe' --list
18or
19'perf probe' --line='FUNC[:RLN[+NUM|:RLN2]]|SRC:ALN[+NUM|:ALN2]'
18 20
19DESCRIPTION 21DESCRIPTION
20----------- 22-----------
@@ -39,22 +41,105 @@ OPTIONS
39 41
40-d:: 42-d::
41--del=:: 43--del=::
42 Delete a probe event. 44 Delete probe events. This accepts glob wildcards('*', '?') and character
45 classes(e.g. [a-z], [!A-Z]).
43 46
44-l:: 47-l::
45--list:: 48--list::
46 List up current probe events. 49 List up current probe events.
47 50
51-L::
52--line=::
53 Show source code lines which can be probed. This needs an argument
54 which specifies a range of the source code. (see LINE SYNTAX for detail)
55
56-f::
57--force::
58 Forcibly add events with existing name.
59
60-n::
61--dry-run::
62 Dry run. With this option, --add and --del don't execute actual
63 adding and removal operations.
64
65--max-probes::
66 Set the maximum number of probe points for an event. Default is 128.
67
48PROBE SYNTAX 68PROBE SYNTAX
49------------ 69------------
50Probe points are defined by following syntax. 70Probe points are defined by following syntax.
51 71
52 "[EVENT=]FUNC[+OFFS|:RLN|%return][@SRC]|SRC:ALN [ARG ...]" 72 1) Define event based on function name
73 [EVENT=]FUNC[@SRC][:RLN|+OFFS|%return|;PTN] [ARG ...]
74
75 2) Define event based on source file with line number
76 [EVENT=]SRC:ALN [ARG ...]
77
78 3) Define event based on source file with lazy pattern
79 [EVENT=]SRC;PTN [ARG ...]
80
53 81
54'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'. 82'EVENT' specifies the name of new event, if omitted, it will be set the name of the probed function. Currently, event group name is set as 'probe'.
55'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, 'RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. In addition, 'SRC' specifies a source file which has that function. 83'FUNC' specifies a probed function name, and it may have one of the following options; '+OFFS' is the offset from function entry address in bytes, ':RLN' is the relative-line number from function entry line, and '%return' means that it probes function return. And ';PTN' means lazy matching pattern (see LAZY MATCHING). Note that ';PTN' must be the end of the probe point definition. In addition, '@SRC' specifies a source file which has that function.
56It is also possible to specify a probe point by the source line number by using 'SRC:ALN' syntax, where 'SRC' is the source file path and 'ALN' is the line number. 84It is also possible to specify a probe point by the source line number or lazy matching by using 'SRC:ALN' or 'SRC;PTN' syntax, where 'SRC' is the source file path, ':ALN' is the line number and ';PTN' is the lazy matching pattern.
57'ARG' specifies the arguments of this probe point. You can use the name of local variable, or kprobe-tracer argument format (e.g. $retval, %ax, etc). 85'ARG' specifies the arguments of this probe point, (see PROBE ARGUMENT).
86
87PROBE ARGUMENT
88--------------
89Each probe argument follows below syntax.
90
91 [NAME=]LOCALVAR|$retval|%REG|@SYMBOL[:TYPE]
92
93'NAME' specifies the name of this argument (optional). You can use the name of local variable, local data structure member (e.g. var->field, var.field2), or kprobe-tracer argument format (e.g. $retval, %ax, etc). Note that the name of this argument will be set as the last member name if you specify a local data structure member (e.g. field2 for 'var->field1.field2'.)
94'TYPE' casts the type of this argument (optional). If omitted, perf probe automatically sets the type based on debuginfo.
95
96LINE SYNTAX
97-----------
98Line range is described by the following syntax.
99
100 "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]"
101
102FUNC specifies the function name of showing lines. 'RLN' is the start line
103number from function entry line, and 'RLN2' is the end line number. As same as
104probe syntax, 'SRC' means the source file path, 'ALN' is start line number,
105and 'ALN2' is end line number in the file. It is also possible to specify how
106many lines to show by using 'NUM'.
107So, "source.c:100-120" shows lines from the 100th to the 120th in the source.c file. And "func:10+20" shows 20 lines from the 10th line of the func function.
108
109LAZY MATCHING
110-------------
111 The lazy line matching is similar to glob matching but ignoring spaces in both of pattern and target. So this accepts wildcards('*', '?') and character classes(e.g. [a-z], [!A-Z]).
112
113e.g.
114 'a=*' can match 'a=b', 'a = b', 'a == b' and so on.
115
116This provides some sort of flexibility and robustness to probe point definitions against minor code changes. For example, the actual 10th line of schedule() can be moved easily by modifying schedule(), but the same line matching 'rq=cpu_rq*' may still exist in the function.
117
118
119EXAMPLES
120--------
121Display which lines in schedule() can be probed:
122
123 ./perf probe --line schedule
124
125Add a probe on schedule() function 12th line with recording cpu local variable:
126
127 ./perf probe schedule:12 cpu
128 or
129 ./perf probe --add='schedule:12 cpu'
130
131 this will add one or more probes whose names start with "schedule".
132
133 Add probes on lines in schedule() function which calls update_rq_clock().
134
135 ./perf probe 'schedule;update_rq_clock*'
136 or
137 ./perf probe --add='schedule;update_rq_clock*'
138
139Delete all probes on schedule().
140
141 ./perf probe --del='schedule*'
142
58 143
59SEE ALSO 144SEE ALSO
60-------- 145--------
diff --git a/tools/perf/Documentation/perf-record.txt b/tools/perf/Documentation/perf-record.txt
index fc46c0b40f6e..34e255fc3e2f 100644
--- a/tools/perf/Documentation/perf-record.txt
+++ b/tools/perf/Documentation/perf-record.txt
@@ -58,7 +58,7 @@ OPTIONS
58 58
59-f:: 59-f::
60--force:: 60--force::
61 Overwrite existing data file. 61 Overwrite existing data file. (deprecated)
62 62
63-c:: 63-c::
64--count=:: 64--count=::
@@ -69,8 +69,8 @@ OPTIONS
69 Output file name. 69 Output file name.
70 70
71-i:: 71-i::
72--inherit:: 72--no-inherit::
73 Child tasks inherit counters. 73 Child tasks do not inherit counters.
74-F:: 74-F::
75--freq=:: 75--freq=::
76 Profile at this frequency. 76 Profile at this frequency.
@@ -101,7 +101,7 @@ OPTIONS
101 101
102-R:: 102-R::
103--raw-samples:: 103--raw-samples::
104Collect raw sample records from all opened counters (typically for tracepoint counters). 104Collect raw sample records from all opened counters (default for tracepoint counters).
105 105
106SEE ALSO 106SEE ALSO
107-------- 107--------
diff --git a/tools/perf/Documentation/perf-sched.txt b/tools/perf/Documentation/perf-sched.txt
index 1ce79198997b..8417644a6166 100644
--- a/tools/perf/Documentation/perf-sched.txt
+++ b/tools/perf/Documentation/perf-sched.txt
@@ -12,7 +12,7 @@ SYNOPSIS
12 12
13DESCRIPTION 13DESCRIPTION
14----------- 14-----------
15There's four variants of perf sched: 15There are four variants of perf sched:
16 16
17 'perf sched record <command>' to record the scheduling events 17 'perf sched record <command>' to record the scheduling events
18 of an arbitrary workload. 18 of an arbitrary workload.
@@ -27,7 +27,7 @@ There's four variants of perf sched:
27 via perf sched record. (this is done by starting up mockup threads 27 via perf sched record. (this is done by starting up mockup threads
28 that mimic the workload based on the events in the trace. These 28 that mimic the workload based on the events in the trace. These
29 threads can then replay the timings (CPU runtime and sleep patterns) 29 threads can then replay the timings (CPU runtime and sleep patterns)
30 of the workload as it occured when it was recorded - and can repeat 30 of the workload as it occurred when it was recorded - and can repeat
31 it a number of times, measuring its performance.) 31 it a number of times, measuring its performance.)
32 32
33OPTIONS 33OPTIONS
diff --git a/tools/perf/Documentation/perf-stat.txt b/tools/perf/Documentation/perf-stat.txt
index 484080dd5b6f..909fa766fa1c 100644
--- a/tools/perf/Documentation/perf-stat.txt
+++ b/tools/perf/Documentation/perf-stat.txt
@@ -31,8 +31,8 @@ OPTIONS
31 hexadecimal event descriptor. 31 hexadecimal event descriptor.
32 32
33-i:: 33-i::
34--inherit:: 34--no-inherit::
35 child tasks inherit counters 35 child tasks do not inherit counters
36-p:: 36-p::
37--pid=<pid>:: 37--pid=<pid>::
38 stat events on existing pid 38 stat events on existing pid
@@ -43,6 +43,9 @@ OPTIONS
43-c:: 43-c::
44 scale counter values 44 scale counter values
45 45
46-B::
47 print large numbers with thousands' separators according to locale
48
46EXAMPLES 49EXAMPLES
47-------- 50--------
48 51
diff --git a/tools/perf/Documentation/perf-test.txt b/tools/perf/Documentation/perf-test.txt
new file mode 100644
index 000000000000..1c4b5f5b7f71
--- /dev/null
+++ b/tools/perf/Documentation/perf-test.txt
@@ -0,0 +1,22 @@
1perf-test(1)
2============
3
4NAME
5----
6perf-test - Runs sanity tests.
7
8SYNOPSIS
9--------
10[verse]
11'perf test <options>'
12
13DESCRIPTION
14-----------
15This command does assorted sanity tests, initially thru linked routines but
16also will look for a directory with more tests in the form of scripts.
17
18OPTIONS
19-------
20-v::
21--verbose::
22 Be more verbose.
diff --git a/tools/perf/Documentation/perf-top.txt b/tools/perf/Documentation/perf-top.txt
index 4a7d558dc309..785b9fc32a46 100644
--- a/tools/perf/Documentation/perf-top.txt
+++ b/tools/perf/Documentation/perf-top.txt
@@ -74,7 +74,7 @@ OPTIONS
74 74
75-s <symbol>:: 75-s <symbol>::
76--sym-annotate=<symbol>:: 76--sym-annotate=<symbol>::
77 Annotate this symbol. Requires -k option. 77 Annotate this symbol.
78 78
79-v:: 79-v::
80--verbose:: 80--verbose::
diff --git a/tools/perf/Documentation/perf-trace-perl.txt b/tools/perf/Documentation/perf-trace-perl.txt
index c5f55f439091..ee6525ee6d69 100644
--- a/tools/perf/Documentation/perf-trace-perl.txt
+++ b/tools/perf/Documentation/perf-trace-perl.txt
@@ -8,7 +8,7 @@ perf-trace-perl - Process trace data with a Perl script
8SYNOPSIS 8SYNOPSIS
9-------- 9--------
10[verse] 10[verse]
11'perf trace' [-s [lang]:script[.ext] ] 11'perf trace' [-s [Perl]:script[.pl] ]
12 12
13DESCRIPTION 13DESCRIPTION
14----------- 14-----------
@@ -49,12 +49,10 @@ available as calls back into the perf executable (see below).
49As an example, the following perf record command can be used to record 49As an example, the following perf record command can be used to record
50all sched_wakeup events in the system: 50all sched_wakeup events in the system:
51 51
52 # perf record -c 1 -f -a -M -R -e sched:sched_wakeup 52 # perf record -a -e sched:sched_wakeup
53 53
54Traces meant to be processed using a script should be recorded with 54Traces meant to be processed using a script should be recorded with
55the above options: -c 1 says to sample every event, -a to enable 55the above option: -a to enable system-wide collection.
56system-wide collection, -M to multiplex the output, and -R to collect
57raw samples.
58 56
59The format file for the sched_wakep event defines the following fields 57The format file for the sched_wakep event defines the following fields
60(see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format): 58(see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format):
diff --git a/tools/perf/Documentation/perf-trace-python.txt b/tools/perf/Documentation/perf-trace-python.txt
new file mode 100644
index 000000000000..693be804dd3d
--- /dev/null
+++ b/tools/perf/Documentation/perf-trace-python.txt
@@ -0,0 +1,623 @@
1perf-trace-python(1)
2====================
3
4NAME
5----
6perf-trace-python - Process trace data with a Python script
7
8SYNOPSIS
9--------
10[verse]
11'perf trace' [-s [Python]:script[.py] ]
12
13DESCRIPTION
14-----------
15
16This perf trace option is used to process perf trace data using perf's
17built-in Python interpreter. It reads and processes the input file and
18displays the results of the trace analysis implemented in the given
19Python script, if any.
20
21A QUICK EXAMPLE
22---------------
23
24This section shows the process, start to finish, of creating a working
25Python script that aggregates and extracts useful information from a
26raw perf trace stream. You can avoid reading the rest of this
27document if an example is enough for you; the rest of the document
28provides more details on each step and lists the library functions
29available to script writers.
30
31This example actually details the steps that were used to create the
32'syscall-counts' script you see when you list the available perf trace
33scripts via 'perf trace -l'. As such, this script also shows how to
34integrate your script into the list of general-purpose 'perf trace'
35scripts listed by that command.
36
37The syscall-counts script is a simple script, but demonstrates all the
38basic ideas necessary to create a useful script. Here's an example
39of its output (syscall names are not yet supported, they will appear
40as numbers):
41
42----
43syscall events:
44
45event count
46---------------------------------------- -----------
47sys_write 455067
48sys_getdents 4072
49sys_close 3037
50sys_swapoff 1769
51sys_read 923
52sys_sched_setparam 826
53sys_open 331
54sys_newfstat 326
55sys_mmap 217
56sys_munmap 216
57sys_futex 141
58sys_select 102
59sys_poll 84
60sys_setitimer 12
61sys_writev 8
6215 8
63sys_lseek 7
64sys_rt_sigprocmask 6
65sys_wait4 3
66sys_ioctl 3
67sys_set_robust_list 1
68sys_exit 1
6956 1
70sys_access 1
71----
72
73Basically our task is to keep a per-syscall tally that gets updated
74every time a system call occurs in the system. Our script will do
75that, but first we need to record the data that will be processed by
76that script. Theoretically, there are a couple of ways we could do
77that:
78
79- we could enable every event under the tracing/events/syscalls
80 directory, but this is over 600 syscalls, well beyond the number
81 allowable by perf. These individual syscall events will however be
82 useful if we want to later use the guidance we get from the
83 general-purpose scripts to drill down and get more detail about
84 individual syscalls of interest.
85
86- we can enable the sys_enter and/or sys_exit syscalls found under
87 tracing/events/raw_syscalls. These are called for all syscalls; the
88 'id' field can be used to distinguish between individual syscall
89 numbers.
90
91For this script, we only need to know that a syscall was entered; we
92don't care how it exited, so we'll use 'perf record' to record only
93the sys_enter events:
94
95----
96# perf record -a -e raw_syscalls:sys_enter
97
98^C[ perf record: Woken up 1 times to write data ]
99[ perf record: Captured and wrote 56.545 MB perf.data (~2470503 samples) ]
100----
101
102The options basically say to collect data for every syscall event
103system-wide and multiplex the per-cpu output into a single stream.
104That single stream will be recorded in a file in the current directory
105called perf.data.
106
107Once we have a perf.data file containing our data, we can use the -g
108'perf trace' option to generate a Python script that will contain a
109callback handler for each event type found in the perf.data trace
110stream (for more details, see the STARTER SCRIPTS section).
111
112----
113# perf trace -g python
114generated Python script: perf-trace.py
115
116The output file created also in the current directory is named
117perf-trace.py. Here's the file in its entirety:
118
119# perf trace event handlers, generated by perf trace -g python
120# Licensed under the terms of the GNU GPL License version 2
121
122# The common_* event handler fields are the most useful fields common to
123# all events. They don't necessarily correspond to the 'common_*' fields
124# in the format files. Those fields not available as handler params can
125# be retrieved using Python functions of the form common_*(context).
126# See the perf-trace-python Documentation for the list of available functions.
127
128import os
129import sys
130
131sys.path.append(os.environ['PERF_EXEC_PATH'] + \
132 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
133
134from perf_trace_context import *
135from Core import *
136
137def trace_begin():
138 print "in trace_begin"
139
140def trace_end():
141 print "in trace_end"
142
143def raw_syscalls__sys_enter(event_name, context, common_cpu,
144 common_secs, common_nsecs, common_pid, common_comm,
145 id, args):
146 print_header(event_name, common_cpu, common_secs, common_nsecs,
147 common_pid, common_comm)
148
149 print "id=%d, args=%s\n" % \
150 (id, args),
151
152def trace_unhandled(event_name, context, common_cpu, common_secs, common_nsecs,
153 common_pid, common_comm):
154 print_header(event_name, common_cpu, common_secs, common_nsecs,
155 common_pid, common_comm)
156
157def print_header(event_name, cpu, secs, nsecs, pid, comm):
158 print "%-20s %5u %05u.%09u %8u %-20s " % \
159 (event_name, cpu, secs, nsecs, pid, comm),
160----
161
162At the top is a comment block followed by some import statements and a
163path append which every perf trace script should include.
164
165Following that are a couple generated functions, trace_begin() and
166trace_end(), which are called at the beginning and the end of the
167script respectively (for more details, see the SCRIPT LAYOUT section
168below).
169
170Following those are the 'event handler' functions generated one for
171every event in the 'perf record' output. The handler functions take
172the form subsystem__event_name, and contain named parameters, one for
173each field in the event; in this case, there's only one event,
174raw_syscalls__sys_enter(). (see the EVENT HANDLERS section below for
175more info on event handlers).
176
177The final couple of functions are, like the begin and end functions,
178generated for every script. The first, trace_unhandled(), is called
179every time the script finds an event in the perf.data file that
180doesn't correspond to any event handler in the script. This could
181mean either that the record step recorded event types that it wasn't
182really interested in, or the script was run against a trace file that
183doesn't correspond to the script.
184
185The script generated by -g option simply prints a line for each
186event found in the trace stream i.e. it basically just dumps the event
187and its parameter values to stdout. The print_header() function is
188simply a utility function used for that purpose. Let's rename the
189script and run it to see the default output:
190
191----
192# mv perf-trace.py syscall-counts.py
193# perf trace -s syscall-counts.py
194
195raw_syscalls__sys_enter 1 00840.847582083 7506 perf id=1, args=
196raw_syscalls__sys_enter 1 00840.847595764 7506 perf id=1, args=
197raw_syscalls__sys_enter 1 00840.847620860 7506 perf id=1, args=
198raw_syscalls__sys_enter 1 00840.847710478 6533 npviewer.bin id=78, args=
199raw_syscalls__sys_enter 1 00840.847719204 6533 npviewer.bin id=142, args=
200raw_syscalls__sys_enter 1 00840.847755445 6533 npviewer.bin id=3, args=
201raw_syscalls__sys_enter 1 00840.847775601 6533 npviewer.bin id=3, args=
202raw_syscalls__sys_enter 1 00840.847781820 6533 npviewer.bin id=3, args=
203.
204.
205.
206----
207
208Of course, for this script, we're not interested in printing every
209trace event, but rather aggregating it in a useful way. So we'll get
210rid of everything to do with printing as well as the trace_begin() and
211trace_unhandled() functions, which we won't be using. That leaves us
212with this minimalistic skeleton:
213
214----
215import os
216import sys
217
218sys.path.append(os.environ['PERF_EXEC_PATH'] + \
219 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
220
221from perf_trace_context import *
222from Core import *
223
224def trace_end():
225 print "in trace_end"
226
227def raw_syscalls__sys_enter(event_name, context, common_cpu,
228 common_secs, common_nsecs, common_pid, common_comm,
229 id, args):
230----
231
232In trace_end(), we'll simply print the results, but first we need to
233generate some results to print. To do that we need to have our
234sys_enter() handler do the necessary tallying until all events have
235been counted. A hash table indexed by syscall id is a good way to
236store that information; every time the sys_enter() handler is called,
237we simply increment a count associated with that hash entry indexed by
238that syscall id:
239
240----
241 syscalls = autodict()
242
243 try:
244 syscalls[id] += 1
245 except TypeError:
246 syscalls[id] = 1
247----
248
249The syscalls 'autodict' object is a special kind of Python dictionary
250(implemented in Core.py) that implements Perl's 'autovivifying' hashes
251in Python i.e. with autovivifying hashes, you can assign nested hash
252values without having to go to the trouble of creating intermediate
253levels if they don't exist e.g syscalls[comm][pid][id] = 1 will create
254the intermediate hash levels and finally assign the value 1 to the
255hash entry for 'id' (because the value being assigned isn't a hash
256object itself, the initial value is assigned in the TypeError
257exception. Well, there may be a better way to do this in Python but
258that's what works for now).
259
260Putting that code into the raw_syscalls__sys_enter() handler, we
261effectively end up with a single-level dictionary keyed on syscall id
262and having the counts we've tallied as values.
263
264The print_syscall_totals() function iterates over the entries in the
265dictionary and displays a line for each entry containing the syscall
266name (the dictionary keys contain the syscall ids, which are passed to
267the Util function syscall_name(), which translates the raw syscall
268numbers to the corresponding syscall name strings). The output is
269displayed after all the events in the trace have been processed, by
270calling the print_syscall_totals() function from the trace_end()
271handler called at the end of script processing.
272
273The final script producing the output shown above is shown in its
274entirety below (syscall_name() helper is not yet available, you can
275only deal with id's for now):
276
277----
278import os
279import sys
280
281sys.path.append(os.environ['PERF_EXEC_PATH'] + \
282 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
283
284from perf_trace_context import *
285from Core import *
286from Util import *
287
288syscalls = autodict()
289
290def trace_end():
291 print_syscall_totals()
292
293def raw_syscalls__sys_enter(event_name, context, common_cpu,
294 common_secs, common_nsecs, common_pid, common_comm,
295 id, args):
296 try:
297 syscalls[id] += 1
298 except TypeError:
299 syscalls[id] = 1
300
301def print_syscall_totals():
302 if for_comm is not None:
303 print "\nsyscall events for %s:\n\n" % (for_comm),
304 else:
305 print "\nsyscall events:\n\n",
306
307 print "%-40s %10s\n" % ("event", "count"),
308 print "%-40s %10s\n" % ("----------------------------------------", \
309 "-----------"),
310
311 for id, val in sorted(syscalls.iteritems(), key = lambda(k, v): (v, k), \
312 reverse = True):
313 print "%-40s %10d\n" % (syscall_name(id), val),
314----
315
316The script can be run just as before:
317
318 # perf trace -s syscall-counts.py
319
320So those are the essential steps in writing and running a script. The
321process can be generalized to any tracepoint or set of tracepoints
322you're interested in - basically find the tracepoint(s) you're
323interested in by looking at the list of available events shown by
324'perf list' and/or look in /sys/kernel/debug/tracing/events for
325detailed event and field info, record the corresponding trace data
326using 'perf record', passing it the list of interesting events,
327generate a skeleton script using 'perf trace -g python' and modify the
328code to aggregate and display it for your particular needs.
329
330After you've done that you may end up with a general-purpose script
331that you want to keep around and have available for future use. By
332writing a couple of very simple shell scripts and putting them in the
333right place, you can have your script listed alongside the other
334scripts listed by the 'perf trace -l' command e.g.:
335
336----
337root@tropicana:~# perf trace -l
338List of available trace scripts:
339 workqueue-stats workqueue stats (ins/exe/create/destroy)
340 wakeup-latency system-wide min/max/avg wakeup latency
341 rw-by-file <comm> r/w activity for a program, by file
342 rw-by-pid system-wide r/w activity
343----
344
345A nice side effect of doing this is that you also then capture the
346probably lengthy 'perf record' command needed to record the events for
347the script.
348
349To have the script appear as a 'built-in' script, you write two simple
350scripts, one for recording and one for 'reporting'.
351
352The 'record' script is a shell script with the same base name as your
353script, but with -record appended. The shell script should be put
354into the perf/scripts/python/bin directory in the kernel source tree.
355In that script, you write the 'perf record' command-line needed for
356your script:
357
358----
359# cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-record
360
361#!/bin/bash
362perf record -a -e raw_syscalls:sys_enter
363----
364
365The 'report' script is also a shell script with the same base name as
366your script, but with -report appended. It should also be located in
367the perf/scripts/python/bin directory. In that script, you write the
368'perf trace -s' command-line needed for running your script:
369
370----
371# cat kernel-source/tools/perf/scripts/python/bin/syscall-counts-report
372
373#!/bin/bash
374# description: system-wide syscall counts
375perf trace -s ~/libexec/perf-core/scripts/python/syscall-counts.py
376----
377
378Note that the location of the Python script given in the shell script
379is in the libexec/perf-core/scripts/python directory - this is where
380the script will be copied by 'make install' when you install perf.
381For the installation to install your script there, your script needs
382to be located in the perf/scripts/python directory in the kernel
383source tree:
384
385----
386# ls -al kernel-source/tools/perf/scripts/python
387
388root@tropicana:/home/trz/src/tip# ls -al tools/perf/scripts/python
389total 32
390drwxr-xr-x 4 trz trz 4096 2010-01-26 22:30 .
391drwxr-xr-x 4 trz trz 4096 2010-01-26 22:29 ..
392drwxr-xr-x 2 trz trz 4096 2010-01-26 22:29 bin
393-rw-r--r-- 1 trz trz 2548 2010-01-26 22:29 check-perf-trace.py
394drwxr-xr-x 3 trz trz 4096 2010-01-26 22:49 Perf-Trace-Util
395-rw-r--r-- 1 trz trz 1462 2010-01-26 22:30 syscall-counts.py
396----
397
398Once you've done that (don't forget to do a new 'make install',
399otherwise your script won't show up at run-time), 'perf trace -l'
400should show a new entry for your script:
401
402----
403root@tropicana:~# perf trace -l
404List of available trace scripts:
405 workqueue-stats workqueue stats (ins/exe/create/destroy)
406 wakeup-latency system-wide min/max/avg wakeup latency
407 rw-by-file <comm> r/w activity for a program, by file
408 rw-by-pid system-wide r/w activity
409 syscall-counts system-wide syscall counts
410----
411
412You can now perform the record step via 'perf trace record':
413
414 # perf trace record syscall-counts
415
416and display the output using 'perf trace report':
417
418 # perf trace report syscall-counts
419
420STARTER SCRIPTS
421---------------
422
423You can quickly get started writing a script for a particular set of
424trace data by generating a skeleton script using 'perf trace -g
425python' in the same directory as an existing perf.data trace file.
426That will generate a starter script containing a handler for each of
427the event types in the trace file; it simply prints every available
428field for each event in the trace file.
429
430You can also look at the existing scripts in
431~/libexec/perf-core/scripts/python for typical examples showing how to
432do basic things like aggregate event data, print results, etc. Also,
433the check-perf-trace.py script, while not interesting for its results,
434attempts to exercise all of the main scripting features.
435
436EVENT HANDLERS
437--------------
438
439When perf trace is invoked using a trace script, a user-defined
440'handler function' is called for each event in the trace. If there's
441no handler function defined for a given event type, the event is
442ignored (or passed to a 'trace_unhandled' function, see below) and the
443next event is processed.
444
445Most of the event's field values are passed as arguments to the
446handler function; some of the less common ones aren't - those are
447available as calls back into the perf executable (see below).
448
449As an example, the following perf record command can be used to record
450all sched_wakeup events in the system:
451
452 # perf record -a -e sched:sched_wakeup
453
454Traces meant to be processed using a script should be recorded with
455the above option: -a to enable system-wide collection.
456
457The format file for the sched_wakeup event defines the following fields
458(see /sys/kernel/debug/tracing/events/sched/sched_wakeup/format):
459
460----
461 format:
462 field:unsigned short common_type;
463 field:unsigned char common_flags;
464 field:unsigned char common_preempt_count;
465 field:int common_pid;
466 field:int common_lock_depth;
467
468 field:char comm[TASK_COMM_LEN];
469 field:pid_t pid;
470 field:int prio;
471 field:int success;
472 field:int target_cpu;
473----
474
475The handler function for this event would be defined as:
476
477----
478def sched__sched_wakeup(event_name, context, common_cpu, common_secs,
479 common_nsecs, common_pid, common_comm,
480 comm, pid, prio, success, target_cpu):
481 pass
482----
483
484The handler function takes the form subsystem__event_name.
485
486The common_* arguments in the handler's argument list are the set of
487arguments passed to all event handlers; some of the fields correspond
488to the common_* fields in the format file, but some are synthesized,
489and some of the common_* fields aren't common enough to be passed
490to every event as arguments but are available as library functions.
491
492Here's a brief description of each of the invariant event args:
493
494 event_name the name of the event as text
495 context an opaque 'cookie' used in calls back into perf
496 common_cpu the cpu the event occurred on
497 common_secs the secs portion of the event timestamp
498 common_nsecs the nsecs portion of the event timestamp
499 common_pid the pid of the current task
500 common_comm the name of the current process
501
502All of the remaining fields in the event's format file have
503counterparts as handler function arguments of the same name, as can be
504seen in the example above.
505
506The above provides the basics needed to directly access every field of
507every event in a trace, which covers 90% of what you need to know to
508write a useful trace script. The sections below cover the rest.
509
510SCRIPT LAYOUT
511-------------
512
513Every perf trace Python script should start by setting up a Python
514module search path and 'import'ing a few support modules (see module
515descriptions below):
516
517----
518 import os
519 import sys
520
521 sys.path.append(os.environ['PERF_EXEC_PATH'] + \
522 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
523
524 from perf_trace_context import *
525 from Core import *
526----
527
528The rest of the script can contain handler functions and support
529functions in any order.
530
531Aside from the event handler functions discussed above, every script
532can implement a set of optional functions:
533
534*trace_begin*, if defined, is called before any event is processed and
535gives scripts a chance to do setup tasks:
536
537----
538def trace_begin():
539 pass
540----
541
542*trace_end*, if defined, is called after all events have been
543 processed and gives scripts a chance to do end-of-script tasks, such
544 as display results:
545
546----
547def trace_end():
548 pass
549----
550
551*trace_unhandled*, if defined, is called for any event that
552 doesn't have a handler explicitly defined for it. The standard set
553 of common arguments are passed into it:
554
555----
556def trace_unhandled(event_name, context, common_cpu, common_secs,
557 common_nsecs, common_pid, common_comm):
558 pass
559----
560
561The remaining sections provide descriptions of each of the available
562built-in perf trace Python modules and their associated functions.
563
564AVAILABLE MODULES AND FUNCTIONS
565-------------------------------
566
567The following sections describe the functions and variables available
568via the various perf trace Python modules. To use the functions and
569variables from the given module, add the corresponding 'from XXXX
570import' line to your perf trace script.
571
572Core.py Module
573~~~~~~~~~~~~~~
574
575These functions provide some essential functions to user scripts.
576
577The *flag_str* and *symbol_str* functions provide human-readable
578strings for flag and symbolic fields. These correspond to the strings
579and values parsed from the 'print fmt' fields of the event format
580files:
581
582 flag_str(event_name, field_name, field_value) - returns the string representation corresponding to field_value for the flag field field_name of event event_name
583 symbol_str(event_name, field_name, field_value) - returns the string representation corresponding to field_value for the symbolic field field_name of event event_name
584
585The *autodict* function returns a special kind of Python
586dictionary that implements Perl's 'autovivifying' hashes in Python
587i.e. with autovivifying hashes, you can assign nested hash values
588without having to go to the trouble of creating intermediate levels if
589they don't exist.
590
591 autodict() - returns an autovivifying dictionary instance
592
593
594perf_trace_context Module
595~~~~~~~~~~~~~~~~~~~~~~~~~
596
597Some of the 'common' fields in the event format file aren't all that
598common, but need to be made accessible to user scripts nonetheless.
599
600perf_trace_context defines a set of functions that can be used to
601access this data in the context of the current event. Each of these
602functions expects a context variable, which is the same as the
603context variable passed into every event handler as the second
604argument.
605
606 common_pc(context) - returns common_preempt_count for the current event
607 common_flags(context) - returns common_flags for the current event
608 common_lock_depth(context) - returns common_lock_depth for the current event
609
610Util.py Module
611~~~~~~~~~~~~~~
612
613Various utility functions for use with perf trace:
614
615 nsecs(secs, nsecs) - returns total nsecs given secs/nsecs pair
616 nsecs_secs(nsecs) - returns whole secs portion given nsecs
617 nsecs_nsecs(nsecs) - returns nsecs remainder given nsecs
618 nsecs_str(nsecs) - returns printable string in the form secs.nsecs
619 avg(total, n) - returns average given a sum and a total number of values
620
621SEE ALSO
622--------
623linkperf:perf-trace[1]
diff --git a/tools/perf/Documentation/perf-trace.txt b/tools/perf/Documentation/perf-trace.txt
index 60e5900da483..122ec9dc4853 100644
--- a/tools/perf/Documentation/perf-trace.txt
+++ b/tools/perf/Documentation/perf-trace.txt
@@ -1,5 +1,5 @@
1perf-trace(1) 1perf-trace(1)
2============== 2=============
3 3
4NAME 4NAME
5---- 5----
@@ -19,6 +19,11 @@ There are several variants of perf trace:
19 'perf trace' to see a detailed trace of the workload that was 19 'perf trace' to see a detailed trace of the workload that was
20 recorded. 20 recorded.
21 21
22 You can also run a set of pre-canned scripts that aggregate and
23 summarize the raw trace data in various ways (the list of scripts is
24 available via 'perf trace -l'). The following variants allow you to
25 record and run those scripts:
26
22 'perf trace record <script>' to record the events required for 'perf 27 'perf trace record <script>' to record the events required for 'perf
23 trace report'. <script> is the name displayed in the output of 28 trace report'. <script> is the name displayed in the output of
24 'perf trace --list' i.e. the actual script name minus any language 29 'perf trace --list' i.e. the actual script name minus any language
@@ -31,6 +36,9 @@ There are several variants of perf trace:
31 record <script>' is used and should be present for this command to 36 record <script>' is used and should be present for this command to
32 succeed. 37 succeed.
33 38
39 See the 'SEE ALSO' section for links to language-specific
40 information on how to write and run your own trace scripts.
41
34OPTIONS 42OPTIONS
35------- 43-------
36-D:: 44-D::
@@ -45,9 +53,11 @@ OPTIONS
45--list=:: 53--list=::
46 Display a list of available trace scripts. 54 Display a list of available trace scripts.
47 55
48-s:: 56-s ['lang']::
49--script=:: 57--script=::
50 Process trace data with the given script ([lang]:script[.ext]). 58 Process trace data with the given script ([lang]:script[.ext]).
59 If the string 'lang' is specified in place of a script name, a
60 list of supported languages will be displayed instead.
51 61
52-g:: 62-g::
53--gen-script=:: 63--gen-script=::
@@ -56,4 +66,5 @@ OPTIONS
56 66
57SEE ALSO 67SEE ALSO
58-------- 68--------
59linkperf:perf-record[1], linkperf:perf-trace-perl[1] 69linkperf:perf-record[1], linkperf:perf-trace-perl[1],
70linkperf:perf-trace-python[1]
diff --git a/tools/perf/Documentation/perf.txt b/tools/perf/Documentation/perf.txt
index 69c832557199..0eeb247dc7d2 100644
--- a/tools/perf/Documentation/perf.txt
+++ b/tools/perf/Documentation/perf.txt
@@ -12,7 +12,7 @@ SYNOPSIS
12 12
13DESCRIPTION 13DESCRIPTION
14----------- 14-----------
15Performance counters for Linux are are a new kernel-based subsystem 15Performance counters for Linux are a new kernel-based subsystem
16that provide a framework for all things performance analysis. It 16that provide a framework for all things performance analysis. It
17covers hardware level (CPU/PMU, Performance Monitoring Unit) features 17covers hardware level (CPU/PMU, Performance Monitoring Unit) features
18and software features (software counters, tracepoints) as well. 18and software features (software counters, tracepoints) as well.
diff --git a/tools/perf/Makefile b/tools/perf/Makefile
index 2e7fa3a06806..d75c28a825f5 100644
--- a/tools/perf/Makefile
+++ b/tools/perf/Makefile
@@ -1,3 +1,7 @@
1ifeq ("$(origin O)", "command line")
2 OUTPUT := $(O)/
3endif
4
1# The default target of this Makefile is... 5# The default target of this Makefile is...
2all:: 6all::
3 7
@@ -150,10 +154,17 @@ all::
150# Define LDFLAGS=-static to build a static binary. 154# Define LDFLAGS=-static to build a static binary.
151# 155#
152# Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds. 156# Define EXTRA_CFLAGS=-m64 or EXTRA_CFLAGS=-m32 as appropriate for cross-builds.
157#
158# Define NO_DWARF if you do not want debug-info analysis feature at all.
159
160$(shell sh -c 'mkdir -p $(OUTPUT)scripts/python/Perf-Trace-Util/' 2> /dev/null)
161$(shell sh -c 'mkdir -p $(OUTPUT)scripts/perl/Perf-Trace-Util/' 2> /dev/null)
162$(shell sh -c 'mkdir -p $(OUTPUT)util/scripting-engines/' 2> /dev/null)
163$(shell sh -c 'mkdir $(OUTPUT)bench' 2> /dev/null)
153 164
154PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE 165$(OUTPUT)PERF-VERSION-FILE: .FORCE-PERF-VERSION-FILE
155 @$(SHELL_PATH) util/PERF-VERSION-GEN 166 @$(SHELL_PATH) util/PERF-VERSION-GEN $(OUTPUT)
156-include PERF-VERSION-FILE 167-include $(OUTPUT)PERF-VERSION-FILE
157 168
158uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not') 169uname_S := $(shell sh -c 'uname -s 2>/dev/null || echo not')
159uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not') 170uname_M := $(shell sh -c 'uname -m 2>/dev/null || echo not')
@@ -162,6 +173,22 @@ uname_R := $(shell sh -c 'uname -r 2>/dev/null || echo not')
162uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not') 173uname_P := $(shell sh -c 'uname -p 2>/dev/null || echo not')
163uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not') 174uname_V := $(shell sh -c 'uname -v 2>/dev/null || echo not')
164 175
176ARCH ?= $(shell echo $(uname_M) | sed -e s/i.86/i386/ -e s/sun4u/sparc64/ \
177 -e s/arm.*/arm/ -e s/sa110/arm/ \
178 -e s/s390x/s390/ -e s/parisc64/parisc/ \
179 -e s/ppc.*/powerpc/ -e s/mips.*/mips/ \
180 -e s/sh[234].*/sh/ )
181
182# Additional ARCH settings for x86
183ifeq ($(ARCH),i386)
184 ARCH := x86
185endif
186ifeq ($(ARCH),x86_64)
187 ARCH := x86
188endif
189
190$(shell sh -c 'mkdir -p $(OUTPUT)arch/$(ARCH)/util/' 2> /dev/null)
191
165# CFLAGS and LDFLAGS are for the users to override from the command line. 192# CFLAGS and LDFLAGS are for the users to override from the command line.
166 193
167# 194#
@@ -200,7 +227,7 @@ endif
200 227
201CFLAGS = -ggdb3 -Wall -Wextra -std=gnu99 -Werror $(CFLAGS_OPTIMIZE) -D_FORTIFY_SOURCE=2 $(EXTRA_WARNINGS) $(EXTRA_CFLAGS) 228CFLAGS = -ggdb3 -Wall -Wextra -std=gnu99 -Werror $(CFLAGS_OPTIMIZE) -D_FORTIFY_SOURCE=2 $(EXTRA_WARNINGS) $(EXTRA_CFLAGS)
202EXTLIBS = -lpthread -lrt -lelf -lm 229EXTLIBS = -lpthread -lrt -lelf -lm
203ALL_CFLAGS = $(CFLAGS) 230ALL_CFLAGS = $(CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64
204ALL_LDFLAGS = $(LDFLAGS) 231ALL_LDFLAGS = $(LDFLAGS)
205STRIP ?= strip 232STRIP ?= strip
206 233
@@ -216,7 +243,10 @@ STRIP ?= strip
216# runtime figures out where they are based on the path to the executable. 243# runtime figures out where they are based on the path to the executable.
217# This can help installing the suite in a relocatable way. 244# This can help installing the suite in a relocatable way.
218 245
246# Make the path relative to DESTDIR, not to prefix
247ifndef DESTDIR
219prefix = $(HOME) 248prefix = $(HOME)
249endif
220bindir_relative = bin 250bindir_relative = bin
221bindir = $(prefix)/$(bindir_relative) 251bindir = $(prefix)/$(bindir_relative)
222mandir = share/man 252mandir = share/man
@@ -233,7 +263,6 @@ sysconfdir = $(prefix)/etc
233ETC_PERFCONFIG = etc/perfconfig 263ETC_PERFCONFIG = etc/perfconfig
234endif 264endif
235lib = lib 265lib = lib
236# DESTDIR=
237 266
238export prefix bindir sharedir sysconfdir 267export prefix bindir sharedir sysconfdir
239 268
@@ -272,7 +301,7 @@ endif
272# Those must not be GNU-specific; they are shared with perl/ which may 301# Those must not be GNU-specific; they are shared with perl/ which may
273# be built by a different compiler. (Note that this is an artifact now 302# be built by a different compiler. (Note that this is an artifact now
274# but it still might be nice to keep that distinction.) 303# but it still might be nice to keep that distinction.)
275BASIC_CFLAGS = -Iutil/include 304BASIC_CFLAGS = -Iutil/include -Iarch/$(ARCH)/include
276BASIC_LDFLAGS = 305BASIC_LDFLAGS =
277 306
278# Guard against environment variables 307# Guard against environment variables
@@ -286,11 +315,7 @@ SCRIPT_PERL =
286SCRIPT_SH = 315SCRIPT_SH =
287TEST_PROGRAMS = 316TEST_PROGRAMS =
288 317
289# 318SCRIPT_SH += perf-archive.sh
290# No scripts right now:
291#
292
293# SCRIPT_SH += perf-am.sh
294 319
295# 320#
296# No Perl scripts right now: 321# No Perl scripts right now:
@@ -310,20 +335,17 @@ PROGRAMS += $(EXTRA_PROGRAMS)
310# 335#
311# Single 'perf' binary right now: 336# Single 'perf' binary right now:
312# 337#
313PROGRAMS += perf 338PROGRAMS += $(OUTPUT)perf
314 339
315# List built-in command $C whose implementation cmd_$C() is not in 340# List built-in command $C whose implementation cmd_$C() is not in
316# builtin-$C.o but is linked in as part of some other command. 341# builtin-$C.o but is linked in as part of some other command.
317# 342#
318# None right now:
319#
320# BUILT_INS += perf-init $X
321 343
322# what 'all' will build and 'install' will install, in perfexecdir 344# what 'all' will build and 'install' will install, in perfexecdir
323ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS) 345ALL_PROGRAMS = $(PROGRAMS) $(SCRIPTS)
324 346
325# what 'all' will build but not install in perfexecdir 347# what 'all' will build but not install in perfexecdir
326OTHER_PROGRAMS = perf$X 348OTHER_PROGRAMS = $(OUTPUT)perf$X
327 349
328# Set paths to tools early so that they can be used for version tests. 350# Set paths to tools early so that they can be used for version tests.
329ifndef SHELL_PATH 351ifndef SHELL_PATH
@@ -335,11 +357,12 @@ endif
335 357
336export PERL_PATH 358export PERL_PATH
337 359
338LIB_FILE=libperf.a 360LIB_FILE=$(OUTPUT)libperf.a
339 361
340LIB_H += ../../include/linux/perf_event.h 362LIB_H += ../../include/linux/perf_event.h
341LIB_H += ../../include/linux/rbtree.h 363LIB_H += ../../include/linux/rbtree.h
342LIB_H += ../../include/linux/list.h 364LIB_H += ../../include/linux/list.h
365LIB_H += ../../include/linux/hash.h
343LIB_H += ../../include/linux/stringify.h 366LIB_H += ../../include/linux/stringify.h
344LIB_H += util/include/linux/bitmap.h 367LIB_H += util/include/linux/bitmap.h
345LIB_H += util/include/linux/bitops.h 368LIB_H += util/include/linux/bitops.h
@@ -354,21 +377,24 @@ LIB_H += util/include/linux/rbtree.h
354LIB_H += util/include/linux/string.h 377LIB_H += util/include/linux/string.h
355LIB_H += util/include/linux/types.h 378LIB_H += util/include/linux/types.h
356LIB_H += util/include/asm/asm-offsets.h 379LIB_H += util/include/asm/asm-offsets.h
357LIB_H += util/include/asm/bitops.h
358LIB_H += util/include/asm/bug.h 380LIB_H += util/include/asm/bug.h
359LIB_H += util/include/asm/byteorder.h 381LIB_H += util/include/asm/byteorder.h
382LIB_H += util/include/asm/hweight.h
360LIB_H += util/include/asm/swab.h 383LIB_H += util/include/asm/swab.h
361LIB_H += util/include/asm/system.h 384LIB_H += util/include/asm/system.h
362LIB_H += util/include/asm/uaccess.h 385LIB_H += util/include/asm/uaccess.h
386LIB_H += util/include/dwarf-regs.h
363LIB_H += perf.h 387LIB_H += perf.h
364LIB_H += util/cache.h 388LIB_H += util/cache.h
365LIB_H += util/callchain.h 389LIB_H += util/callchain.h
390LIB_H += util/build-id.h
366LIB_H += util/debug.h 391LIB_H += util/debug.h
367LIB_H += util/debugfs.h 392LIB_H += util/debugfs.h
368LIB_H += util/event.h 393LIB_H += util/event.h
369LIB_H += util/exec_cmd.h 394LIB_H += util/exec_cmd.h
370LIB_H += util/types.h 395LIB_H += util/types.h
371LIB_H += util/levenshtein.h 396LIB_H += util/levenshtein.h
397LIB_H += util/map.h
372LIB_H += util/parse-options.h 398LIB_H += util/parse-options.h
373LIB_H += util/parse-events.h 399LIB_H += util/parse-events.h
374LIB_H += util/quote.h 400LIB_H += util/quote.h
@@ -377,7 +403,6 @@ LIB_H += util/header.h
377LIB_H += util/help.h 403LIB_H += util/help.h
378LIB_H += util/session.h 404LIB_H += util/session.h
379LIB_H += util/strbuf.h 405LIB_H += util/strbuf.h
380LIB_H += util/string.h
381LIB_H += util/strlist.h 406LIB_H += util/strlist.h
382LIB_H += util/svghelper.h 407LIB_H += util/svghelper.h
383LIB_H += util/run-command.h 408LIB_H += util/run-command.h
@@ -389,77 +414,85 @@ LIB_H += util/sort.h
389LIB_H += util/hist.h 414LIB_H += util/hist.h
390LIB_H += util/thread.h 415LIB_H += util/thread.h
391LIB_H += util/trace-event.h 416LIB_H += util/trace-event.h
392LIB_H += util/trace-event-perl.h
393LIB_H += util/probe-finder.h 417LIB_H += util/probe-finder.h
394LIB_H += util/probe-event.h 418LIB_H += util/probe-event.h
395 419LIB_H += util/pstack.h
396LIB_OBJS += util/abspath.o 420LIB_H += util/cpumap.h
397LIB_OBJS += util/alias.o 421
398LIB_OBJS += util/config.o 422LIB_OBJS += $(OUTPUT)util/abspath.o
399LIB_OBJS += util/ctype.o 423LIB_OBJS += $(OUTPUT)util/alias.o
400LIB_OBJS += util/debugfs.o 424LIB_OBJS += $(OUTPUT)util/build-id.o
401LIB_OBJS += util/environment.o 425LIB_OBJS += $(OUTPUT)util/config.o
402LIB_OBJS += util/event.o 426LIB_OBJS += $(OUTPUT)util/ctype.o
403LIB_OBJS += util/exec_cmd.o 427LIB_OBJS += $(OUTPUT)util/debugfs.o
404LIB_OBJS += util/help.o 428LIB_OBJS += $(OUTPUT)util/environment.o
405LIB_OBJS += util/levenshtein.o 429LIB_OBJS += $(OUTPUT)util/event.o
406LIB_OBJS += util/parse-options.o 430LIB_OBJS += $(OUTPUT)util/exec_cmd.o
407LIB_OBJS += util/parse-events.o 431LIB_OBJS += $(OUTPUT)util/help.o
408LIB_OBJS += util/path.o 432LIB_OBJS += $(OUTPUT)util/levenshtein.o
409LIB_OBJS += util/rbtree.o 433LIB_OBJS += $(OUTPUT)util/parse-options.o
410LIB_OBJS += util/bitmap.o 434LIB_OBJS += $(OUTPUT)util/parse-events.o
411LIB_OBJS += util/hweight.o 435LIB_OBJS += $(OUTPUT)util/path.o
412LIB_OBJS += util/find_next_bit.o 436LIB_OBJS += $(OUTPUT)util/rbtree.o
413LIB_OBJS += util/run-command.o 437LIB_OBJS += $(OUTPUT)util/bitmap.o
414LIB_OBJS += util/quote.o 438LIB_OBJS += $(OUTPUT)util/hweight.o
415LIB_OBJS += util/strbuf.o 439LIB_OBJS += $(OUTPUT)util/run-command.o
416LIB_OBJS += util/string.o 440LIB_OBJS += $(OUTPUT)util/quote.o
417LIB_OBJS += util/strlist.o 441LIB_OBJS += $(OUTPUT)util/strbuf.o
418LIB_OBJS += util/usage.o 442LIB_OBJS += $(OUTPUT)util/string.o
419LIB_OBJS += util/wrapper.o 443LIB_OBJS += $(OUTPUT)util/strlist.o
420LIB_OBJS += util/sigchain.o 444LIB_OBJS += $(OUTPUT)util/usage.o
421LIB_OBJS += util/symbol.o 445LIB_OBJS += $(OUTPUT)util/wrapper.o
422LIB_OBJS += util/color.o 446LIB_OBJS += $(OUTPUT)util/sigchain.o
423LIB_OBJS += util/pager.o 447LIB_OBJS += $(OUTPUT)util/symbol.o
424LIB_OBJS += util/header.o 448LIB_OBJS += $(OUTPUT)util/color.o
425LIB_OBJS += util/callchain.o 449LIB_OBJS += $(OUTPUT)util/pager.o
426LIB_OBJS += util/values.o 450LIB_OBJS += $(OUTPUT)util/header.o
427LIB_OBJS += util/debug.o 451LIB_OBJS += $(OUTPUT)util/callchain.o
428LIB_OBJS += util/map.o 452LIB_OBJS += $(OUTPUT)util/values.o
429LIB_OBJS += util/session.o 453LIB_OBJS += $(OUTPUT)util/debug.o
430LIB_OBJS += util/thread.o 454LIB_OBJS += $(OUTPUT)util/map.o
431LIB_OBJS += util/trace-event-parse.o 455LIB_OBJS += $(OUTPUT)util/pstack.o
432LIB_OBJS += util/trace-event-read.o 456LIB_OBJS += $(OUTPUT)util/session.o
433LIB_OBJS += util/trace-event-info.o 457LIB_OBJS += $(OUTPUT)util/thread.o
434LIB_OBJS += util/trace-event-perl.o 458LIB_OBJS += $(OUTPUT)util/trace-event-parse.o
435LIB_OBJS += util/svghelper.o 459LIB_OBJS += $(OUTPUT)util/trace-event-read.o
436LIB_OBJS += util/sort.o 460LIB_OBJS += $(OUTPUT)util/trace-event-info.o
437LIB_OBJS += util/hist.o 461LIB_OBJS += $(OUTPUT)util/trace-event-scripting.o
438LIB_OBJS += util/data_map.o 462LIB_OBJS += $(OUTPUT)util/svghelper.o
439LIB_OBJS += util/probe-event.o 463LIB_OBJS += $(OUTPUT)util/sort.o
440 464LIB_OBJS += $(OUTPUT)util/hist.o
441BUILTIN_OBJS += builtin-annotate.o 465LIB_OBJS += $(OUTPUT)util/probe-event.o
442 466LIB_OBJS += $(OUTPUT)util/util.o
443BUILTIN_OBJS += builtin-bench.o 467LIB_OBJS += $(OUTPUT)util/cpumap.o
468
469BUILTIN_OBJS += $(OUTPUT)builtin-annotate.o
470
471BUILTIN_OBJS += $(OUTPUT)builtin-bench.o
444 472
445# Benchmark modules 473# Benchmark modules
446BUILTIN_OBJS += bench/sched-messaging.o 474BUILTIN_OBJS += $(OUTPUT)bench/sched-messaging.o
447BUILTIN_OBJS += bench/sched-pipe.o 475BUILTIN_OBJS += $(OUTPUT)bench/sched-pipe.o
448BUILTIN_OBJS += bench/mem-memcpy.o 476BUILTIN_OBJS += $(OUTPUT)bench/mem-memcpy.o
449 477
450BUILTIN_OBJS += builtin-diff.o 478BUILTIN_OBJS += $(OUTPUT)builtin-diff.o
451BUILTIN_OBJS += builtin-help.o 479BUILTIN_OBJS += $(OUTPUT)builtin-help.o
452BUILTIN_OBJS += builtin-sched.o 480BUILTIN_OBJS += $(OUTPUT)builtin-sched.o
453BUILTIN_OBJS += builtin-buildid-list.o 481BUILTIN_OBJS += $(OUTPUT)builtin-buildid-list.o
454BUILTIN_OBJS += builtin-list.o 482BUILTIN_OBJS += $(OUTPUT)builtin-buildid-cache.o
455BUILTIN_OBJS += builtin-record.o 483BUILTIN_OBJS += $(OUTPUT)builtin-list.o
456BUILTIN_OBJS += builtin-report.o 484BUILTIN_OBJS += $(OUTPUT)builtin-record.o
457BUILTIN_OBJS += builtin-stat.o 485BUILTIN_OBJS += $(OUTPUT)builtin-report.o
458BUILTIN_OBJS += builtin-timechart.o 486BUILTIN_OBJS += $(OUTPUT)builtin-stat.o
459BUILTIN_OBJS += builtin-top.o 487BUILTIN_OBJS += $(OUTPUT)builtin-timechart.o
460BUILTIN_OBJS += builtin-trace.o 488BUILTIN_OBJS += $(OUTPUT)builtin-top.o
461BUILTIN_OBJS += builtin-probe.o 489BUILTIN_OBJS += $(OUTPUT)builtin-trace.o
462BUILTIN_OBJS += builtin-kmem.o 490BUILTIN_OBJS += $(OUTPUT)builtin-probe.o
491BUILTIN_OBJS += $(OUTPUT)builtin-kmem.o
492BUILTIN_OBJS += $(OUTPUT)builtin-lock.o
493BUILTIN_OBJS += $(OUTPUT)builtin-kvm.o
494BUILTIN_OBJS += $(OUTPUT)builtin-test.o
495BUILTIN_OBJS += $(OUTPUT)builtin-inject.o
463 496
464PERFLIBS = $(LIB_FILE) 497PERFLIBS = $(LIB_FILE)
465 498
@@ -474,6 +507,15 @@ PERFLIBS = $(LIB_FILE)
474-include config.mak.autogen 507-include config.mak.autogen
475-include config.mak 508-include config.mak
476 509
510ifndef NO_DWARF
511ifneq ($(shell sh -c "(echo '\#include <dwarf.h>'; echo '\#include <libdw.h>'; echo '\#include <version.h>'; echo '\#ifndef _ELFUTILS_PREREQ'; echo '\#error'; echo '\#endif'; echo 'int main(void) { Dwarf *dbg; dbg = dwarf_begin(0, DWARF_C_READ); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -I/usr/include/elfutils -ldw -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y)
512 msg := $(warning No libdw.h found or old libdw.h found or elfutils is older than 0.138, disables dwarf support. Please install new elfutils-devel/libdw-dev);
513 NO_DWARF := 1
514endif # Dwarf support
515endif # NO_DWARF
516
517-include arch/$(ARCH)/Makefile
518
477ifeq ($(uname_S),Darwin) 519ifeq ($(uname_S),Darwin)
478 ifndef NO_FINK 520 ifndef NO_FINK
479 ifeq ($(shell test -d /sw/lib && echo y),y) 521 ifeq ($(shell test -d /sw/lib && echo y),y)
@@ -490,26 +532,45 @@ ifeq ($(uname_S),Darwin)
490 PTHREAD_LIBS = 532 PTHREAD_LIBS =
491endif 533endif
492 534
493ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) 535ifneq ($(OUTPUT),)
494ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) 536 BASIC_CFLAGS += -I$(OUTPUT)
537endif
538
539ifeq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y)
540ifneq ($(shell sh -c "(echo '\#include <gnu/libc-version.h>'; echo 'int main(void) { const char * version = gnu_get_libc_version(); return (long)version; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y)
495 msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static); 541 msg := $(error No gnu/libc-version.h found, please install glibc-dev[el]/glibc-static);
496endif 542endif
497 543
498 ifneq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ_MMAP, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) 544 ifneq ($(shell sh -c "(echo '\#include <libelf.h>'; echo 'int main(void) { Elf * elf = elf_begin(0, ELF_C_READ_MMAP, 0); return (long)elf; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y)
499 BASIC_CFLAGS += -DLIBELF_NO_MMAP 545 BASIC_CFLAGS += -DLIBELF_NO_MMAP
500 endif 546 endif
501else 547else
502 msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]); 548 msg := $(error No libelf.h/libelf found, please install libelf-dev/elfutils-libelf-devel and glibc-dev[el]);
503endif 549endif
504 550
505ifneq ($(shell sh -c "(echo '\#ifndef _MIPS_SZLONG'; echo '\#define _MIPS_SZLONG 0'; echo '\#endif'; echo '\#include <dwarf.h>'; echo '\#include <libdwarf.h>'; echo 'int main(void) { Dwarf_Debug dbg; Dwarf_Error err; Dwarf_Ranges *rng; dwarf_init(0, DW_DLC_READ, 0, 0, &dbg, &err); dwarf_get_ranges(dbg, 0, &rng, 0, 0, &err); return (long)dbg; }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -I/usr/include/libdwarf -ldwarf -lelf -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y) 551ifndef NO_DWARF
506 msg := $(warning No libdwarf.h found or old libdwarf.h found, disables dwarf support. Please install libdwarf-dev/libdwarf-devel >= 20081231); 552ifeq ($(origin PERF_HAVE_DWARF_REGS), undefined)
507 BASIC_CFLAGS += -DNO_LIBDWARF 553 msg := $(warning DWARF register mappings have not been defined for architecture $(ARCH), DWARF support disabled);
508else 554else
509 BASIC_CFLAGS += -I/usr/include/libdwarf 555 BASIC_CFLAGS += -I/usr/include/elfutils -DDWARF_SUPPORT
510 EXTLIBS += -lelf -ldwarf 556 EXTLIBS += -lelf -ldw
511 LIB_OBJS += util/probe-finder.o 557 LIB_OBJS += $(OUTPUT)util/probe-finder.o
558endif # PERF_HAVE_DWARF_REGS
559endif # NO_DWARF
560
561ifdef NO_NEWT
562 BASIC_CFLAGS += -DNO_NEWT_SUPPORT
563else
564ifneq ($(shell sh -c "(echo '\#include <newt.h>'; echo 'int main(void) { newtInit(); newtCls(); return newtFinished(); }') | $(CC) -x c - $(ALL_CFLAGS) -D_LARGEFILE64_SOURCE -D_FILE_OFFSET_BITS=64 -lnewt -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) "$(QUIET_STDERR)" && echo y"), y)
565 msg := $(warning newt not found, disables TUI support. Please install newt-devel or libnewt-dev);
566 BASIC_CFLAGS += -DNO_NEWT_SUPPORT
567else
568 # Fedora has /usr/include/slang/slang.h, but ubuntu /usr/include/slang.h
569 BASIC_CFLAGS += -I/usr/include/slang
570 EXTLIBS += -lnewt -lslang
571 LIB_OBJS += $(OUTPUT)util/newt.o
512endif 572endif
573endif # NO_NEWT
513 574
514ifndef NO_LIBPERL 575ifndef NO_LIBPERL
515PERL_EMBED_LDOPTS = `perl -MExtUtils::Embed -e ldopts 2>/dev/null` 576PERL_EMBED_LDOPTS = `perl -MExtUtils::Embed -e ldopts 2>/dev/null`
@@ -520,32 +581,51 @@ ifneq ($(shell sh -c "(echo '\#include <EXTERN.h>'; echo '\#include <perl.h>'; e
520 BASIC_CFLAGS += -DNO_LIBPERL 581 BASIC_CFLAGS += -DNO_LIBPERL
521else 582else
522 ALL_LDFLAGS += $(PERL_EMBED_LDOPTS) 583 ALL_LDFLAGS += $(PERL_EMBED_LDOPTS)
523 LIB_OBJS += scripts/perl/Perf-Trace-Util/Context.o 584 LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-perl.o
585 LIB_OBJS += $(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o
586endif
587
588ifndef NO_LIBPYTHON
589PYTHON_EMBED_LDOPTS = `python-config --ldflags 2>/dev/null`
590PYTHON_EMBED_CCOPTS = `python-config --cflags 2>/dev/null`
591endif
592
593ifneq ($(shell sh -c "(echo '\#include <Python.h>'; echo 'int main(void) { Py_Initialize(); return 0; }') | $(CC) -x c - $(PYTHON_EMBED_CCOPTS) -o $(BITBUCKET) $(PYTHON_EMBED_LDOPTS) > /dev/null 2>&1 && echo y"), y)
594 BASIC_CFLAGS += -DNO_LIBPYTHON
595else
596 ALL_LDFLAGS += $(PYTHON_EMBED_LDOPTS)
597 LIB_OBJS += $(OUTPUT)util/scripting-engines/trace-event-python.o
598 LIB_OBJS += $(OUTPUT)scripts/python/Perf-Trace-Util/Context.o
524endif 599endif
525 600
526ifdef NO_DEMANGLE 601ifdef NO_DEMANGLE
527 BASIC_CFLAGS += -DNO_DEMANGLE 602 BASIC_CFLAGS += -DNO_DEMANGLE
528else 603else
529 has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y") 604 ifdef HAVE_CPLUS_DEMANGLE
530 605 EXTLIBS += -liberty
531 ifeq ($(has_bfd),y) 606 BASIC_CFLAGS += -DHAVE_CPLUS_DEMANGLE
532 EXTLIBS += -lbfd
533 else 607 else
534 has_bfd_iberty := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd -liberty "$(QUIET_STDERR)" && echo y") 608 has_bfd := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd "$(QUIET_STDERR)" && echo y")
535 ifeq ($(has_bfd_iberty),y) 609
536 EXTLIBS += -lbfd -liberty 610 ifeq ($(has_bfd),y)
611 EXTLIBS += -lbfd
537 else 612 else
538 has_bfd_iberty_z := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd -liberty -lz "$(QUIET_STDERR)" && echo y") 613 has_bfd_iberty := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd -liberty "$(QUIET_STDERR)" && echo y")
539 ifeq ($(has_bfd_iberty_z),y) 614 ifeq ($(has_bfd_iberty),y)
540 EXTLIBS += -lbfd -liberty -lz 615 EXTLIBS += -lbfd -liberty
541 else 616 else
542 has_cplus_demangle := $(shell sh -c "(echo 'extern char *cplus_demangle(const char *, int);'; echo 'int main(void) { cplus_demangle(0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -liberty "$(QUIET_STDERR)" && echo y") 617 has_bfd_iberty_z := $(shell sh -c "(echo '\#include <bfd.h>'; echo 'int main(void) { bfd_demangle(0, 0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -lbfd -liberty -lz "$(QUIET_STDERR)" && echo y")
543 ifeq ($(has_cplus_demangle),y) 618 ifeq ($(has_bfd_iberty_z),y)
544 EXTLIBS += -liberty 619 EXTLIBS += -lbfd -liberty -lz
545 BASIC_CFLAGS += -DHAVE_CPLUS_DEMANGLE
546 else 620 else
547 msg := $(warning No bfd.h/libbfd found, install binutils-dev[el]/zlib-static to gain symbol demangling) 621 has_cplus_demangle := $(shell sh -c "(echo 'extern char *cplus_demangle(const char *, int);'; echo 'int main(void) { cplus_demangle(0, 0); return 0; }') | $(CC) -x c - $(ALL_CFLAGS) -o $(BITBUCKET) $(ALL_LDFLAGS) $(EXTLIBS) -liberty "$(QUIET_STDERR)" && echo y")
548 BASIC_CFLAGS += -DNO_DEMANGLE 622 ifeq ($(has_cplus_demangle),y)
623 EXTLIBS += -liberty
624 BASIC_CFLAGS += -DHAVE_CPLUS_DEMANGLE
625 else
626 msg := $(warning No bfd.h/libbfd found, install binutils-dev[el]/zlib-static to gain symbol demangling)
627 BASIC_CFLAGS += -DNO_DEMANGLE
628 endif
549 endif 629 endif
550 endif 630 endif
551 endif 631 endif
@@ -591,53 +671,53 @@ ifdef NO_C99_FORMAT
591endif 671endif
592ifdef SNPRINTF_RETURNS_BOGUS 672ifdef SNPRINTF_RETURNS_BOGUS
593 COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS 673 COMPAT_CFLAGS += -DSNPRINTF_RETURNS_BOGUS
594 COMPAT_OBJS += compat/snprintf.o 674 COMPAT_OBJS += $(OUTPUT)compat/snprintf.o
595endif 675endif
596ifdef FREAD_READS_DIRECTORIES 676ifdef FREAD_READS_DIRECTORIES
597 COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES 677 COMPAT_CFLAGS += -DFREAD_READS_DIRECTORIES
598 COMPAT_OBJS += compat/fopen.o 678 COMPAT_OBJS += $(OUTPUT)compat/fopen.o
599endif 679endif
600ifdef NO_SYMLINK_HEAD 680ifdef NO_SYMLINK_HEAD
601 BASIC_CFLAGS += -DNO_SYMLINK_HEAD 681 BASIC_CFLAGS += -DNO_SYMLINK_HEAD
602endif 682endif
603ifdef NO_STRCASESTR 683ifdef NO_STRCASESTR
604 COMPAT_CFLAGS += -DNO_STRCASESTR 684 COMPAT_CFLAGS += -DNO_STRCASESTR
605 COMPAT_OBJS += compat/strcasestr.o 685 COMPAT_OBJS += $(OUTPUT)compat/strcasestr.o
606endif 686endif
607ifdef NO_STRTOUMAX 687ifdef NO_STRTOUMAX
608 COMPAT_CFLAGS += -DNO_STRTOUMAX 688 COMPAT_CFLAGS += -DNO_STRTOUMAX
609 COMPAT_OBJS += compat/strtoumax.o 689 COMPAT_OBJS += $(OUTPUT)compat/strtoumax.o
610endif 690endif
611ifdef NO_STRTOULL 691ifdef NO_STRTOULL
612 COMPAT_CFLAGS += -DNO_STRTOULL 692 COMPAT_CFLAGS += -DNO_STRTOULL
613endif 693endif
614ifdef NO_SETENV 694ifdef NO_SETENV
615 COMPAT_CFLAGS += -DNO_SETENV 695 COMPAT_CFLAGS += -DNO_SETENV
616 COMPAT_OBJS += compat/setenv.o 696 COMPAT_OBJS += $(OUTPUT)compat/setenv.o
617endif 697endif
618ifdef NO_MKDTEMP 698ifdef NO_MKDTEMP
619 COMPAT_CFLAGS += -DNO_MKDTEMP 699 COMPAT_CFLAGS += -DNO_MKDTEMP
620 COMPAT_OBJS += compat/mkdtemp.o 700 COMPAT_OBJS += $(OUTPUT)compat/mkdtemp.o
621endif 701endif
622ifdef NO_UNSETENV 702ifdef NO_UNSETENV
623 COMPAT_CFLAGS += -DNO_UNSETENV 703 COMPAT_CFLAGS += -DNO_UNSETENV
624 COMPAT_OBJS += compat/unsetenv.o 704 COMPAT_OBJS += $(OUTPUT)compat/unsetenv.o
625endif 705endif
626ifdef NO_SYS_SELECT_H 706ifdef NO_SYS_SELECT_H
627 BASIC_CFLAGS += -DNO_SYS_SELECT_H 707 BASIC_CFLAGS += -DNO_SYS_SELECT_H
628endif 708endif
629ifdef NO_MMAP 709ifdef NO_MMAP
630 COMPAT_CFLAGS += -DNO_MMAP 710 COMPAT_CFLAGS += -DNO_MMAP
631 COMPAT_OBJS += compat/mmap.o 711 COMPAT_OBJS += $(OUTPUT)compat/mmap.o
632else 712else
633 ifdef USE_WIN32_MMAP 713 ifdef USE_WIN32_MMAP
634 COMPAT_CFLAGS += -DUSE_WIN32_MMAP 714 COMPAT_CFLAGS += -DUSE_WIN32_MMAP
635 COMPAT_OBJS += compat/win32mmap.o 715 COMPAT_OBJS += $(OUTPUT)compat/win32mmap.o
636 endif 716 endif
637endif 717endif
638ifdef NO_PREAD 718ifdef NO_PREAD
639 COMPAT_CFLAGS += -DNO_PREAD 719 COMPAT_CFLAGS += -DNO_PREAD
640 COMPAT_OBJS += compat/pread.o 720 COMPAT_OBJS += $(OUTPUT)compat/pread.o
641endif 721endif
642ifdef NO_FAST_WORKING_DIRECTORY 722ifdef NO_FAST_WORKING_DIRECTORY
643 BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY 723 BASIC_CFLAGS += -DNO_FAST_WORKING_DIRECTORY
@@ -659,10 +739,10 @@ else
659endif 739endif
660endif 740endif
661ifdef NO_INET_NTOP 741ifdef NO_INET_NTOP
662 LIB_OBJS += compat/inet_ntop.o 742 LIB_OBJS += $(OUTPUT)compat/inet_ntop.o
663endif 743endif
664ifdef NO_INET_PTON 744ifdef NO_INET_PTON
665 LIB_OBJS += compat/inet_pton.o 745 LIB_OBJS += $(OUTPUT)compat/inet_pton.o
666endif 746endif
667 747
668ifdef NO_ICONV 748ifdef NO_ICONV
@@ -679,15 +759,15 @@ endif
679 759
680ifdef PPC_SHA1 760ifdef PPC_SHA1
681 SHA1_HEADER = "ppc/sha1.h" 761 SHA1_HEADER = "ppc/sha1.h"
682 LIB_OBJS += ppc/sha1.o ppc/sha1ppc.o 762 LIB_OBJS += $(OUTPUT)ppc/sha1.o ppc/sha1ppc.o
683else 763else
684ifdef ARM_SHA1 764ifdef ARM_SHA1
685 SHA1_HEADER = "arm/sha1.h" 765 SHA1_HEADER = "arm/sha1.h"
686 LIB_OBJS += arm/sha1.o arm/sha1_arm.o 766 LIB_OBJS += $(OUTPUT)arm/sha1.o $(OUTPUT)arm/sha1_arm.o
687else 767else
688ifdef MOZILLA_SHA1 768ifdef MOZILLA_SHA1
689 SHA1_HEADER = "mozilla-sha1/sha1.h" 769 SHA1_HEADER = "mozilla-sha1/sha1.h"
690 LIB_OBJS += mozilla-sha1/sha1.o 770 LIB_OBJS += $(OUTPUT)mozilla-sha1/sha1.o
691else 771else
692 SHA1_HEADER = <openssl/sha.h> 772 SHA1_HEADER = <openssl/sha.h>
693 EXTLIBS += $(LIB_4_CRYPTO) 773 EXTLIBS += $(LIB_4_CRYPTO)
@@ -699,15 +779,15 @@ ifdef NO_PERL_MAKEMAKER
699endif 779endif
700ifdef NO_HSTRERROR 780ifdef NO_HSTRERROR
701 COMPAT_CFLAGS += -DNO_HSTRERROR 781 COMPAT_CFLAGS += -DNO_HSTRERROR
702 COMPAT_OBJS += compat/hstrerror.o 782 COMPAT_OBJS += $(OUTPUT)compat/hstrerror.o
703endif 783endif
704ifdef NO_MEMMEM 784ifdef NO_MEMMEM
705 COMPAT_CFLAGS += -DNO_MEMMEM 785 COMPAT_CFLAGS += -DNO_MEMMEM
706 COMPAT_OBJS += compat/memmem.o 786 COMPAT_OBJS += $(OUTPUT)compat/memmem.o
707endif 787endif
708ifdef INTERNAL_QSORT 788ifdef INTERNAL_QSORT
709 COMPAT_CFLAGS += -DINTERNAL_QSORT 789 COMPAT_CFLAGS += -DINTERNAL_QSORT
710 COMPAT_OBJS += compat/qsort.o 790 COMPAT_OBJS += $(OUTPUT)compat/qsort.o
711endif 791endif
712ifdef RUNTIME_PREFIX 792ifdef RUNTIME_PREFIX
713 COMPAT_CFLAGS += -DRUNTIME_PREFIX 793 COMPAT_CFLAGS += -DRUNTIME_PREFIX
@@ -787,7 +867,7 @@ export TAR INSTALL DESTDIR SHELL_PATH
787 867
788SHELL = $(SHELL_PATH) 868SHELL = $(SHELL_PATH)
789 869
790all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) PERF-BUILD-OPTIONS 870all:: .perf.dev.null shell_compatibility_test $(ALL_PROGRAMS) $(BUILT_INS) $(OTHER_PROGRAMS) $(OUTPUT)PERF-BUILD-OPTIONS
791ifneq (,$X) 871ifneq (,$X)
792 $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';) 872 $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), test '$p' -ef '$p$X' || $(RM) '$p';)
793endif 873endif
@@ -799,39 +879,39 @@ please_set_SHELL_PATH_to_a_more_modern_shell:
799 879
800shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell 880shell_compatibility_test: please_set_SHELL_PATH_to_a_more_modern_shell
801 881
802strip: $(PROGRAMS) perf$X 882strip: $(PROGRAMS) $(OUTPUT)perf$X
803 $(STRIP) $(STRIP_OPTS) $(PROGRAMS) perf$X 883 $(STRIP) $(STRIP_OPTS) $(PROGRAMS) $(OUTPUT)perf$X
804 884
805perf.o: perf.c common-cmds.h PERF-CFLAGS 885$(OUTPUT)perf.o: perf.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS
806 $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \ 886 $(QUIET_CC)$(CC) -DPERF_VERSION='"$(PERF_VERSION)"' \
807 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ 887 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \
808 $(ALL_CFLAGS) -c $(filter %.c,$^) 888 $(ALL_CFLAGS) -c $(filter %.c,$^) -o $@
809 889
810perf$X: perf.o $(BUILTIN_OBJS) $(PERFLIBS) 890$(OUTPUT)perf$X: $(OUTPUT)perf.o $(BUILTIN_OBJS) $(PERFLIBS)
811 $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ perf.o \ 891 $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(OUTPUT)perf.o \
812 $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS) 892 $(BUILTIN_OBJS) $(ALL_LDFLAGS) $(LIBS)
813 893
814builtin-help.o: builtin-help.c common-cmds.h PERF-CFLAGS 894$(OUTPUT)builtin-help.o: builtin-help.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS
815 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ 895 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \
816 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ 896 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \
817 '-DPERF_MAN_PATH="$(mandir_SQ)"' \ 897 '-DPERF_MAN_PATH="$(mandir_SQ)"' \
818 '-DPERF_INFO_PATH="$(infodir_SQ)"' $< 898 '-DPERF_INFO_PATH="$(infodir_SQ)"' $<
819 899
820builtin-timechart.o: builtin-timechart.c common-cmds.h PERF-CFLAGS 900$(OUTPUT)builtin-timechart.o: builtin-timechart.c $(OUTPUT)common-cmds.h $(OUTPUT)PERF-CFLAGS
821 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ 901 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \
822 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \ 902 '-DPERF_HTML_PATH="$(htmldir_SQ)"' \
823 '-DPERF_MAN_PATH="$(mandir_SQ)"' \ 903 '-DPERF_MAN_PATH="$(mandir_SQ)"' \
824 '-DPERF_INFO_PATH="$(infodir_SQ)"' $< 904 '-DPERF_INFO_PATH="$(infodir_SQ)"' $<
825 905
826$(BUILT_INS): perf$X 906$(BUILT_INS): $(OUTPUT)perf$X
827 $(QUIET_BUILT_IN)$(RM) $@ && \ 907 $(QUIET_BUILT_IN)$(RM) $@ && \
828 ln perf$X $@ 2>/dev/null || \ 908 ln perf$X $@ 2>/dev/null || \
829 ln -s perf$X $@ 2>/dev/null || \ 909 ln -s perf$X $@ 2>/dev/null || \
830 cp perf$X $@ 910 cp perf$X $@
831 911
832common-cmds.h: util/generate-cmdlist.sh command-list.txt 912$(OUTPUT)common-cmds.h: util/generate-cmdlist.sh command-list.txt
833 913
834common-cmds.h: $(wildcard Documentation/perf-*.txt) 914$(OUTPUT)common-cmds.h: $(wildcard Documentation/perf-*.txt)
835 $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@ 915 $(QUIET_GEN). util/generate-cmdlist.sh > $@+ && mv $@+ $@
836 916
837$(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh 917$(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh
@@ -843,7 +923,7 @@ $(patsubst %.sh,%,$(SCRIPT_SH)) : % : %.sh
843 -e 's/@@NO_CURL@@/$(NO_CURL)/g' \ 923 -e 's/@@NO_CURL@@/$(NO_CURL)/g' \
844 $@.sh >$@+ && \ 924 $@.sh >$@+ && \
845 chmod +x $@+ && \ 925 chmod +x $@+ && \
846 mv $@+ $@ 926 mv $@+ $(OUTPUT)$@
847 927
848configure: configure.ac 928configure: configure.ac
849 $(QUIET_GEN)$(RM) $@ $<+ && \ 929 $(QUIET_GEN)$(RM) $@ $<+ && \
@@ -853,54 +933,50 @@ configure: configure.ac
853 $(RM) $<+ 933 $(RM) $<+
854 934
855# These can record PERF_VERSION 935# These can record PERF_VERSION
856perf.o perf.spec \ 936$(OUTPUT)perf.o perf.spec \
857 $(patsubst %.sh,%,$(SCRIPT_SH)) \ 937 $(patsubst %.sh,%,$(SCRIPT_SH)) \
858 $(patsubst %.perl,%,$(SCRIPT_PERL)) \ 938 $(patsubst %.perl,%,$(SCRIPT_PERL)) \
859 : PERF-VERSION-FILE 939 : $(OUTPUT)PERF-VERSION-FILE
860 940
861%.o: %.c PERF-CFLAGS 941$(OUTPUT)%.o: %.c $(OUTPUT)PERF-CFLAGS
862 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< 942 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $<
863%.s: %.c PERF-CFLAGS 943$(OUTPUT)%.s: %.c $(OUTPUT)PERF-CFLAGS
864 $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $< 944 $(QUIET_CC)$(CC) -S $(ALL_CFLAGS) $<
865%.o: %.S 945$(OUTPUT)%.o: %.S
866 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) $< 946 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $<
867 947
868util/exec_cmd.o: util/exec_cmd.c PERF-CFLAGS 948$(OUTPUT)util/exec_cmd.o: util/exec_cmd.c $(OUTPUT)PERF-CFLAGS
869 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) \ 949 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) \
870 '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \ 950 '-DPERF_EXEC_PATH="$(perfexecdir_SQ)"' \
871 '-DBINDIR="$(bindir_relative_SQ)"' \ 951 '-DBINDIR="$(bindir_relative_SQ)"' \
872 '-DPREFIX="$(prefix_SQ)"' \ 952 '-DPREFIX="$(prefix_SQ)"' \
873 $< 953 $<
874 954
875builtin-init-db.o: builtin-init-db.c PERF-CFLAGS 955$(OUTPUT)builtin-init-db.o: builtin-init-db.c $(OUTPUT)PERF-CFLAGS
876 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $< 956 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DDEFAULT_PERF_TEMPLATE_DIR='"$(template_dir_SQ)"' $<
877
878util/config.o: util/config.c PERF-CFLAGS
879 $(QUIET_CC)$(CC) -o $*.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $<
880 957
881util/rbtree.o: ../../lib/rbtree.c PERF-CFLAGS 958$(OUTPUT)util/config.o: util/config.c $(OUTPUT)PERF-CFLAGS
882 $(QUIET_CC)$(CC) -o util/rbtree.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< 959 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $<
883 960
884# some perf warning policies can't fit to lib/bitmap.c, eg: it warns about variable shadowing 961$(OUTPUT)util/newt.o: util/newt.c $(OUTPUT)PERF-CFLAGS
885# from <string.h> that comes from kernel headers wrapping. 962 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DENABLE_SLFUTURE_CONST $<
886KBITMAP_FLAGS=`echo $(ALL_CFLAGS) | sed s/-Wshadow// | sed s/-Wswitch-default// | sed s/-Wextra//`
887 963
888util/bitmap.o: ../../lib/bitmap.c PERF-CFLAGS 964$(OUTPUT)util/rbtree.o: ../../lib/rbtree.c $(OUTPUT)PERF-CFLAGS
889 $(QUIET_CC)$(CC) -o util/bitmap.o -c $(KBITMAP_FLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< 965 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $<
890 966
891util/hweight.o: ../../lib/hweight.c PERF-CFLAGS 967$(OUTPUT)util/scripting-engines/trace-event-perl.o: util/scripting-engines/trace-event-perl.c $(OUTPUT)PERF-CFLAGS
892 $(QUIET_CC)$(CC) -o util/hweight.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< 968 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $<
893 969
894util/find_next_bit.o: ../../lib/find_next_bit.c PERF-CFLAGS 970$(OUTPUT)scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS
895 $(QUIET_CC)$(CC) -o util/find_next_bit.o -c $(ALL_CFLAGS) -DETC_PERFCONFIG='"$(ETC_PERFCONFIG_SQ)"' $< 971 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $<
896 972
897util/trace-event-perl.o: util/trace-event-perl.c PERF-CFLAGS 973$(OUTPUT)util/scripting-engines/trace-event-python.o: util/scripting-engines/trace-event-python.c $(OUTPUT)PERF-CFLAGS
898 $(QUIET_CC)$(CC) -o util/trace-event-perl.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $< 974 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-shadow $<
899 975
900scripts/perl/Perf-Trace-Util/Context.o: scripts/perl/Perf-Trace-Util/Context.c PERF-CFLAGS 976$(OUTPUT)scripts/python/Perf-Trace-Util/Context.o: scripts/python/Perf-Trace-Util/Context.c $(OUTPUT)PERF-CFLAGS
901 $(QUIET_CC)$(CC) -o scripts/perl/Perf-Trace-Util/Context.o -c $(ALL_CFLAGS) $(PERL_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $< 977 $(QUIET_CC)$(CC) -o $@ -c $(ALL_CFLAGS) $(PYTHON_EMBED_CCOPTS) -Wno-redundant-decls -Wno-strict-prototypes -Wno-unused-parameter -Wno-nested-externs $<
902 978
903perf-%$X: %.o $(PERFLIBS) 979$(OUTPUT)perf-%$X: %.o $(PERFLIBS)
904 $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS) 980 $(QUIET_LINK)$(CC) $(ALL_CFLAGS) -o $@ $(ALL_LDFLAGS) $(filter %.o,$^) $(LIBS)
905 981
906$(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H) 982$(LIB_OBJS) $(BUILTIN_OBJS): $(LIB_H)
@@ -941,17 +1017,17 @@ cscope:
941TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\ 1017TRACK_CFLAGS = $(subst ','\'',$(ALL_CFLAGS)):\
942 $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ) 1018 $(bindir_SQ):$(perfexecdir_SQ):$(template_dir_SQ):$(prefix_SQ)
943 1019
944PERF-CFLAGS: .FORCE-PERF-CFLAGS 1020$(OUTPUT)PERF-CFLAGS: .FORCE-PERF-CFLAGS
945 @FLAGS='$(TRACK_CFLAGS)'; \ 1021 @FLAGS='$(TRACK_CFLAGS)'; \
946 if test x"$$FLAGS" != x"`cat PERF-CFLAGS 2>/dev/null`" ; then \ 1022 if test x"$$FLAGS" != x"`cat $(OUTPUT)PERF-CFLAGS 2>/dev/null`" ; then \
947 echo 1>&2 " * new build flags or prefix"; \ 1023 echo 1>&2 " * new build flags or prefix"; \
948 echo "$$FLAGS" >PERF-CFLAGS; \ 1024 echo "$$FLAGS" >$(OUTPUT)PERF-CFLAGS; \
949 fi 1025 fi
950 1026
951# We need to apply sq twice, once to protect from the shell 1027# We need to apply sq twice, once to protect from the shell
952# that runs PERF-BUILD-OPTIONS, and then again to protect it 1028# that runs $(OUTPUT)PERF-BUILD-OPTIONS, and then again to protect it
953# and the first level quoting from the shell that runs "echo". 1029# and the first level quoting from the shell that runs "echo".
954PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS 1030$(OUTPUT)PERF-BUILD-OPTIONS: .FORCE-PERF-BUILD-OPTIONS
955 @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@ 1031 @echo SHELL_PATH=\''$(subst ','\'',$(SHELL_PATH_SQ))'\' >$@
956 @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@ 1032 @echo TAR=\''$(subst ','\'',$(subst ','\'',$(TAR)))'\' >>$@
957 @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@ 1033 @echo NO_CURL=\''$(subst ','\'',$(subst ','\'',$(NO_CURL)))'\' >>$@
@@ -972,7 +1048,7 @@ all:: $(TEST_PROGRAMS)
972 1048
973export NO_SVN_TESTS 1049export NO_SVN_TESTS
974 1050
975check: common-cmds.h 1051check: $(OUTPUT)common-cmds.h
976 if sparse; \ 1052 if sparse; \
977 then \ 1053 then \
978 for i in *.c */*.c; \ 1054 for i in *.c */*.c; \
@@ -1006,17 +1082,24 @@ export perfexec_instdir
1006 1082
1007install: all 1083install: all
1008 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)' 1084 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(bindir_SQ)'
1009 $(INSTALL) perf$X '$(DESTDIR_SQ)$(bindir_SQ)' 1085 $(INSTALL) $(OUTPUT)perf$X '$(DESTDIR_SQ)$(bindir_SQ)'
1010 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' 1086 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace'
1011 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' 1087 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin'
1088 $(INSTALL) $(OUTPUT)perf-archive -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)'
1012 $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace' 1089 $(INSTALL) scripts/perl/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/Perf-Trace-Util/lib/Perf/Trace'
1013 $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl' 1090 $(INSTALL) scripts/perl/*.pl -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl'
1014 $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin' 1091 $(INSTALL) scripts/perl/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/perl/bin'
1092 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/python/Perf-Trace-Util/lib/Perf/Trace'
1093 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/python/bin'
1094 $(INSTALL) scripts/python/Perf-Trace-Util/lib/Perf/Trace/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/python/Perf-Trace-Util/lib/Perf/Trace'
1095 $(INSTALL) scripts/python/*.py -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/python'
1096 $(INSTALL) scripts/python/bin/* -t '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/scripts/python/bin'
1097
1015ifdef BUILT_INS 1098ifdef BUILT_INS
1016 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' 1099 $(INSTALL) -d -m 755 '$(DESTDIR_SQ)$(perfexec_instdir_SQ)'
1017 $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)' 1100 $(INSTALL) $(BUILT_INS) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)'
1018ifneq (,$X) 1101ifneq (,$X)
1019 $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';) 1102 $(foreach p,$(patsubst %$X,%,$(filter %$X,$(ALL_PROGRAMS) $(BUILT_INS) $(OUTPUT)perf$X)), $(RM) '$(DESTDIR_SQ)$(perfexec_instdir_SQ)/$p';)
1020endif 1103endif
1021endif 1104endif
1022 1105
@@ -1100,14 +1183,14 @@ clean:
1100 $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE) 1183 $(RM) *.o */*.o */*/*.o */*/*/*.o $(LIB_FILE)
1101 $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X 1184 $(RM) $(ALL_PROGRAMS) $(BUILT_INS) perf$X
1102 $(RM) $(TEST_PROGRAMS) 1185 $(RM) $(TEST_PROGRAMS)
1103 $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo common-cmds.h TAGS tags cscope* 1186 $(RM) *.spec *.pyc *.pyo */*.pyc */*.pyo $(OUTPUT)common-cmds.h TAGS tags cscope*
1104 $(RM) -r autom4te.cache 1187 $(RM) -r autom4te.cache
1105 $(RM) config.log config.mak.autogen config.mak.append config.status config.cache 1188 $(RM) config.log config.mak.autogen config.mak.append config.status config.cache
1106 $(RM) -r $(PERF_TARNAME) .doc-tmp-dir 1189 $(RM) -r $(PERF_TARNAME) .doc-tmp-dir
1107 $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz 1190 $(RM) $(PERF_TARNAME).tar.gz perf-core_$(PERF_VERSION)-*.tar.gz
1108 $(RM) $(htmldocs).tar.gz $(manpages).tar.gz 1191 $(RM) $(htmldocs).tar.gz $(manpages).tar.gz
1109 $(MAKE) -C Documentation/ clean 1192 $(MAKE) -C Documentation/ clean
1110 $(RM) PERF-VERSION-FILE PERF-CFLAGS PERF-BUILD-OPTIONS 1193 $(RM) $(OUTPUT)PERF-VERSION-FILE $(OUTPUT)PERF-CFLAGS $(OUTPUT)PERF-BUILD-OPTIONS
1111 1194
1112.PHONY: all install clean strip 1195.PHONY: all install clean strip
1113.PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell 1196.PHONY: shell_compatibility_test please_set_SHELL_PATH_to_a_more_modern_shell
diff --git a/tools/perf/arch/powerpc/Makefile b/tools/perf/arch/powerpc/Makefile
new file mode 100644
index 000000000000..15130b50dfe3
--- /dev/null
+++ b/tools/perf/arch/powerpc/Makefile
@@ -0,0 +1,4 @@
# Unless NO_DWARF is defined, set PERF_HAVE_DWARF_REGS and add this
# architecture's util/dwarf-regs.o to the library objects.
1ifndef NO_DWARF
2PERF_HAVE_DWARF_REGS := 1
3LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o
4endif
diff --git a/tools/perf/arch/powerpc/util/dwarf-regs.c b/tools/perf/arch/powerpc/util/dwarf-regs.c
new file mode 100644
index 000000000000..48ae0c5e3f73
--- /dev/null
+++ b/tools/perf/arch/powerpc/util/dwarf-regs.c
@@ -0,0 +1,88 @@
1/*
2 * Mapping of DWARF debug register numbers into register names.
3 *
4 * Copyright (C) 2010 Ian Munsie, IBM Corporation.
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12#include <libio.h>
13#include <dwarf-regs.h>
14
15
/*
 * One row of the DWARF register map: a register name paired with the
 * DWARF register number it is reported under.
 */
struct pt_regs_dwarfnum {
	const char *name;
	unsigned int dwarfnum;
};

/* Stringify the argument exactly as it is written. */
#define STR(s) #s
/* Row for a register whose name is given as a string. */
#define REG_DWARFNUM_NAME(r, num) { .dwarfnum = num, .name = r }
/* Row for general purpose register <num>, named "%gpr<num>". */
#define GPR_DWARFNUM_NAME(num) \
	{ .dwarfnum = num, .name = STR(%gpr##num) }
/* Closing row of the table: it is the only row with a NULL name. */
#define REG_DWARFNUM_END { .dwarfnum = 0, .name = NULL }

/*
 * Reference:
 * http://refspecs.linuxfoundation.org/ELF/ppc64/PPC-elf64abi-1.9.html
 */
static const struct pt_regs_dwarfnum regdwarfnum_table[] = {
	/* General purpose registers, DWARF numbers 0-31 */
	GPR_DWARFNUM_NAME(0),  GPR_DWARFNUM_NAME(1),
	GPR_DWARFNUM_NAME(2),  GPR_DWARFNUM_NAME(3),
	GPR_DWARFNUM_NAME(4),  GPR_DWARFNUM_NAME(5),
	GPR_DWARFNUM_NAME(6),  GPR_DWARFNUM_NAME(7),
	GPR_DWARFNUM_NAME(8),  GPR_DWARFNUM_NAME(9),
	GPR_DWARFNUM_NAME(10), GPR_DWARFNUM_NAME(11),
	GPR_DWARFNUM_NAME(12), GPR_DWARFNUM_NAME(13),
	GPR_DWARFNUM_NAME(14), GPR_DWARFNUM_NAME(15),
	GPR_DWARFNUM_NAME(16), GPR_DWARFNUM_NAME(17),
	GPR_DWARFNUM_NAME(18), GPR_DWARFNUM_NAME(19),
	GPR_DWARFNUM_NAME(20), GPR_DWARFNUM_NAME(21),
	GPR_DWARFNUM_NAME(22), GPR_DWARFNUM_NAME(23),
	GPR_DWARFNUM_NAME(24), GPR_DWARFNUM_NAME(25),
	GPR_DWARFNUM_NAME(26), GPR_DWARFNUM_NAME(27),
	GPR_DWARFNUM_NAME(28), GPR_DWARFNUM_NAME(29),
	GPR_DWARFNUM_NAME(30), GPR_DWARFNUM_NAME(31),
	/* Remaining registers, listed by name */
	REG_DWARFNUM_NAME("%msr",   66),
	REG_DWARFNUM_NAME("%ctr",   109),
	REG_DWARFNUM_NAME("%link",  108),
	REG_DWARFNUM_NAME("%xer",   101),
	REG_DWARFNUM_NAME("%dar",   119),
	REG_DWARFNUM_NAME("%dsisr", 118),
	REG_DWARFNUM_END,
};
72
73/**
74 * get_arch_regstr() - lookup register name from it's DWARF register number
75 * @n: the DWARF register number
76 *
77 * get_arch_regstr() returns the name of the register in struct
78 * regdwarfnum_table from it's DWARF register number. If the register is not
79 * found in the table, this returns NULL;
80 */
81const char *get_arch_regstr(unsigned int n)
82{
83 const struct pt_regs_dwarfnum *roff;
84 for (roff = regdwarfnum_table; roff->name != NULL; roff++)
85 if (roff->dwarfnum == n)
86 return roff->name;
87 return NULL;
88}
diff --git a/tools/perf/arch/sparc/Makefile b/tools/perf/arch/sparc/Makefile
new file mode 100644
index 000000000000..15130b50dfe3
--- /dev/null
+++ b/tools/perf/arch/sparc/Makefile
@@ -0,0 +1,4 @@
# Unless NO_DWARF is defined, set PERF_HAVE_DWARF_REGS and add this
# architecture's util/dwarf-regs.o to the library objects.
1ifndef NO_DWARF
2PERF_HAVE_DWARF_REGS := 1
3LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o
4endif
diff --git a/tools/perf/arch/sparc/util/dwarf-regs.c b/tools/perf/arch/sparc/util/dwarf-regs.c
new file mode 100644
index 000000000000..0ab88483720c
--- /dev/null
+++ b/tools/perf/arch/sparc/util/dwarf-regs.c
@@ -0,0 +1,43 @@
1/*
2 * Mapping of DWARF debug register numbers into register names.
3 *
4 * Copyright (C) 2010 David S. Miller <davem@davemloft.net>
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 */
11
12#include <libio.h>
13#include <dwarf-regs.h>
14
/* Number of entries in sparc_regs_table; valid indexes are 0..SPARC_MAX_REGS-1. */
#define SPARC_MAX_REGS	96

/* Register names, indexed by DWARF register number. */
const char *sparc_regs_table[SPARC_MAX_REGS] = {
	"%g0", "%g1", "%g2", "%g3", "%g4", "%g5", "%g6", "%g7",
	"%o0", "%o1", "%o2", "%o3", "%o4", "%o5", "%sp", "%o7",
	"%l0", "%l1", "%l2", "%l3", "%l4", "%l5", "%l6", "%l7",
	"%i0", "%i1", "%i2", "%i3", "%i4", "%i5", "%fp", "%i7",
	"%f0", "%f1", "%f2", "%f3", "%f4", "%f5", "%f6", "%f7",
	"%f8", "%f9", "%f10", "%f11", "%f12", "%f13", "%f14", "%f15",
	"%f16", "%f17", "%f18", "%f19", "%f20", "%f21", "%f22", "%f23",
	"%f24", "%f25", "%f26", "%f27", "%f28", "%f29", "%f30", "%f31",
	"%f32", "%f33", "%f34", "%f35", "%f36", "%f37", "%f38", "%f39",
	"%f40", "%f41", "%f42", "%f43", "%f44", "%f45", "%f46", "%f47",
	"%f48", "%f49", "%f50", "%f51", "%f52", "%f53", "%f54", "%f55",
	"%f56", "%f57", "%f58", "%f59", "%f60", "%f61", "%f62", "%f63",
};

/**
 * get_arch_regstr() - look up a register name by its DWARF register number
 * @n: the DWARF register number
 *
 * Returns the sparc_regs_table entry for @n, or NULL when @n is not a
 * valid index into that table.
 */
const char *get_arch_regstr(unsigned int n)
{
	/*
	 * The comparison must be strict: SPARC_MAX_REGS is the table size,
	 * so index SPARC_MAX_REGS is already one past the last element.
	 */
	return (n < SPARC_MAX_REGS) ? sparc_regs_table[n] : NULL;
}
diff --git a/tools/perf/arch/x86/Makefile b/tools/perf/arch/x86/Makefile
new file mode 100644
index 000000000000..15130b50dfe3
--- /dev/null
+++ b/tools/perf/arch/x86/Makefile
@@ -0,0 +1,4 @@
# Unless NO_DWARF is defined, set PERF_HAVE_DWARF_REGS and add this
# architecture's util/dwarf-regs.o to the library objects.
1ifndef NO_DWARF
2PERF_HAVE_DWARF_REGS := 1
3LIB_OBJS += $(OUTPUT)arch/$(ARCH)/util/dwarf-regs.o
4endif
diff --git a/tools/perf/arch/x86/util/dwarf-regs.c b/tools/perf/arch/x86/util/dwarf-regs.c
new file mode 100644
index 000000000000..a794d3081928
--- /dev/null
+++ b/tools/perf/arch/x86/util/dwarf-regs.c
@@ -0,0 +1,75 @@
1/*
2 * dwarf-regs.c : Mapping of DWARF debug register numbers into register names.
3 * Extracted from probe-finder.c
4 *
5 * Written by Masami Hiramatsu <mhiramat@redhat.com>
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
20 *
21 */
22
23#include <libio.h>
24#include <dwarf-regs.h>
25
26/*
27 * Generic dwarf analysis helpers
28 */
29
/* Register names for 32-bit x86, indexed by DWARF register number. */
#define X86_32_MAX_REGS 8
const char *x86_32_regs_table[X86_32_MAX_REGS] = {
	"%ax",
	"%cx",
	"%dx",
	"%bx",
	"$stack",	/* Stack address instead of %sp */
	"%bp",
	"%si",
	"%di",
};

/* Register names for x86-64, indexed by DWARF register number. */
#define X86_64_MAX_REGS 16
const char *x86_64_regs_table[X86_64_MAX_REGS] = {
	"%ax",
	"%dx",
	"%cx",
	"%bx",
	"%si",
	"%di",
	"%bp",
	"%sp",
	"%r8",
	"%r9",
	"%r10",
	"%r11",
	"%r12",
	"%r13",
	"%r14",
	"%r15",
};

/*
 * Select the table matching the architecture this file is compiled for.
 * TODO: switching by dwarf address size
 */
#ifdef __x86_64__
#define ARCH_MAX_REGS X86_64_MAX_REGS
#define arch_regs_table x86_64_regs_table
#else
#define ARCH_MAX_REGS X86_32_MAX_REGS
#define arch_regs_table x86_32_regs_table
#endif

/**
 * get_arch_regstr() - return the architecture dependent register string
 *                     (for kprobe-tracer)
 * @n: the DWARF register number
 *
 * Returns the arch_regs_table entry for @n, or NULL when @n is not a valid
 * index into the selected table.
 */
const char *get_arch_regstr(unsigned int n)
{
	/*
	 * The comparison must be strict: ARCH_MAX_REGS is the table size,
	 * so index ARCH_MAX_REGS is already one past the last element.
	 */
	return (n < ARCH_MAX_REGS) ? arch_regs_table[n] : NULL;
}
diff --git a/tools/perf/bench/mem-memcpy.c b/tools/perf/bench/mem-memcpy.c
index 89773178e894..38dae7465142 100644
--- a/tools/perf/bench/mem-memcpy.c
+++ b/tools/perf/bench/mem-memcpy.c
@@ -10,7 +10,6 @@
10#include "../perf.h" 10#include "../perf.h"
11#include "../util/util.h" 11#include "../util/util.h"
12#include "../util/parse-options.h" 12#include "../util/parse-options.h"
13#include "../util/string.h"
14#include "../util/header.h" 13#include "../util/header.h"
15#include "bench.h" 14#include "bench.h"
16 15
@@ -24,7 +23,7 @@
24 23
25static const char *length_str = "1MB"; 24static const char *length_str = "1MB";
26static const char *routine = "default"; 25static const char *routine = "default";
27static int use_clock = 0; 26static bool use_clock = false;
28static int clock_fd; 27static int clock_fd;
29 28
30static const struct option options[] = { 29static const struct option options[] = {
diff --git a/tools/perf/bench/sched-messaging.c b/tools/perf/bench/sched-messaging.c
index 81cee78181fa..d1d1b30f99c1 100644
--- a/tools/perf/bench/sched-messaging.c
+++ b/tools/perf/bench/sched-messaging.c
@@ -31,9 +31,9 @@
31 31
32#define DATASIZE 100 32#define DATASIZE 100
33 33
34static int use_pipes = 0; 34static bool use_pipes = false;
35static unsigned int loops = 100; 35static unsigned int loops = 100;
36static unsigned int thread_mode = 0; 36static bool thread_mode = false;
37static unsigned int num_groups = 10; 37static unsigned int num_groups = 10;
38 38
39struct sender_context { 39struct sender_context {
@@ -256,10 +256,8 @@ static const struct option options[] = {
256 "Use pipe() instead of socketpair()"), 256 "Use pipe() instead of socketpair()"),
257 OPT_BOOLEAN('t', "thread", &thread_mode, 257 OPT_BOOLEAN('t', "thread", &thread_mode,
258 "Be multi thread instead of multi process"), 258 "Be multi thread instead of multi process"),
259 OPT_INTEGER('g', "group", &num_groups, 259 OPT_UINTEGER('g', "group", &num_groups, "Specify number of groups"),
260 "Specify number of groups"), 260 OPT_UINTEGER('l', "loop", &loops, "Specify number of loops"),
261 OPT_INTEGER('l', "loop", &loops,
262 "Specify number of loops"),
263 OPT_END() 261 OPT_END()
264}; 262};
265 263
diff --git a/tools/perf/bench/sched-pipe.c b/tools/perf/bench/sched-pipe.c
index 4f77c7c27640..d9ab3ce446ac 100644
--- a/tools/perf/bench/sched-pipe.c
+++ b/tools/perf/bench/sched-pipe.c
@@ -93,7 +93,7 @@ int bench_sched_pipe(int argc, const char **argv,
93 93
94 switch (bench_format) { 94 switch (bench_format) {
95 case BENCH_FORMAT_DEFAULT: 95 case BENCH_FORMAT_DEFAULT:
96 printf("# Extecuted %d pipe operations between two tasks\n\n", 96 printf("# Executed %d pipe operations between two tasks\n\n",
97 loops); 97 loops);
98 98
99 result_usec = diff.tv_sec * 1000000; 99 result_usec = diff.tv_sec * 1000000;
diff --git a/tools/perf/builtin-annotate.c b/tools/perf/builtin-annotate.c
index 593ff25006de..96db5248e995 100644
--- a/tools/perf/builtin-annotate.c
+++ b/tools/perf/builtin-annotate.c
@@ -14,7 +14,6 @@
14#include "util/cache.h" 14#include "util/cache.h"
15#include <linux/rbtree.h> 15#include <linux/rbtree.h>
16#include "util/symbol.h" 16#include "util/symbol.h"
17#include "util/string.h"
18 17
19#include "perf.h" 18#include "perf.h"
20#include "util/debug.h" 19#include "util/debug.h"
@@ -29,175 +28,67 @@
29 28
30static char const *input_name = "perf.data"; 29static char const *input_name = "perf.data";
31 30
32static int force; 31static bool force;
33 32
34static int full_paths; 33static bool full_paths;
35 34
36static int print_line; 35static bool print_line;
37
38struct sym_hist {
39 u64 sum;
40 u64 ip[0];
41};
42
43struct sym_ext {
44 struct rb_node node;
45 double percent;
46 char *path;
47};
48
49struct sym_priv {
50 struct sym_hist *hist;
51 struct sym_ext *ext;
52};
53 36
54static const char *sym_hist_filter; 37static const char *sym_hist_filter;
55 38
56static int symbol_filter(struct map *map __used, struct symbol *sym) 39static int hists__add_entry(struct hists *self, struct addr_location *al)
57{ 40{
58 if (sym_hist_filter == NULL || 41 struct hist_entry *he;
59 strcmp(sym->name, sym_hist_filter) == 0) { 42
60 struct sym_priv *priv = symbol__priv(sym); 43 if (sym_hist_filter != NULL &&
61 const int size = (sizeof(*priv->hist) + 44 (al->sym == NULL || strcmp(sym_hist_filter, al->sym->name) != 0)) {
62 (sym->end - sym->start) * sizeof(u64)); 45 /* We're only interested in a symbol named sym_hist_filter */
63 46 if (al->sym != NULL) {
64 priv->hist = malloc(size); 47 rb_erase(&al->sym->rb_node,
65 if (priv->hist) 48 &al->map->dso->symbols[al->map->type]);
66 memset(priv->hist, 0, size); 49 symbol__delete(al->sym);
50 }
67 return 0; 51 return 0;
68 } 52 }
69 /*
70 * FIXME: We should really filter it out, as we don't want to go thru symbols
71 * we're not interested, and if a DSO ends up with no symbols, delete it too,
72 * but right now the kernel loading routines in symbol.c bail out if no symbols
73 * are found, fix it later.
74 */
75 return 0;
76}
77
78/*
79 * collect histogram counts
80 */
81static void hist_hit(struct hist_entry *he, u64 ip)
82{
83 unsigned int sym_size, offset;
84 struct symbol *sym = he->sym;
85 struct sym_priv *priv;
86 struct sym_hist *h;
87
88 he->count++;
89
90 if (!sym || !he->map)
91 return;
92 53
93 priv = symbol__priv(sym); 54 he = __hists__add_entry(self, al, NULL, 1);
94 if (!priv->hist)
95 return;
96
97 sym_size = sym->end - sym->start;
98 offset = ip - sym->start;
99
100 if (verbose)
101 fprintf(stderr, "%s: ip=%Lx\n", __func__,
102 he->map->unmap_ip(he->map, ip));
103
104 if (offset >= sym_size)
105 return;
106
107 h = priv->hist;
108 h->sum++;
109 h->ip[offset]++;
110
111 if (verbose >= 3)
112 printf("%p %s: count++ [ip: %p, %08Lx] => %Ld\n",
113 (void *)(unsigned long)he->sym->start,
114 he->sym->name,
115 (void *)(unsigned long)ip, ip - he->sym->start,
116 h->ip[offset]);
117}
118
119static int perf_session__add_hist_entry(struct perf_session *self,
120 struct addr_location *al, u64 count)
121{
122 bool hit;
123 struct hist_entry *he = __perf_session__add_hist_entry(self, al, NULL,
124 count, &hit);
125 if (he == NULL) 55 if (he == NULL)
126 return -ENOMEM; 56 return -ENOMEM;
127 hist_hit(he, al->addr); 57
128 return 0; 58 return hist_entry__inc_addr_samples(he, al->addr);
129} 59}
130 60
131static int process_sample_event(event_t *event, struct perf_session *session) 61static int process_sample_event(event_t *event, struct perf_session *session)
132{ 62{
133 struct addr_location al; 63 struct addr_location al;
134 64
135 dump_printf("(IP, %d): %d: %p\n", event->header.misc, 65 dump_printf("(IP, %d): %d: %#Lx\n", event->header.misc,
136 event->ip.pid, (void *)(long)event->ip.ip); 66 event->ip.pid, event->ip.ip);
137 67
138 if (event__preprocess_sample(event, session, &al, symbol_filter) < 0) { 68 if (event__preprocess_sample(event, session, &al, NULL) < 0) {
139 fprintf(stderr, "problem processing %d event, skipping it.\n", 69 pr_warning("problem processing %d event, skipping it.\n",
140 event->header.type); 70 event->header.type);
141 return -1; 71 return -1;
142 } 72 }
143 73
144 if (!al.filtered && perf_session__add_hist_entry(session, &al, 1)) { 74 if (!al.filtered && hists__add_entry(&session->hists, &al)) {
145 fprintf(stderr, "problem incrementing symbol count, " 75 pr_warning("problem incrementing symbol count, "
146 "skipping event\n"); 76 "skipping event\n");
147 return -1; 77 return -1;
148 } 78 }
149 79
150 return 0; 80 return 0;
151} 81}
152 82
153static int parse_line(FILE *file, struct hist_entry *he, u64 len) 83static int objdump_line__print(struct objdump_line *self,
84 struct list_head *head,
85 struct hist_entry *he, u64 len)
154{ 86{
155 struct symbol *sym = he->sym; 87 struct symbol *sym = he->ms.sym;
156 char *line = NULL, *tmp, *tmp2;
157 static const char *prev_line; 88 static const char *prev_line;
158 static const char *prev_color; 89 static const char *prev_color;
159 unsigned int offset;
160 size_t line_len;
161 u64 start;
162 s64 line_ip;
163 int ret;
164 char *c;
165
166 if (getline(&line, &line_len, file) < 0)
167 return -1;
168 if (!line)
169 return -1;
170 90
171 c = strchr(line, '\n'); 91 if (self->offset != -1) {
172 if (c)
173 *c = 0;
174
175 line_ip = -1;
176 offset = 0;
177 ret = -2;
178
179 /*
180 * Strip leading spaces:
181 */
182 tmp = line;
183 while (*tmp) {
184 if (*tmp != ' ')
185 break;
186 tmp++;
187 }
188
189 if (*tmp) {
190 /*
191 * Parse hexa addresses followed by ':'
192 */
193 line_ip = strtoull(tmp, &tmp2, 16);
194 if (*tmp2 != ':')
195 line_ip = -1;
196 }
197
198 start = he->map->unmap_ip(he->map, sym->start);
199
200 if (line_ip != -1) {
201 const char *path = NULL; 92 const char *path = NULL;
202 unsigned int hits = 0; 93 unsigned int hits = 0;
203 double percent = 0.0; 94 double percent = 0.0;
@@ -205,15 +96,22 @@ static int parse_line(FILE *file, struct hist_entry *he, u64 len)
205 struct sym_priv *priv = symbol__priv(sym); 96 struct sym_priv *priv = symbol__priv(sym);
206 struct sym_ext *sym_ext = priv->ext; 97 struct sym_ext *sym_ext = priv->ext;
207 struct sym_hist *h = priv->hist; 98 struct sym_hist *h = priv->hist;
99 s64 offset = self->offset;
100 struct objdump_line *next = objdump__get_next_ip_line(head, self);
101
102 while (offset < (s64)len &&
103 (next == NULL || offset < next->offset)) {
104 if (sym_ext) {
105 if (path == NULL)
106 path = sym_ext[offset].path;
107 percent += sym_ext[offset].percent;
108 } else
109 hits += h->ip[offset];
110
111 ++offset;
112 }
208 113
209 offset = line_ip - start; 114 if (sym_ext == NULL && h->sum)
210 if (offset < len)
211 hits = h->ip[offset];
212
213 if (offset < len && sym_ext) {
214 path = sym_ext[offset].path;
215 percent = sym_ext[offset].percent;
216 } else if (h->sum)
217 percent = 100.0 * hits / h->sum; 115 percent = 100.0 * hits / h->sum;
218 116
219 color = get_percent_color(percent); 117 color = get_percent_color(percent);
@@ -234,12 +132,12 @@ static int parse_line(FILE *file, struct hist_entry *he, u64 len)
234 132
235 color_fprintf(stdout, color, " %7.2f", percent); 133 color_fprintf(stdout, color, " %7.2f", percent);
236 printf(" : "); 134 printf(" : ");
237 color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", line); 135 color_fprintf(stdout, PERF_COLOR_BLUE, "%s\n", self->line);
238 } else { 136 } else {
239 if (!*line) 137 if (!*self->line)
240 printf(" :\n"); 138 printf(" :\n");
241 else 139 else
242 printf(" : %s\n", line); 140 printf(" : %s\n", self->line);
243 } 141 }
244 142
245 return 0; 143 return 0;
@@ -269,7 +167,7 @@ static void insert_source_line(struct sym_ext *sym_ext)
269 167
270static void free_source_line(struct hist_entry *he, int len) 168static void free_source_line(struct hist_entry *he, int len)
271{ 169{
272 struct sym_priv *priv = symbol__priv(he->sym); 170 struct sym_priv *priv = symbol__priv(he->ms.sym);
273 struct sym_ext *sym_ext = priv->ext; 171 struct sym_ext *sym_ext = priv->ext;
274 int i; 172 int i;
275 173
@@ -288,7 +186,7 @@ static void free_source_line(struct hist_entry *he, int len)
288static void 186static void
289get_source_line(struct hist_entry *he, int len, const char *filename) 187get_source_line(struct hist_entry *he, int len, const char *filename)
290{ 188{
291 struct symbol *sym = he->sym; 189 struct symbol *sym = he->ms.sym;
292 u64 start; 190 u64 start;
293 int i; 191 int i;
294 char cmd[PATH_MAX * 2]; 192 char cmd[PATH_MAX * 2];
@@ -303,7 +201,7 @@ get_source_line(struct hist_entry *he, int len, const char *filename)
303 if (!priv->ext) 201 if (!priv->ext)
304 return; 202 return;
305 203
306 start = he->map->unmap_ip(he->map, sym->start); 204 start = he->ms.map->unmap_ip(he->ms.map, sym->start);
307 205
308 for (i = 0; i < len; i++) { 206 for (i = 0; i < len; i++) {
309 char *path = NULL; 207 char *path = NULL;
@@ -365,24 +263,32 @@ static void print_summary(const char *filename)
365 } 263 }
366} 264}
367 265
368static void annotate_sym(struct hist_entry *he) 266static void hist_entry__print_hits(struct hist_entry *self)
369{ 267{
370 struct map *map = he->map; 268 struct symbol *sym = self->ms.sym;
269 struct sym_priv *priv = symbol__priv(sym);
270 struct sym_hist *h = priv->hist;
271 u64 len = sym->end - sym->start, offset;
272
273 for (offset = 0; offset < len; ++offset)
274 if (h->ip[offset] != 0)
275 printf("%*Lx: %Lu\n", BITS_PER_LONG / 2,
276 sym->start + offset, h->ip[offset]);
277 printf("%*s: %Lu\n", BITS_PER_LONG / 2, "h->sum", h->sum);
278}
279
280static int hist_entry__tty_annotate(struct hist_entry *he)
281{
282 struct map *map = he->ms.map;
371 struct dso *dso = map->dso; 283 struct dso *dso = map->dso;
372 struct symbol *sym = he->sym; 284 struct symbol *sym = he->ms.sym;
373 const char *filename = dso->long_name, *d_filename; 285 const char *filename = dso->long_name, *d_filename;
374 u64 len; 286 u64 len;
375 char command[PATH_MAX*2]; 287 LIST_HEAD(head);
376 FILE *file; 288 struct objdump_line *pos, *n;
377
378 if (!filename)
379 return;
380 289
381 if (verbose) 290 if (hist_entry__annotate(he, &head) < 0)
382 fprintf(stderr, "%s: filename=%s, sym=%s, start=%Lx, end=%Lx\n", 291 return -1;
383 __func__, filename, sym->name,
384 map->unmap_ip(map, sym->start),
385 map->unmap_ip(map, sym->end));
386 292
387 if (full_paths) 293 if (full_paths)
388 d_filename = filename; 294 d_filename = filename;
@@ -400,61 +306,78 @@ static void annotate_sym(struct hist_entry *he)
400 printf(" Percent | Source code & Disassembly of %s\n", d_filename); 306 printf(" Percent | Source code & Disassembly of %s\n", d_filename);
401 printf("------------------------------------------------\n"); 307 printf("------------------------------------------------\n");
402 308
403 if (verbose >= 2) 309 if (verbose)
404 printf("annotating [%p] %30s : [%p] %30s\n", 310 hist_entry__print_hits(he);
405 dso, dso->long_name, sym, sym->name);
406
407 sprintf(command, "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s",
408 map->unmap_ip(map, sym->start), map->unmap_ip(map, sym->end),
409 filename, filename);
410
411 if (verbose >= 3)
412 printf("doing: %s\n", command);
413
414 file = popen(command, "r");
415 if (!file)
416 return;
417 311
418 while (!feof(file)) { 312 list_for_each_entry_safe(pos, n, &head, node) {
419 if (parse_line(file, he, len) < 0) 313 objdump_line__print(pos, &head, he, len);
420 break; 314 list_del(&pos->node);
315 objdump_line__free(pos);
421 } 316 }
422 317
423 pclose(file);
424 if (print_line) 318 if (print_line)
425 free_source_line(he, len); 319 free_source_line(he, len);
320
321 return 0;
426} 322}
427 323
428static void perf_session__find_annotations(struct perf_session *self) 324static void hists__find_annotations(struct hists *self)
429{ 325{
430 struct rb_node *nd; 326 struct rb_node *first = rb_first(&self->entries), *nd = first;
327 int key = KEY_RIGHT;
431 328
432 for (nd = rb_first(&self->hists); nd; nd = rb_next(nd)) { 329 while (nd) {
433 struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node); 330 struct hist_entry *he = rb_entry(nd, struct hist_entry, rb_node);
434 struct sym_priv *priv; 331 struct sym_priv *priv;
435 332
436 if (he->sym == NULL) 333 if (he->ms.sym == NULL || he->ms.map->dso->annotate_warned)
437 continue; 334 goto find_next;
438 335
439 priv = symbol__priv(he->sym); 336 priv = symbol__priv(he->ms.sym);
440 if (priv->hist == NULL) 337 if (priv->hist == NULL) {
338find_next:
339 if (key == KEY_LEFT)
340 nd = rb_prev(nd);
341 else
342 nd = rb_next(nd);
441 continue; 343 continue;
344 }
442 345
443 annotate_sym(he); 346 if (use_browser > 0) {
444 /* 347 key = hist_entry__tui_annotate(he);
445 * Since we have a hist_entry per IP for the same symbol, free 348 if (is_exit_key(key))
446 * he->sym->hist to signal we already processed this symbol. 349 break;
447 */ 350 switch (key) {
448 free(priv->hist); 351 case KEY_RIGHT:
449 priv->hist = NULL; 352 case '\t':
353 nd = rb_next(nd);
354 break;
355 case KEY_LEFT:
356 if (nd == first)
357 continue;
358 nd = rb_prev(nd);
359 default:
360 break;
361 }
362 } else {
363 hist_entry__tty_annotate(he);
364 nd = rb_next(nd);
365 /*
366 * Since we have a hist_entry per IP for the same
367 * symbol, free he->ms.sym->hist to signal we already
368 * processed this symbol.
369 */
370 free(priv->hist);
371 priv->hist = NULL;
372 }
450 } 373 }
451} 374}
452 375
453static struct perf_event_ops event_ops = { 376static struct perf_event_ops event_ops = {
454 .process_sample_event = process_sample_event, 377 .sample = process_sample_event,
455 .process_mmap_event = event__process_mmap, 378 .mmap = event__process_mmap,
456 .process_comm_event = event__process_comm, 379 .comm = event__process_comm,
457 .process_fork_event = event__process_task, 380 .fork = event__process_task,
458}; 381};
459 382
460static int __cmd_annotate(void) 383static int __cmd_annotate(void)
@@ -462,7 +385,7 @@ static int __cmd_annotate(void)
462 int ret; 385 int ret;
463 struct perf_session *session; 386 struct perf_session *session;
464 387
465 session = perf_session__new(input_name, O_RDONLY, force); 388 session = perf_session__new(input_name, O_RDONLY, force, false);
466 if (session == NULL) 389 if (session == NULL)
467 return -ENOMEM; 390 return -ENOMEM;
468 391
@@ -471,7 +394,7 @@ static int __cmd_annotate(void)
471 goto out_delete; 394 goto out_delete;
472 395
473 if (dump_trace) { 396 if (dump_trace) {
474 event__print_totals(); 397 perf_session__fprintf_nr_events(session, stdout);
475 goto out_delete; 398 goto out_delete;
476 } 399 }
477 400
@@ -479,11 +402,11 @@ static int __cmd_annotate(void)
479 perf_session__fprintf(session, stdout); 402 perf_session__fprintf(session, stdout);
480 403
481 if (verbose > 2) 404 if (verbose > 2)
482 dsos__fprintf(stdout); 405 perf_session__fprintf_dsos(session, stdout);
483 406
484 perf_session__collapse_resort(session); 407 hists__collapse_resort(&session->hists);
485 perf_session__output_resort(session, session->event_total[0]); 408 hists__output_resort(&session->hists);
486 perf_session__find_annotations(session); 409 hists__find_annotations(&session->hists);
487out_delete: 410out_delete:
488 perf_session__delete(session); 411 perf_session__delete(session);
489 412
@@ -498,10 +421,12 @@ static const char * const annotate_usage[] = {
498static const struct option options[] = { 421static const struct option options[] = {
499 OPT_STRING('i', "input", &input_name, "file", 422 OPT_STRING('i', "input", &input_name, "file",
500 "input file name"), 423 "input file name"),
424 OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
425 "only consider symbols in these dsos"),
501 OPT_STRING('s', "symbol", &sym_hist_filter, "symbol", 426 OPT_STRING('s', "symbol", &sym_hist_filter, "symbol",
502 "symbol to annotate"), 427 "symbol to annotate"),
503 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), 428 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
504 OPT_BOOLEAN('v', "verbose", &verbose, 429 OPT_INCR('v', "verbose", &verbose,
505 "be more verbose (show symbol address, etc)"), 430 "be more verbose (show symbol address, etc)"),
506 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, 431 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
507 "dump raw trace in ASCII"), 432 "dump raw trace in ASCII"),
@@ -520,6 +445,8 @@ int cmd_annotate(int argc, const char **argv, const char *prefix __used)
520{ 445{
521 argc = parse_options(argc, argv, options, annotate_usage, 0); 446 argc = parse_options(argc, argv, options, annotate_usage, 0);
522 447
448 setup_browser();
449
523 symbol_conf.priv_size = sizeof(struct sym_priv); 450 symbol_conf.priv_size = sizeof(struct sym_priv);
524 symbol_conf.try_vmlinux_path = true; 451 symbol_conf.try_vmlinux_path = true;
525 452
@@ -539,12 +466,9 @@ int cmd_annotate(int argc, const char **argv, const char *prefix __used)
539 sym_hist_filter = argv[0]; 466 sym_hist_filter = argv[0];
540 } 467 }
541 468
542 setup_pager();
543
544 if (field_sep && *field_sep == '.') { 469 if (field_sep && *field_sep == '.') {
545 fputs("'.' is the only non valid --field-separator argument\n", 470 pr_err("'.' is the only non valid --field-separator argument\n");
546 stderr); 471 return -1;
547 exit(129);
548 } 472 }
549 473
550 return __cmd_annotate(); 474 return __cmd_annotate();
diff --git a/tools/perf/builtin-bench.c b/tools/perf/builtin-bench.c
index 46996774e559..fcb96269852a 100644
--- a/tools/perf/builtin-bench.c
+++ b/tools/perf/builtin-bench.c
@@ -95,7 +95,7 @@ static void dump_suites(int subsys_index)
95 return; 95 return;
96} 96}
97 97
98static char *bench_format_str; 98static const char *bench_format_str;
99int bench_format = BENCH_FORMAT_DEFAULT; 99int bench_format = BENCH_FORMAT_DEFAULT;
100 100
101static const struct option bench_options[] = { 101static const struct option bench_options[] = {
@@ -126,7 +126,7 @@ static void print_usage(void)
126 printf("\n"); 126 printf("\n");
127} 127}
128 128
129static int bench_str2int(char *str) 129static int bench_str2int(const char *str)
130{ 130{
131 if (!str) 131 if (!str)
132 return BENCH_FORMAT_DEFAULT; 132 return BENCH_FORMAT_DEFAULT;
diff --git a/tools/perf/builtin-buildid-cache.c b/tools/perf/builtin-buildid-cache.c
new file mode 100644
index 000000000000..f8e3d1852029
--- /dev/null
+++ b/tools/perf/builtin-buildid-cache.c
@@ -0,0 +1,133 @@
1/*
2 * builtin-buildid-cache.c
3 *
4 * Builtin buildid-cache command: Manages build-id cache
5 *
6 * Copyright (C) 2010, Red Hat Inc.
7 * Copyright (C) 2010, Arnaldo Carvalho de Melo <acme@redhat.com>
8 */
9#include "builtin.h"
10#include "perf.h"
11#include "util/cache.h"
12#include "util/debug.h"
13#include "util/header.h"
14#include "util/parse-options.h"
15#include "util/strlist.h"
16#include "util/symbol.h"
17
18static char const *add_name_list_str, *remove_name_list_str;
19
20static const char * const buildid_cache_usage[] = {
21 "perf buildid-cache [<options>]",
22 NULL
23};
24
25static const struct option buildid_cache_options[] = {
26 OPT_STRING('a', "add", &add_name_list_str,
27 "file list", "file(s) to add"),
28 OPT_STRING('r', "remove", &remove_name_list_str, "file list",
29 "file(s) to remove"),
30 OPT_INCR('v', "verbose", &verbose, "be more verbose"),
31 OPT_END()
32};
33
34static int build_id_cache__add_file(const char *filename, const char *debugdir)
35{
36 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
37 u8 build_id[BUILD_ID_SIZE];
38 int err;
39
40 if (filename__read_build_id(filename, &build_id, sizeof(build_id)) < 0) {
41 pr_debug("Couldn't read a build-id in %s\n", filename);
42 return -1;
43 }
44
45 build_id__sprintf(build_id, sizeof(build_id), sbuild_id);
46 err = build_id_cache__add_s(sbuild_id, debugdir, filename, false);
47 if (verbose)
48 pr_info("Adding %s %s: %s\n", sbuild_id, filename,
49 err ? "FAIL" : "Ok");
50 return err;
51}
52
53static int build_id_cache__remove_file(const char *filename __used,
54 const char *debugdir __used)
55{
56 u8 build_id[BUILD_ID_SIZE];
57 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
58
59 int err;
60
61 if (filename__read_build_id(filename, &build_id, sizeof(build_id)) < 0) {
62 pr_debug("Couldn't read a build-id in %s\n", filename);
63 return -1;
64 }
65
66 build_id__sprintf(build_id, sizeof(build_id), sbuild_id);
67 err = build_id_cache__remove_s(sbuild_id, debugdir);
68 if (verbose)
69 pr_info("Removing %s %s: %s\n", sbuild_id, filename,
70 err ? "FAIL" : "Ok");
71
72 return err;
73}
74
75static int __cmd_buildid_cache(void)
76{
77 struct strlist *list;
78 struct str_node *pos;
79 char debugdir[PATH_MAX];
80
81 snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"),
82 DEBUG_CACHE_DIR);
83
84 if (add_name_list_str) {
85 list = strlist__new(true, add_name_list_str);
86 if (list) {
87 strlist__for_each(pos, list)
88 if (build_id_cache__add_file(pos->s, debugdir)) {
89 if (errno == EEXIST) {
90 pr_debug("%s already in the cache\n",
91 pos->s);
92 continue;
93 }
94 pr_warning("Couldn't add %s: %s\n",
95 pos->s, strerror(errno));
96 }
97
98 strlist__delete(list);
99 }
100 }
101
102 if (remove_name_list_str) {
103 list = strlist__new(true, remove_name_list_str);
104 if (list) {
105 strlist__for_each(pos, list)
106 if (build_id_cache__remove_file(pos->s, debugdir)) {
107 if (errno == ENOENT) {
108 pr_debug("%s wasn't in the cache\n",
109 pos->s);
110 continue;
111 }
112 pr_warning("Couldn't remove %s: %s\n",
113 pos->s, strerror(errno));
114 }
115
116 strlist__delete(list);
117 }
118 }
119
120 return 0;
121}
122
123int cmd_buildid_cache(int argc, const char **argv, const char *prefix __used)
124{
125 argc = parse_options(argc, argv, buildid_cache_options,
126 buildid_cache_usage, 0);
127
128 if (symbol__init() < 0)
129 return -1;
130
131 setup_pager();
132 return __cmd_buildid_cache();
133}
diff --git a/tools/perf/builtin-buildid-list.c b/tools/perf/builtin-buildid-list.c
index 1e99ac806913..99890728409e 100644
--- a/tools/perf/builtin-buildid-list.c
+++ b/tools/perf/builtin-buildid-list.c
@@ -8,6 +8,7 @@
8 */ 8 */
9#include "builtin.h" 9#include "builtin.h"
10#include "perf.h" 10#include "perf.h"
11#include "util/build-id.h"
11#include "util/cache.h" 12#include "util/cache.h"
12#include "util/debug.h" 13#include "util/debug.h"
13#include "util/parse-options.h" 14#include "util/parse-options.h"
@@ -15,7 +16,8 @@
15#include "util/symbol.h" 16#include "util/symbol.h"
16 17
17static char const *input_name = "perf.data"; 18static char const *input_name = "perf.data";
18static int force; 19static bool force;
20static bool with_hits;
19 21
20static const char * const buildid_list_usage[] = { 22static const char * const buildid_list_usage[] = {
21 "perf buildid-list [<options>]", 23 "perf buildid-list [<options>]",
@@ -23,47 +25,30 @@ static const char * const buildid_list_usage[] = {
23}; 25};
24 26
25static const struct option options[] = { 27static const struct option options[] = {
28 OPT_BOOLEAN('H', "with-hits", &with_hits, "Show only DSOs with hits"),
26 OPT_STRING('i', "input", &input_name, "file", 29 OPT_STRING('i', "input", &input_name, "file",
27 "input file name"), 30 "input file name"),
28 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), 31 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
29 OPT_BOOLEAN('v', "verbose", &verbose, 32 OPT_INCR('v', "verbose", &verbose,
30 "be more verbose"), 33 "be more verbose"),
31 OPT_END() 34 OPT_END()
32}; 35};
33 36
34static int perf_file_section__process_buildids(struct perf_file_section *self,
35 int feat, int fd)
36{
37 if (feat != HEADER_BUILD_ID)
38 return 0;
39
40 if (lseek(fd, self->offset, SEEK_SET) < 0) {
41 pr_warning("Failed to lseek to %Ld offset for buildids!\n",
42 self->offset);
43 return -1;
44 }
45
46 if (perf_header__read_build_ids(fd, self->offset, self->size)) {
47 pr_warning("Failed to read buildids!\n");
48 return -1;
49 }
50
51 return 0;
52}
53
54static int __cmd_buildid_list(void) 37static int __cmd_buildid_list(void)
55{ 38{
56 int err = -1; 39 int err = -1;
57 struct perf_session *session; 40 struct perf_session *session;
58 41
59 session = perf_session__new(input_name, O_RDONLY, force); 42 session = perf_session__new(input_name, O_RDONLY, force, false);
60 if (session == NULL) 43 if (session == NULL)
61 return -1; 44 return -1;
62 45
63 err = perf_header__process_sections(&session->header, session->fd, 46 if (with_hits) {
64 perf_file_section__process_buildids); 47 symbol_conf.full_paths = true;
65 if (err >= 0) 48 perf_session__process_events(session, &build_id__mark_dso_hit_ops);
66 dsos__fprintf_buildid(stdout); 49 }
50
51 perf_session__fprintf_dsos_buildid(session, stdout, with_hits);
67 52
68 perf_session__delete(session); 53 perf_session__delete(session);
69 return err; 54 return err;
diff --git a/tools/perf/builtin-diff.c b/tools/perf/builtin-diff.c
index bd71b8ceafb7..a6e2fdc7a04e 100644
--- a/tools/perf/builtin-diff.c
+++ b/tools/perf/builtin-diff.c
@@ -19,22 +19,15 @@
19static char const *input_old = "perf.data.old", 19static char const *input_old = "perf.data.old",
20 *input_new = "perf.data"; 20 *input_new = "perf.data";
21static char diff__default_sort_order[] = "dso,symbol"; 21static char diff__default_sort_order[] = "dso,symbol";
22static int force; 22static bool force;
23static bool show_displacement; 23static bool show_displacement;
24 24
25static int perf_session__add_hist_entry(struct perf_session *self, 25static int hists__add_entry(struct hists *self,
26 struct addr_location *al, u64 count) 26 struct addr_location *al, u64 period)
27{ 27{
28 bool hit; 28 if (__hists__add_entry(self, al, NULL, period) != NULL)
29 struct hist_entry *he = __perf_session__add_hist_entry(self, al, NULL, 29 return 0;
30 count, &hit); 30 return -ENOMEM;
31 if (he == NULL)
32 return -ENOMEM;
33
34 if (hit)
35 he->count += count;
36
37 return 0;
38} 31}
39 32
40static int diff__process_sample_event(event_t *event, struct perf_session *session) 33static int diff__process_sample_event(event_t *event, struct perf_session *session)
@@ -42,8 +35,8 @@ static int diff__process_sample_event(event_t *event, struct perf_session *sessi
42 struct addr_location al; 35 struct addr_location al;
43 struct sample_data data = { .period = 1, }; 36 struct sample_data data = { .period = 1, };
44 37
45 dump_printf("(IP, %d): %d: %p\n", event->header.misc, 38 dump_printf("(IP, %d): %d: %#Lx\n", event->header.misc,
46 event->ip.pid, (void *)(long)event->ip.ip); 39 event->ip.pid, event->ip.ip);
47 40
48 if (event__preprocess_sample(event, session, &al, NULL) < 0) { 41 if (event__preprocess_sample(event, session, &al, NULL) < 0) {
49 pr_warning("problem processing %d event, skipping it.\n", 42 pr_warning("problem processing %d event, skipping it.\n",
@@ -51,27 +44,27 @@ static int diff__process_sample_event(event_t *event, struct perf_session *sessi
51 return -1; 44 return -1;
52 } 45 }
53 46
54 if (al.filtered) 47 if (al.filtered || al.sym == NULL)
55 return 0; 48 return 0;
56 49
57 event__parse_sample(event, session->sample_type, &data); 50 event__parse_sample(event, session->sample_type, &data);
58 51
59 if (al.sym && perf_session__add_hist_entry(session, &al, data.period)) { 52 if (hists__add_entry(&session->hists, &al, data.period)) {
60 pr_warning("problem incrementing symbol count, skipping event\n"); 53 pr_warning("problem incrementing symbol period, skipping event\n");
61 return -1; 54 return -1;
62 } 55 }
63 56
64 session->events_stats.total += data.period; 57 session->hists.stats.total_period += data.period;
65 return 0; 58 return 0;
66} 59}
67 60
68static struct perf_event_ops event_ops = { 61static struct perf_event_ops event_ops = {
69 .process_sample_event = diff__process_sample_event, 62 .sample = diff__process_sample_event,
70 .process_mmap_event = event__process_mmap, 63 .mmap = event__process_mmap,
71 .process_comm_event = event__process_comm, 64 .comm = event__process_comm,
72 .process_exit_event = event__process_task, 65 .exit = event__process_task,
73 .process_fork_event = event__process_task, 66 .fork = event__process_task,
74 .process_lost_event = event__process_lost, 67 .lost = event__process_lost,
75}; 68};
76 69
77static void perf_session__insert_hist_entry_by_name(struct rb_root *root, 70static void perf_session__insert_hist_entry_by_name(struct rb_root *root,
@@ -82,84 +75,69 @@ static void perf_session__insert_hist_entry_by_name(struct rb_root *root,
82 struct hist_entry *iter; 75 struct hist_entry *iter;
83 76
84 while (*p != NULL) { 77 while (*p != NULL) {
85 int cmp;
86 parent = *p; 78 parent = *p;
87 iter = rb_entry(parent, struct hist_entry, rb_node); 79 iter = rb_entry(parent, struct hist_entry, rb_node);
88 80 if (hist_entry__cmp(he, iter) < 0)
89 cmp = strcmp(he->map->dso->name, iter->map->dso->name);
90 if (cmp > 0)
91 p = &(*p)->rb_left; 81 p = &(*p)->rb_left;
92 else if (cmp < 0) 82 else
93 p = &(*p)->rb_right; 83 p = &(*p)->rb_right;
94 else {
95 cmp = strcmp(he->sym->name, iter->sym->name);
96 if (cmp > 0)
97 p = &(*p)->rb_left;
98 else
99 p = &(*p)->rb_right;
100 }
101 } 84 }
102 85
103 rb_link_node(&he->rb_node, parent, p); 86 rb_link_node(&he->rb_node, parent, p);
104 rb_insert_color(&he->rb_node, root); 87 rb_insert_color(&he->rb_node, root);
105} 88}
106 89
107static void perf_session__resort_by_name(struct perf_session *self) 90static void hists__resort_entries(struct hists *self)
108{ 91{
109 unsigned long position = 1; 92 unsigned long position = 1;
110 struct rb_root tmp = RB_ROOT; 93 struct rb_root tmp = RB_ROOT;
111 struct rb_node *next = rb_first(&self->hists); 94 struct rb_node *next = rb_first(&self->entries);
112 95
113 while (next != NULL) { 96 while (next != NULL) {
114 struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node); 97 struct hist_entry *n = rb_entry(next, struct hist_entry, rb_node);
115 98
116 next = rb_next(&n->rb_node); 99 next = rb_next(&n->rb_node);
117 rb_erase(&n->rb_node, &self->hists); 100 rb_erase(&n->rb_node, &self->entries);
118 n->position = position++; 101 n->position = position++;
119 perf_session__insert_hist_entry_by_name(&tmp, n); 102 perf_session__insert_hist_entry_by_name(&tmp, n);
120 } 103 }
121 104
122 self->hists = tmp; 105 self->entries = tmp;
123} 106}
124 107
125static struct hist_entry * 108static void hists__set_positions(struct hists *self)
126perf_session__find_hist_entry_by_name(struct perf_session *self,
127 struct hist_entry *he)
128{ 109{
129 struct rb_node *n = self->hists.rb_node; 110 hists__output_resort(self);
111 hists__resort_entries(self);
112}
113
114static struct hist_entry *hists__find_entry(struct hists *self,
115 struct hist_entry *he)
116{
117 struct rb_node *n = self->entries.rb_node;
130 118
131 while (n) { 119 while (n) {
132 struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node); 120 struct hist_entry *iter = rb_entry(n, struct hist_entry, rb_node);
133 int cmp = strcmp(he->map->dso->name, iter->map->dso->name); 121 int64_t cmp = hist_entry__cmp(he, iter);
134 122
135 if (cmp > 0) 123 if (cmp < 0)
136 n = n->rb_left; 124 n = n->rb_left;
137 else if (cmp < 0) 125 else if (cmp > 0)
138 n = n->rb_right; 126 n = n->rb_right;
139 else { 127 else
140 cmp = strcmp(he->sym->name, iter->sym->name); 128 return iter;
141 if (cmp > 0)
142 n = n->rb_left;
143 else if (cmp < 0)
144 n = n->rb_right;
145 else
146 return iter;
147 }
148 } 129 }
149 130
150 return NULL; 131 return NULL;
151} 132}
152 133
153static void perf_session__match_hists(struct perf_session *old_session, 134static void hists__match(struct hists *older, struct hists *newer)
154 struct perf_session *new_session)
155{ 135{
156 struct rb_node *nd; 136 struct rb_node *nd;
157 137
158 perf_session__resort_by_name(old_session); 138 for (nd = rb_first(&newer->entries); nd; nd = rb_next(nd)) {
159
160 for (nd = rb_first(&new_session->hists); nd; nd = rb_next(nd)) {
161 struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node); 139 struct hist_entry *pos = rb_entry(nd, struct hist_entry, rb_node);
162 pos->pair = perf_session__find_hist_entry_by_name(old_session, pos); 140 pos->pair = hists__find_entry(older, pos);
163 } 141 }
164} 142}
165 143
@@ -168,8 +146,8 @@ static int __cmd_diff(void)
168 int ret, i; 146 int ret, i;
169 struct perf_session *session[2]; 147 struct perf_session *session[2];
170 148
171 session[0] = perf_session__new(input_old, O_RDONLY, force); 149 session[0] = perf_session__new(input_old, O_RDONLY, force, false);
172 session[1] = perf_session__new(input_new, O_RDONLY, force); 150 session[1] = perf_session__new(input_new, O_RDONLY, force, false);
173 if (session[0] == NULL || session[1] == NULL) 151 if (session[0] == NULL || session[1] == NULL)
174 return -ENOMEM; 152 return -ENOMEM;
175 153
@@ -177,12 +155,15 @@ static int __cmd_diff(void)
177 ret = perf_session__process_events(session[i], &event_ops); 155 ret = perf_session__process_events(session[i], &event_ops);
178 if (ret) 156 if (ret)
179 goto out_delete; 157 goto out_delete;
180 perf_session__output_resort(session[i], session[i]->events_stats.total);
181 } 158 }
182 159
183 perf_session__match_hists(session[0], session[1]); 160 hists__output_resort(&session[1]->hists);
184 perf_session__fprintf_hists(session[1], session[0], 161 if (show_displacement)
185 show_displacement, stdout); 162 hists__set_positions(&session[0]->hists);
163
164 hists__match(&session[0]->hists, &session[1]->hists);
165 hists__fprintf(&session[1]->hists, &session[0]->hists,
166 show_displacement, stdout);
186out_delete: 167out_delete:
187 for (i = 0; i < 2; ++i) 168 for (i = 0; i < 2; ++i)
188 perf_session__delete(session[i]); 169 perf_session__delete(session[i]);
@@ -195,7 +176,7 @@ static const char * const diff_usage[] = {
195}; 176};
196 177
197static const struct option options[] = { 178static const struct option options[] = {
198 OPT_BOOLEAN('v', "verbose", &verbose, 179 OPT_INCR('v', "verbose", &verbose,
199 "be more verbose (show symbol address, etc)"), 180 "be more verbose (show symbol address, etc)"),
200 OPT_BOOLEAN('m', "displacement", &show_displacement, 181 OPT_BOOLEAN('m', "displacement", &show_displacement,
201 "Show position displacement relative to baseline"), 182 "Show position displacement relative to baseline"),
@@ -204,7 +185,7 @@ static const struct option options[] = {
204 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"), 185 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
205 OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules, 186 OPT_BOOLEAN('m', "modules", &symbol_conf.use_modules,
206 "load module symbols - WARNING: use only with -k and LIVE kernel"), 187 "load module symbols - WARNING: use only with -k and LIVE kernel"),
207 OPT_BOOLEAN('P', "full-paths", &event_ops.full_paths, 188 OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths,
208 "Don't shorten the pathnames taking into account the cwd"), 189 "Don't shorten the pathnames taking into account the cwd"),
209 OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", 190 OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
210 "only consider symbols in these dsos"), 191 "only consider symbols in these dsos"),
@@ -232,6 +213,10 @@ int cmd_diff(int argc, const char **argv, const char *prefix __used)
232 input_new = argv[1]; 213 input_new = argv[1];
233 } else 214 } else
234 input_new = argv[0]; 215 input_new = argv[0];
216 } else if (symbol_conf.default_guest_vmlinux_name ||
217 symbol_conf.default_guest_kallsyms) {
218 input_old = "perf.data.host";
219 input_new = "perf.data.guest";
235 } 220 }
236 221
237 symbol_conf.exclude_other = false; 222 symbol_conf.exclude_other = false;
diff --git a/tools/perf/builtin-help.c b/tools/perf/builtin-help.c
index 9f810b17c25c..6d5a8a7faf48 100644
--- a/tools/perf/builtin-help.c
+++ b/tools/perf/builtin-help.c
@@ -29,14 +29,14 @@ enum help_format {
29 HELP_FORMAT_WEB, 29 HELP_FORMAT_WEB,
30}; 30};
31 31
32static int show_all = 0; 32static bool show_all = false;
33static enum help_format help_format = HELP_FORMAT_MAN; 33static enum help_format help_format = HELP_FORMAT_MAN;
34static struct option builtin_help_options[] = { 34static struct option builtin_help_options[] = {
35 OPT_BOOLEAN('a', "all", &show_all, "print all available commands"), 35 OPT_BOOLEAN('a', "all", &show_all, "print all available commands"),
36 OPT_SET_INT('m', "man", &help_format, "show man page", HELP_FORMAT_MAN), 36 OPT_SET_UINT('m', "man", &help_format, "show man page", HELP_FORMAT_MAN),
37 OPT_SET_INT('w', "web", &help_format, "show manual in web browser", 37 OPT_SET_UINT('w', "web", &help_format, "show manual in web browser",
38 HELP_FORMAT_WEB), 38 HELP_FORMAT_WEB),
39 OPT_SET_INT('i', "info", &help_format, "show info page", 39 OPT_SET_UINT('i', "info", &help_format, "show info page",
40 HELP_FORMAT_INFO), 40 HELP_FORMAT_INFO),
41 OPT_END(), 41 OPT_END(),
42}; 42};
@@ -286,8 +286,7 @@ void list_common_cmds_help(void)
286 286
287 puts(" The most commonly used perf commands are:"); 287 puts(" The most commonly used perf commands are:");
288 for (i = 0; i < ARRAY_SIZE(common_cmds); i++) { 288 for (i = 0; i < ARRAY_SIZE(common_cmds); i++) {
289 printf(" %s ", common_cmds[i].name); 289 printf(" %-*s ", longest, common_cmds[i].name);
290 mput_char(' ', longest - strlen(common_cmds[i].name));
291 puts(common_cmds[i].help); 290 puts(common_cmds[i].help);
292 } 291 }
293} 292}
@@ -314,8 +313,6 @@ static const char *cmd_to_page(const char *perf_cmd)
314 return "perf"; 313 return "perf";
315 else if (!prefixcmp(perf_cmd, "perf")) 314 else if (!prefixcmp(perf_cmd, "perf"))
316 return perf_cmd; 315 return perf_cmd;
317 else if (is_perf_command(perf_cmd))
318 return prepend("perf-", perf_cmd);
319 else 316 else
320 return prepend("perf-", perf_cmd); 317 return prepend("perf-", perf_cmd);
321} 318}
diff --git a/tools/perf/builtin-inject.c b/tools/perf/builtin-inject.c
new file mode 100644
index 000000000000..8e3e47b064ce
--- /dev/null
+++ b/tools/perf/builtin-inject.c
@@ -0,0 +1,228 @@
1/*
2 * builtin-inject.c
3 *
4 * Builtin inject command: Examine the live mode (stdin) event stream
5 * and repipe it to stdout while optionally injecting additional
6 * events into it.
7 */
8#include "builtin.h"
9
10#include "perf.h"
11#include "util/session.h"
12#include "util/debug.h"
13
14#include "util/parse-options.h"
15
/* Name of the event stream handed to perf_session__new(); defaults to "-". */
static const char *input_name = "-";

/* Set by the -b/--build-ids command line option. */
static bool inject_build_ids;
18
19static int event__repipe(event_t *event __used,
20 struct perf_session *session __used)
21{
22 uint32_t size;
23 void *buf = event;
24
25 size = event->header.size;
26
27 while (size) {
28 int ret = write(STDOUT_FILENO, buf, size);
29 if (ret < 0)
30 return -errno;
31
32 size -= ret;
33 buf += ret;
34 }
35
36 return 0;
37}
38
39static int event__repipe_mmap(event_t *self, struct perf_session *session)
40{
41 int err;
42
43 err = event__process_mmap(self, session);
44 event__repipe(self, session);
45
46 return err;
47}
48
49static int event__repipe_task(event_t *self, struct perf_session *session)
50{
51 int err;
52
53 err = event__process_task(self, session);
54 event__repipe(self, session);
55
56 return err;
57}
58
59static int event__repipe_tracing_data(event_t *self,
60 struct perf_session *session)
61{
62 int err;
63
64 event__repipe(self, session);
65 err = event__process_tracing_data(self, session);
66
67 return err;
68}
69
70static int dso__read_build_id(struct dso *self)
71{
72 if (self->has_build_id)
73 return 0;
74
75 if (filename__read_build_id(self->long_name, self->build_id,
76 sizeof(self->build_id)) > 0) {
77 self->has_build_id = true;
78 return 0;
79 }
80
81 return -1;
82}
83
84static int dso__inject_build_id(struct dso *self, struct perf_session *session)
85{
86 u16 misc = PERF_RECORD_MISC_USER;
87 struct machine *machine;
88 int err;
89
90 if (dso__read_build_id(self) < 0) {
91 pr_debug("no build_id found for %s\n", self->long_name);
92 return -1;
93 }
94
95 machine = perf_session__find_host_machine(session);
96 if (machine == NULL) {
97 pr_err("Can't find machine for session\n");
98 return -1;
99 }
100
101 if (self->kernel)
102 misc = PERF_RECORD_MISC_KERNEL;
103
104 err = event__synthesize_build_id(self, misc, event__repipe,
105 machine, session);
106 if (err) {
107 pr_err("Can't synthesize build_id event for %s\n", self->long_name);
108 return -1;
109 }
110
111 return 0;
112}
113
114static int event__inject_buildid(event_t *event, struct perf_session *session)
115{
116 struct addr_location al;
117 struct thread *thread;
118 u8 cpumode;
119
120 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
121
122 thread = perf_session__findnew(session, event->ip.pid);
123 if (thread == NULL) {
124 pr_err("problem processing %d event, skipping it.\n",
125 event->header.type);
126 goto repipe;
127 }
128
129 thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION,
130 event->ip.pid, event->ip.ip, &al);
131
132 if (al.map != NULL) {
133 if (!al.map->dso->hit) {
134 al.map->dso->hit = 1;
135 if (map__load(al.map, NULL) >= 0) {
136 dso__inject_build_id(al.map->dso, session);
137 /*
138 * If this fails, too bad, let the other side
139 * account this as unresolved.
140 */
141 } else
142 pr_warning("no symbols found in %s, maybe "
143 "install a debug package?\n",
144 al.map->dso->long_name);
145 }
146 }
147
148repipe:
149 event__repipe(event, session);
150 return 0;
151}
152
153struct perf_event_ops inject_ops = {
154 .sample = event__repipe,
155 .mmap = event__repipe,
156 .comm = event__repipe,
157 .fork = event__repipe,
158 .exit = event__repipe,
159 .lost = event__repipe,
160 .read = event__repipe,
161 .throttle = event__repipe,
162 .unthrottle = event__repipe,
163 .attr = event__repipe,
164 .event_type = event__repipe,
165 .tracing_data = event__repipe,
166 .build_id = event__repipe,
167};
168
/* Flag defined outside this file; set from the signal handler below. */
extern volatile int session_done;

/* Signal handler: only raises session_done, the signal number is ignored. */
static void sig_handler(int sig __attribute__((__unused__)))
{
	session_done = 1;
}
175
176static int __cmd_inject(void)
177{
178 struct perf_session *session;
179 int ret = -EINVAL;
180
181 signal(SIGINT, sig_handler);
182
183 if (inject_build_ids) {
184 inject_ops.sample = event__inject_buildid;
185 inject_ops.mmap = event__repipe_mmap;
186 inject_ops.fork = event__repipe_task;
187 inject_ops.tracing_data = event__repipe_tracing_data;
188 }
189
190 session = perf_session__new(input_name, O_RDONLY, false, true);
191 if (session == NULL)
192 return -ENOMEM;
193
194 ret = perf_session__process_events(session, &inject_ops);
195
196 perf_session__delete(session);
197
198 return ret;
199}
200
201static const char * const report_usage[] = {
202 "perf inject [<options>]",
203 NULL
204};
205
206static const struct option options[] = {
207 OPT_BOOLEAN('b', "build-ids", &inject_build_ids,
208 "Inject build-ids into the output stream"),
209 OPT_INCR('v', "verbose", &verbose,
210 "be more verbose (show build ids, etc)"),
211 OPT_END()
212};
213
214int cmd_inject(int argc, const char **argv, const char *prefix __used)
215{
216 argc = parse_options(argc, argv, options, report_usage, 0);
217
218 /*
219 * Any (unrecognized) arguments left?
220 */
221 if (argc)
222 usage_with_options(report_usage, options);
223
224 if (symbol__init() < 0)
225 return -1;
226
227 return __cmd_inject();
228}
diff --git a/tools/perf/builtin-kmem.c b/tools/perf/builtin-kmem.c
index 93c67bf53d2c..31f60a2535e0 100644
--- a/tools/perf/builtin-kmem.c
+++ b/tools/perf/builtin-kmem.c
@@ -92,23 +92,18 @@ static void setup_cpunode_map(void)
92 if (!dir1) 92 if (!dir1)
93 return; 93 return;
94 94
95 while (true) { 95 while ((dent1 = readdir(dir1)) != NULL) {
96 dent1 = readdir(dir1); 96 if (dent1->d_type != DT_DIR ||
97 if (!dent1) 97 sscanf(dent1->d_name, "node%u", &mem) < 1)
98 break;
99
100 if (sscanf(dent1->d_name, "node%u", &mem) < 1)
101 continue; 98 continue;
102 99
103 snprintf(buf, PATH_MAX, "%s/%s", PATH_SYS_NODE, dent1->d_name); 100 snprintf(buf, PATH_MAX, "%s/%s", PATH_SYS_NODE, dent1->d_name);
104 dir2 = opendir(buf); 101 dir2 = opendir(buf);
105 if (!dir2) 102 if (!dir2)
106 continue; 103 continue;
107 while (true) { 104 while ((dent2 = readdir(dir2)) != NULL) {
108 dent2 = readdir(dir2); 105 if (dent2->d_type != DT_LNK ||
109 if (!dent2) 106 sscanf(dent2->d_name, "cpu%u", &cpu) < 1)
110 break;
111 if (sscanf(dent2->d_name, "cpu%u", &cpu) < 1)
112 continue; 107 continue;
113 cpunode_map[cpu] = mem; 108 cpunode_map[cpu] = mem;
114 } 109 }
@@ -321,11 +316,8 @@ static int process_sample_event(event_t *event, struct perf_session *session)
321 316
322 event__parse_sample(event, session->sample_type, &data); 317 event__parse_sample(event, session->sample_type, &data);
323 318
324 dump_printf("(IP, %d): %d/%d: %p period: %Ld\n", 319 dump_printf("(IP, %d): %d/%d: %#Lx period: %Ld\n", event->header.misc,
325 event->header.misc, 320 data.pid, data.tid, data.ip, data.period);
326 data.pid, data.tid,
327 (void *)(long)data.ip,
328 (long long)data.period);
329 321
330 thread = perf_session__findnew(session, event->ip.pid); 322 thread = perf_session__findnew(session, event->ip.pid);
331 if (thread == NULL) { 323 if (thread == NULL) {
@@ -342,22 +334,10 @@ static int process_sample_event(event_t *event, struct perf_session *session)
342 return 0; 334 return 0;
343} 335}
344 336
345static int sample_type_check(struct perf_session *session)
346{
347 if (!(session->sample_type & PERF_SAMPLE_RAW)) {
348 fprintf(stderr,
349 "No trace sample to read. Did you call perf record "
350 "without -R?");
351 return -1;
352 }
353
354 return 0;
355}
356
357static struct perf_event_ops event_ops = { 337static struct perf_event_ops event_ops = {
358 .process_sample_event = process_sample_event, 338 .sample = process_sample_event,
359 .process_comm_event = event__process_comm, 339 .comm = event__process_comm,
360 .sample_type_check = sample_type_check, 340 .ordered_samples = true,
361}; 341};
362 342
363static double fragmentation(unsigned long n_req, unsigned long n_alloc) 343static double fragmentation(unsigned long n_req, unsigned long n_alloc)
@@ -372,6 +352,7 @@ static void __print_result(struct rb_root *root, struct perf_session *session,
372 int n_lines, int is_caller) 352 int n_lines, int is_caller)
373{ 353{
374 struct rb_node *next; 354 struct rb_node *next;
355 struct machine *machine;
375 356
376 printf("%.102s\n", graph_dotted_line); 357 printf("%.102s\n", graph_dotted_line);
377 printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr"); 358 printf(" %-34s |", is_caller ? "Callsite": "Alloc Ptr");
@@ -380,23 +361,29 @@ static void __print_result(struct rb_root *root, struct perf_session *session,
380 361
381 next = rb_first(root); 362 next = rb_first(root);
382 363
364 machine = perf_session__find_host_machine(session);
365 if (!machine) {
366 pr_err("__print_result: couldn't find kernel information\n");
367 return;
368 }
383 while (next && n_lines--) { 369 while (next && n_lines--) {
384 struct alloc_stat *data = rb_entry(next, struct alloc_stat, 370 struct alloc_stat *data = rb_entry(next, struct alloc_stat,
385 node); 371 node);
386 struct symbol *sym = NULL; 372 struct symbol *sym = NULL;
373 struct map *map;
387 char buf[BUFSIZ]; 374 char buf[BUFSIZ];
388 u64 addr; 375 u64 addr;
389 376
390 if (is_caller) { 377 if (is_caller) {
391 addr = data->call_site; 378 addr = data->call_site;
392 if (!raw_ip) 379 if (!raw_ip)
393 sym = map_groups__find_function(&session->kmaps, session, addr, NULL); 380 sym = machine__find_kernel_function(machine, addr, &map, NULL);
394 } else 381 } else
395 addr = data->ptr; 382 addr = data->ptr;
396 383
397 if (sym != NULL) 384 if (sym != NULL)
398 snprintf(buf, sizeof(buf), "%s+%Lx", sym->name, 385 snprintf(buf, sizeof(buf), "%s+%Lx", sym->name,
399 addr - sym->start); 386 addr - map->unmap_ip(map, sym->start));
400 else 387 else
401 snprintf(buf, sizeof(buf), "%#Lx", addr); 388 snprintf(buf, sizeof(buf), "%#Lx", addr);
402 printf(" %-34s |", buf); 389 printf(" %-34s |", buf);
@@ -504,11 +491,17 @@ static void sort_result(void)
504 491
505static int __cmd_kmem(void) 492static int __cmd_kmem(void)
506{ 493{
507 int err; 494 int err = -EINVAL;
508 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); 495 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false);
509 if (session == NULL) 496 if (session == NULL)
510 return -ENOMEM; 497 return -ENOMEM;
511 498
499 if (perf_session__create_kernel_maps(session) < 0)
500 goto out_delete;
501
502 if (!perf_session__has_traces(session, "kmem record"))
503 goto out_delete;
504
512 setup_pager(); 505 setup_pager();
513 err = perf_session__process_events(session, &event_ops); 506 err = perf_session__process_events(session, &event_ops);
514 if (err != 0) 507 if (err != 0)
@@ -736,7 +729,6 @@ static const char *record_args[] = {
736 "record", 729 "record",
737 "-a", 730 "-a",
738 "-R", 731 "-R",
739 "-M",
740 "-f", 732 "-f",
741 "-c", "1", 733 "-c", "1",
742 "-e", "kmem:kmalloc", 734 "-e", "kmem:kmalloc",
diff --git a/tools/perf/builtin-kvm.c b/tools/perf/builtin-kvm.c
new file mode 100644
index 000000000000..34d1e853829d
--- /dev/null
+++ b/tools/perf/builtin-kvm.c
@@ -0,0 +1,144 @@
1#include "builtin.h"
2#include "perf.h"
3
4#include "util/util.h"
5#include "util/cache.h"
6#include "util/symbol.h"
7#include "util/thread.h"
8#include "util/header.h"
9#include "util/session.h"
10
11#include "util/parse-options.h"
12#include "util/trace-event.h"
13
14#include "util/debug.h"
15
16#include <sys/prctl.h>
17
18#include <semaphore.h>
19#include <pthread.h>
20#include <math.h>
21
/* File name set by -i/--input or -o/--output; NULL until one is chosen. */
static const char *file_name;
/* Storage for the default file name picked by cmd_kvm(). */
static char name_buffer[256];

/* Host/guest selection flags; cmd_kvm() clears both before parsing options. */
bool perf_host = 1;
bool perf_guest;

/* Usage lines passed to parse_options() and usage_with_options(). */
static const char * const kvm_usage[] = {
	"perf kvm [<options>] {top|record|report|diff|buildid-list}",
	NULL
};
32
33static const struct option kvm_options[] = {
34 OPT_STRING('i', "input", &file_name, "file",
35 "Input file name"),
36 OPT_STRING('o', "output", &file_name, "file",
37 "Output file name"),
38 OPT_BOOLEAN(0, "guest", &perf_guest,
39 "Collect guest os data"),
40 OPT_BOOLEAN(0, "host", &perf_host,
41 "Collect guest os data"),
42 OPT_STRING(0, "guestmount", &symbol_conf.guestmount, "directory",
43 "guest mount directory under which every guest os"
44 " instance has a subdir"),
45 OPT_STRING(0, "guestvmlinux", &symbol_conf.default_guest_vmlinux_name,
46 "file", "file saving guest os vmlinux"),
47 OPT_STRING(0, "guestkallsyms", &symbol_conf.default_guest_kallsyms,
48 "file", "file saving guest os /proc/kallsyms"),
49 OPT_STRING(0, "guestmodules", &symbol_conf.default_guest_modules,
50 "file", "file saving guest os /proc/modules"),
51 OPT_END()
52};
53
54static int __cmd_record(int argc, const char **argv)
55{
56 int rec_argc, i = 0, j;
57 const char **rec_argv;
58
59 rec_argc = argc + 2;
60 rec_argv = calloc(rec_argc + 1, sizeof(char *));
61 rec_argv[i++] = strdup("record");
62 rec_argv[i++] = strdup("-o");
63 rec_argv[i++] = strdup(file_name);
64 for (j = 1; j < argc; j++, i++)
65 rec_argv[i] = argv[j];
66
67 BUG_ON(i != rec_argc);
68
69 return cmd_record(i, rec_argv, NULL);
70}
71
72static int __cmd_report(int argc, const char **argv)
73{
74 int rec_argc, i = 0, j;
75 const char **rec_argv;
76
77 rec_argc = argc + 2;
78 rec_argv = calloc(rec_argc + 1, sizeof(char *));
79 rec_argv[i++] = strdup("report");
80 rec_argv[i++] = strdup("-i");
81 rec_argv[i++] = strdup(file_name);
82 for (j = 1; j < argc; j++, i++)
83 rec_argv[i] = argv[j];
84
85 BUG_ON(i != rec_argc);
86
87 return cmd_report(i, rec_argv, NULL);
88}
89
90static int __cmd_buildid_list(int argc, const char **argv)
91{
92 int rec_argc, i = 0, j;
93 const char **rec_argv;
94
95 rec_argc = argc + 2;
96 rec_argv = calloc(rec_argc + 1, sizeof(char *));
97 rec_argv[i++] = strdup("buildid-list");
98 rec_argv[i++] = strdup("-i");
99 rec_argv[i++] = strdup(file_name);
100 for (j = 1; j < argc; j++, i++)
101 rec_argv[i] = argv[j];
102
103 BUG_ON(i != rec_argc);
104
105 return cmd_buildid_list(i, rec_argv, NULL);
106}
107
108int cmd_kvm(int argc, const char **argv, const char *prefix __used)
109{
110 perf_host = perf_guest = 0;
111
112 argc = parse_options(argc, argv, kvm_options, kvm_usage,
113 PARSE_OPT_STOP_AT_NON_OPTION);
114 if (!argc)
115 usage_with_options(kvm_usage, kvm_options);
116
117 if (!perf_host)
118 perf_guest = 1;
119
120 if (!file_name) {
121 if (perf_host && !perf_guest)
122 sprintf(name_buffer, "perf.data.host");
123 else if (!perf_host && perf_guest)
124 sprintf(name_buffer, "perf.data.guest");
125 else
126 sprintf(name_buffer, "perf.data.kvm");
127 file_name = name_buffer;
128 }
129
130 if (!strncmp(argv[0], "rec", 3))
131 return __cmd_record(argc, argv);
132 else if (!strncmp(argv[0], "rep", 3))
133 return __cmd_report(argc, argv);
134 else if (!strncmp(argv[0], "diff", 4))
135 return cmd_diff(argc, argv, NULL);
136 else if (!strncmp(argv[0], "top", 3))
137 return cmd_top(argc, argv, NULL);
138 else if (!strncmp(argv[0], "buildid-list", 12))
139 return __cmd_buildid_list(argc, argv);
140 else
141 usage_with_options(kvm_usage, kvm_options);
142
143 return 0;
144}
diff --git a/tools/perf/builtin-lock.c b/tools/perf/builtin-lock.c
new file mode 100644
index 000000000000..821c1586a22b
--- /dev/null
+++ b/tools/perf/builtin-lock.c
@@ -0,0 +1,1005 @@
1#include "builtin.h"
2#include "perf.h"
3
4#include "util/util.h"
5#include "util/cache.h"
6#include "util/symbol.h"
7#include "util/thread.h"
8#include "util/header.h"
9
10#include "util/parse-options.h"
11#include "util/trace-event.h"
12
13#include "util/debug.h"
14#include "util/session.h"
15
16#include <sys/types.h>
17#include <sys/prctl.h>
18#include <semaphore.h>
19#include <pthread.h>
20#include <math.h>
21#include <limits.h>
22
23#include <linux/list.h>
24#include <linux/hash.h>
25
26static struct perf_session *session;
27
28/* based on kernel/lockdep.c */
29#define LOCKHASH_BITS 12
30#define LOCKHASH_SIZE (1UL << LOCKHASH_BITS)
31
32static struct list_head lockhash_table[LOCKHASH_SIZE];
33
34#define __lockhashfn(key) hash_long((unsigned long)key, LOCKHASH_BITS)
35#define lockhashentry(key) (lockhash_table + __lockhashfn((key)))
36
37struct lock_stat {
38 struct list_head hash_entry;
39 struct rb_node rb; /* used for sorting */
40
41 /*
42 * FIXME: raw_field_value() returns unsigned long long,
43 * so address of lockdep_map should be dealed as 64bit.
44 * Is there more better solution?
45 */
46 void *addr; /* address of lockdep_map, used as ID */
47 char *name; /* for strcpy(), we cannot use const */
48
49 unsigned int nr_acquire;
50 unsigned int nr_acquired;
51 unsigned int nr_contended;
52 unsigned int nr_release;
53
54 unsigned int nr_readlock;
55 unsigned int nr_trylock;
56 /* these times are in nano sec. */
57 u64 wait_time_total;
58 u64 wait_time_min;
59 u64 wait_time_max;
60
61 int discard; /* flag of blacklist */
62};
63
/*
 * States of lock_seq_stat
 *
 * UNINITIALIZED is needed to detect the first event seen for a lock.
 * By the nature of lock events there is no guarantee that the first
 * event for a lock is an acquire; it can just as well be acquired,
 * contended or release.
 */
#define SEQ_STATE_UNINITIALIZED		0	/* initial state */
#define SEQ_STATE_RELEASED		1
#define SEQ_STATE_ACQUIRING		2
#define SEQ_STATE_ACQUIRED		3
#define SEQ_STATE_READ_ACQUIRED		4
#define SEQ_STATE_CONTENDED		5

/*
 * MAX_LOCK_DEPTH
 * Imported from include/linux/sched.h.
 * Should this be synchronized?
 */
#define MAX_LOCK_DEPTH			48
85
86/*
87 * struct lock_seq_stat:
88 * Place to put on state of one lock sequence
89 * 1) acquire -> acquired -> release
90 * 2) acquire -> contended -> acquired -> release
91 * 3) acquire (with read or try) -> release
92 * 4) Are there other patterns?
93 */
94struct lock_seq_stat {
95 struct list_head list;
96 int state;
97 u64 prev_event_time;
98 void *addr;
99
100 int read_count;
101};
102
103struct thread_stat {
104 struct rb_node rb;
105
106 u32 tid;
107 struct list_head seq_list;
108};
109
110static struct rb_root thread_stats;
111
112static struct thread_stat *thread_stat_find(u32 tid)
113{
114 struct rb_node *node;
115 struct thread_stat *st;
116
117 node = thread_stats.rb_node;
118 while (node) {
119 st = container_of(node, struct thread_stat, rb);
120 if (st->tid == tid)
121 return st;
122 else if (tid < st->tid)
123 node = node->rb_left;
124 else
125 node = node->rb_right;
126 }
127
128 return NULL;
129}
130
131static void thread_stat_insert(struct thread_stat *new)
132{
133 struct rb_node **rb = &thread_stats.rb_node;
134 struct rb_node *parent = NULL;
135 struct thread_stat *p;
136
137 while (*rb) {
138 p = container_of(*rb, struct thread_stat, rb);
139 parent = *rb;
140
141 if (new->tid < p->tid)
142 rb = &(*rb)->rb_left;
143 else if (new->tid > p->tid)
144 rb = &(*rb)->rb_right;
145 else
146 BUG_ON("inserting invalid thread_stat\n");
147 }
148
149 rb_link_node(&new->rb, parent, rb);
150 rb_insert_color(&new->rb, &thread_stats);
151}
152
153static struct thread_stat *thread_stat_findnew_after_first(u32 tid)
154{
155 struct thread_stat *st;
156
157 st = thread_stat_find(tid);
158 if (st)
159 return st;
160
161 st = zalloc(sizeof(struct thread_stat));
162 if (!st)
163 die("memory allocation failed\n");
164
165 st->tid = tid;
166 INIT_LIST_HEAD(&st->seq_list);
167
168 thread_stat_insert(st);
169
170 return st;
171}
172
173static struct thread_stat *thread_stat_findnew_first(u32 tid);
174static struct thread_stat *(*thread_stat_findnew)(u32 tid) =
175 thread_stat_findnew_first;
176
177static struct thread_stat *thread_stat_findnew_first(u32 tid)
178{
179 struct thread_stat *st;
180
181 st = zalloc(sizeof(struct thread_stat));
182 if (!st)
183 die("memory allocation failed\n");
184 st->tid = tid;
185 INIT_LIST_HEAD(&st->seq_list);
186
187 rb_link_node(&st->rb, NULL, &thread_stats.rb_node);
188 rb_insert_color(&st->rb, &thread_stats);
189
190 thread_stat_findnew = thread_stat_findnew_after_first;
191 return st;
192}
193
194/* build simple key function one is bigger than two */
195#define SINGLE_KEY(member) \
196 static int lock_stat_key_ ## member(struct lock_stat *one, \
197 struct lock_stat *two) \
198 { \
199 return one->member > two->member; \
200 }
201
202SINGLE_KEY(nr_acquired)
203SINGLE_KEY(nr_contended)
204SINGLE_KEY(wait_time_total)
205SINGLE_KEY(wait_time_min)
206SINGLE_KEY(wait_time_max)
207
208struct lock_key {
209 /*
210 * name: the value for specify by user
211 * this should be simpler than raw name of member
212 * e.g. nr_acquired -> acquired, wait_time_total -> wait_total
213 */
214 const char *name;
215 int (*key)(struct lock_stat*, struct lock_stat*);
216};
217
218static const char *sort_key = "acquired";
219
220static int (*compare)(struct lock_stat *, struct lock_stat *);
221
222static struct rb_root result; /* place to store sorted data */
223
224#define DEF_KEY_LOCK(name, fn_suffix) \
225 { #name, lock_stat_key_ ## fn_suffix }
226struct lock_key keys[] = {
227 DEF_KEY_LOCK(acquired, nr_acquired),
228 DEF_KEY_LOCK(contended, nr_contended),
229 DEF_KEY_LOCK(wait_total, wait_time_total),
230 DEF_KEY_LOCK(wait_min, wait_time_min),
231 DEF_KEY_LOCK(wait_max, wait_time_max),
232
233 /* extra comparisons much complicated should be here */
234
235 { NULL, NULL }
236};
237
238static void select_key(void)
239{
240 int i;
241
242 for (i = 0; keys[i].name; i++) {
243 if (!strcmp(keys[i].name, sort_key)) {
244 compare = keys[i].key;
245 return;
246 }
247 }
248
249 die("Unknown compare key:%s\n", sort_key);
250}
251
252static void insert_to_result(struct lock_stat *st,
253 int (*bigger)(struct lock_stat *, struct lock_stat *))
254{
255 struct rb_node **rb = &result.rb_node;
256 struct rb_node *parent = NULL;
257 struct lock_stat *p;
258
259 while (*rb) {
260 p = container_of(*rb, struct lock_stat, rb);
261 parent = *rb;
262
263 if (bigger(st, p))
264 rb = &(*rb)->rb_left;
265 else
266 rb = &(*rb)->rb_right;
267 }
268
269 rb_link_node(&st->rb, parent, rb);
270 rb_insert_color(&st->rb, &result);
271}
272
273/* returns left most element of result, and erase it */
274static struct lock_stat *pop_from_result(void)
275{
276 struct rb_node *node = result.rb_node;
277
278 if (!node)
279 return NULL;
280
281 while (node->rb_left)
282 node = node->rb_left;
283
284 rb_erase(node, &result);
285 return container_of(node, struct lock_stat, rb);
286}
287
288static struct lock_stat *lock_stat_findnew(void *addr, const char *name)
289{
290 struct list_head *entry = lockhashentry(addr);
291 struct lock_stat *ret, *new;
292
293 list_for_each_entry(ret, entry, hash_entry) {
294 if (ret->addr == addr)
295 return ret;
296 }
297
298 new = zalloc(sizeof(struct lock_stat));
299 if (!new)
300 goto alloc_failed;
301
302 new->addr = addr;
303 new->name = zalloc(sizeof(char) * strlen(name) + 1);
304 if (!new->name)
305 goto alloc_failed;
306 strcpy(new->name, name);
307
308 new->wait_time_min = ULLONG_MAX;
309
310 list_add(&new->hash_entry, entry);
311 return new;
312
313alloc_failed:
314 die("memory allocation failed\n");
315}
316
317static char const *input_name = "perf.data";
318
319struct raw_event_sample {
320 u32 size;
321 char data[0];
322};
323
324struct trace_acquire_event {
325 void *addr;
326 const char *name;
327 int flag;
328};
329
330struct trace_acquired_event {
331 void *addr;
332 const char *name;
333};
334
335struct trace_contended_event {
336 void *addr;
337 const char *name;
338};
339
340struct trace_release_event {
341 void *addr;
342 const char *name;
343};
344
345struct trace_lock_handler {
346 void (*acquire_event)(struct trace_acquire_event *,
347 struct event *,
348 int cpu,
349 u64 timestamp,
350 struct thread *thread);
351
352 void (*acquired_event)(struct trace_acquired_event *,
353 struct event *,
354 int cpu,
355 u64 timestamp,
356 struct thread *thread);
357
358 void (*contended_event)(struct trace_contended_event *,
359 struct event *,
360 int cpu,
361 u64 timestamp,
362 struct thread *thread);
363
364 void (*release_event)(struct trace_release_event *,
365 struct event *,
366 int cpu,
367 u64 timestamp,
368 struct thread *thread);
369};
370
371static struct lock_seq_stat *get_seq(struct thread_stat *ts, void *addr)
372{
373 struct lock_seq_stat *seq;
374
375 list_for_each_entry(seq, &ts->seq_list, list) {
376 if (seq->addr == addr)
377 return seq;
378 }
379
380 seq = zalloc(sizeof(struct lock_seq_stat));
381 if (!seq)
382 die("Not enough memory\n");
383 seq->state = SEQ_STATE_UNINITIALIZED;
384 seq->addr = addr;
385
386 list_add(&seq->list, &ts->seq_list);
387 return seq;
388}
389
/* Kind of event on which a broken lock sequence was detected. */
enum broken_state {
	BROKEN_ACQUIRE,
	BROKEN_ACQUIRED,
	BROKEN_CONTENDED,
	BROKEN_RELEASE,
	BROKEN_MAX,
};

/* Number of broken sequences seen, indexed by enum broken_state. */
static int bad_hist[BROKEN_MAX];

/* Bits tested in the flag field of an acquire event. */
enum acquire_flags {
	TRY_LOCK	= 1,
	READ_LOCK	= 2,
};
404
405static void
406report_lock_acquire_event(struct trace_acquire_event *acquire_event,
407 struct event *__event __used,
408 int cpu __used,
409 u64 timestamp __used,
410 struct thread *thread __used)
411{
412 struct lock_stat *ls;
413 struct thread_stat *ts;
414 struct lock_seq_stat *seq;
415
416 ls = lock_stat_findnew(acquire_event->addr, acquire_event->name);
417 if (ls->discard)
418 return;
419
420 ts = thread_stat_findnew(thread->pid);
421 seq = get_seq(ts, acquire_event->addr);
422
423 switch (seq->state) {
424 case SEQ_STATE_UNINITIALIZED:
425 case SEQ_STATE_RELEASED:
426 if (!acquire_event->flag) {
427 seq->state = SEQ_STATE_ACQUIRING;
428 } else {
429 if (acquire_event->flag & TRY_LOCK)
430 ls->nr_trylock++;
431 if (acquire_event->flag & READ_LOCK)
432 ls->nr_readlock++;
433 seq->state = SEQ_STATE_READ_ACQUIRED;
434 seq->read_count = 1;
435 ls->nr_acquired++;
436 }
437 break;
438 case SEQ_STATE_READ_ACQUIRED:
439 if (acquire_event->flag & READ_LOCK) {
440 seq->read_count++;
441 ls->nr_acquired++;
442 goto end;
443 } else {
444 goto broken;
445 }
446 break;
447 case SEQ_STATE_ACQUIRED:
448 case SEQ_STATE_ACQUIRING:
449 case SEQ_STATE_CONTENDED:
450broken:
451 /* broken lock sequence, discard it */
452 ls->discard = 1;
453 bad_hist[BROKEN_ACQUIRE]++;
454 list_del(&seq->list);
455 free(seq);
456 goto end;
457 break;
458 default:
459 BUG_ON("Unknown state of lock sequence found!\n");
460 break;
461 }
462
463 ls->nr_acquire++;
464 seq->prev_event_time = timestamp;
465end:
466 return;
467}
468
469static void
470report_lock_acquired_event(struct trace_acquired_event *acquired_event,
471 struct event *__event __used,
472 int cpu __used,
473 u64 timestamp __used,
474 struct thread *thread __used)
475{
476 struct lock_stat *ls;
477 struct thread_stat *ts;
478 struct lock_seq_stat *seq;
479 u64 contended_term;
480
481 ls = lock_stat_findnew(acquired_event->addr, acquired_event->name);
482 if (ls->discard)
483 return;
484
485 ts = thread_stat_findnew(thread->pid);
486 seq = get_seq(ts, acquired_event->addr);
487
488 switch (seq->state) {
489 case SEQ_STATE_UNINITIALIZED:
490 /* orphan event, do nothing */
491 return;
492 case SEQ_STATE_ACQUIRING:
493 break;
494 case SEQ_STATE_CONTENDED:
495 contended_term = timestamp - seq->prev_event_time;
496 ls->wait_time_total += contended_term;
497 if (contended_term < ls->wait_time_min)
498 ls->wait_time_min = contended_term;
499 if (ls->wait_time_max < contended_term)
500 ls->wait_time_max = contended_term;
501 break;
502 case SEQ_STATE_RELEASED:
503 case SEQ_STATE_ACQUIRED:
504 case SEQ_STATE_READ_ACQUIRED:
505 /* broken lock sequence, discard it */
506 ls->discard = 1;
507 bad_hist[BROKEN_ACQUIRED]++;
508 list_del(&seq->list);
509 free(seq);
510 goto end;
511 break;
512
513 default:
514 BUG_ON("Unknown state of lock sequence found!\n");
515 break;
516 }
517
518 seq->state = SEQ_STATE_ACQUIRED;
519 ls->nr_acquired++;
520 seq->prev_event_time = timestamp;
521end:
522 return;
523}
524
525static void
526report_lock_contended_event(struct trace_contended_event *contended_event,
527 struct event *__event __used,
528 int cpu __used,
529 u64 timestamp __used,
530 struct thread *thread __used)
531{
532 struct lock_stat *ls;
533 struct thread_stat *ts;
534 struct lock_seq_stat *seq;
535
536 ls = lock_stat_findnew(contended_event->addr, contended_event->name);
537 if (ls->discard)
538 return;
539
540 ts = thread_stat_findnew(thread->pid);
541 seq = get_seq(ts, contended_event->addr);
542
543 switch (seq->state) {
544 case SEQ_STATE_UNINITIALIZED:
545 /* orphan event, do nothing */
546 return;
547 case SEQ_STATE_ACQUIRING:
548 break;
549 case SEQ_STATE_RELEASED:
550 case SEQ_STATE_ACQUIRED:
551 case SEQ_STATE_READ_ACQUIRED:
552 case SEQ_STATE_CONTENDED:
553 /* broken lock sequence, discard it */
554 ls->discard = 1;
555 bad_hist[BROKEN_CONTENDED]++;
556 list_del(&seq->list);
557 free(seq);
558 goto end;
559 break;
560 default:
561 BUG_ON("Unknown state of lock sequence found!\n");
562 break;
563 }
564
565 seq->state = SEQ_STATE_CONTENDED;
566 ls->nr_contended++;
567 seq->prev_event_time = timestamp;
568end:
569 return;
570}
571
572static void
573report_lock_release_event(struct trace_release_event *release_event,
574 struct event *__event __used,
575 int cpu __used,
576 u64 timestamp __used,
577 struct thread *thread __used)
578{
579 struct lock_stat *ls;
580 struct thread_stat *ts;
581 struct lock_seq_stat *seq;
582
583 ls = lock_stat_findnew(release_event->addr, release_event->name);
584 if (ls->discard)
585 return;
586
587 ts = thread_stat_findnew(thread->pid);
588 seq = get_seq(ts, release_event->addr);
589
590 switch (seq->state) {
591 case SEQ_STATE_UNINITIALIZED:
592 goto end;
593 break;
594 case SEQ_STATE_ACQUIRED:
595 break;
596 case SEQ_STATE_READ_ACQUIRED:
597 seq->read_count--;
598 BUG_ON(seq->read_count < 0);
599 if (!seq->read_count) {
600 ls->nr_release++;
601 goto end;
602 }
603 break;
604 case SEQ_STATE_ACQUIRING:
605 case SEQ_STATE_CONTENDED:
606 case SEQ_STATE_RELEASED:
607 /* broken lock sequence, discard it */
608 ls->discard = 1;
609 bad_hist[BROKEN_RELEASE]++;
610 goto free_seq;
611 break;
612 default:
613 BUG_ON("Unknown state of lock sequence found!\n");
614 break;
615 }
616
617 ls->nr_release++;
618free_seq:
619 list_del(&seq->list);
620 free(seq);
621end:
622 return;
623}
624
625/* lock oriented handlers */
626/* TODO: handlers for CPU oriented, thread oriented */
627static struct trace_lock_handler report_lock_ops = {
628 .acquire_event = report_lock_acquire_event,
629 .acquired_event = report_lock_acquired_event,
630 .contended_event = report_lock_contended_event,
631 .release_event = report_lock_release_event,
632};
633
634static struct trace_lock_handler *trace_handler;
635
636static void
637process_lock_acquire_event(void *data,
638 struct event *event __used,
639 int cpu __used,
640 u64 timestamp __used,
641 struct thread *thread __used)
642{
643 struct trace_acquire_event acquire_event;
644 u64 tmp; /* this is required for casting... */
645
646 tmp = raw_field_value(event, "lockdep_addr", data);
647 memcpy(&acquire_event.addr, &tmp, sizeof(void *));
648 acquire_event.name = (char *)raw_field_ptr(event, "name", data);
649 acquire_event.flag = (int)raw_field_value(event, "flag", data);
650
651 if (trace_handler->acquire_event)
652 trace_handler->acquire_event(&acquire_event, event, cpu, timestamp, thread);
653}
654
655static void
656process_lock_acquired_event(void *data,
657 struct event *event __used,
658 int cpu __used,
659 u64 timestamp __used,
660 struct thread *thread __used)
661{
662 struct trace_acquired_event acquired_event;
663 u64 tmp; /* this is required for casting... */
664
665 tmp = raw_field_value(event, "lockdep_addr", data);
666 memcpy(&acquired_event.addr, &tmp, sizeof(void *));
667 acquired_event.name = (char *)raw_field_ptr(event, "name", data);
668
669 if (trace_handler->acquire_event)
670 trace_handler->acquired_event(&acquired_event, event, cpu, timestamp, thread);
671}
672
673static void
674process_lock_contended_event(void *data,
675 struct event *event __used,
676 int cpu __used,
677 u64 timestamp __used,
678 struct thread *thread __used)
679{
680 struct trace_contended_event contended_event;
681 u64 tmp; /* this is required for casting... */
682
683 tmp = raw_field_value(event, "lockdep_addr", data);
684 memcpy(&contended_event.addr, &tmp, sizeof(void *));
685 contended_event.name = (char *)raw_field_ptr(event, "name", data);
686
687 if (trace_handler->acquire_event)
688 trace_handler->contended_event(&contended_event, event, cpu, timestamp, thread);
689}
690
691static void
692process_lock_release_event(void *data,
693 struct event *event __used,
694 int cpu __used,
695 u64 timestamp __used,
696 struct thread *thread __used)
697{
698 struct trace_release_event release_event;
699 u64 tmp; /* this is required for casting... */
700
701 tmp = raw_field_value(event, "lockdep_addr", data);
702 memcpy(&release_event.addr, &tmp, sizeof(void *));
703 release_event.name = (char *)raw_field_ptr(event, "name", data);
704
705 if (trace_handler->acquire_event)
706 trace_handler->release_event(&release_event, event, cpu, timestamp, thread);
707}
708
709static void
710process_raw_event(void *data, int cpu, u64 timestamp, struct thread *thread)
711{
712 struct event *event;
713 int type;
714
715 type = trace_parse_common_type(data);
716 event = trace_find_event(type);
717
718 if (!strcmp(event->name, "lock_acquire"))
719 process_lock_acquire_event(data, event, cpu, timestamp, thread);
720 if (!strcmp(event->name, "lock_acquired"))
721 process_lock_acquired_event(data, event, cpu, timestamp, thread);
722 if (!strcmp(event->name, "lock_contended"))
723 process_lock_contended_event(data, event, cpu, timestamp, thread);
724 if (!strcmp(event->name, "lock_release"))
725 process_lock_release_event(data, event, cpu, timestamp, thread);
726}
727
728static void print_bad_events(int bad, int total)
729{
730 /* Output for debug, this have to be removed */
731 int i;
732 const char *name[4] =
733 { "acquire", "acquired", "contended", "release" };
734
735 pr_info("\n=== output for debug===\n\n");
736 pr_info("bad: %d, total: %d\n", bad, total);
737 pr_info("bad rate: %f %%\n", (double)bad / (double)total * 100);
738 pr_info("histogram of events caused bad sequence\n");
739 for (i = 0; i < BROKEN_MAX; i++)
740 pr_info(" %10s: %d\n", name[i], bad_hist[i]);
741}
742
743/* TODO: various way to print, coloring, nano or milli sec */
744static void print_result(void)
745{
746 struct lock_stat *st;
747 char cut_name[20];
748 int bad, total;
749
750 pr_info("%20s ", "Name");
751 pr_info("%10s ", "acquired");
752 pr_info("%10s ", "contended");
753
754 pr_info("%15s ", "total wait (ns)");
755 pr_info("%15s ", "max wait (ns)");
756 pr_info("%15s ", "min wait (ns)");
757
758 pr_info("\n\n");
759
760 bad = total = 0;
761 while ((st = pop_from_result())) {
762 total++;
763 if (st->discard) {
764 bad++;
765 continue;
766 }
767 bzero(cut_name, 20);
768
769 if (strlen(st->name) < 16) {
770 /* output raw name */
771 pr_info("%20s ", st->name);
772 } else {
773 strncpy(cut_name, st->name, 16);
774 cut_name[16] = '.';
775 cut_name[17] = '.';
776 cut_name[18] = '.';
777 cut_name[19] = '\0';
778 /* cut off name for saving output style */
779 pr_info("%20s ", cut_name);
780 }
781
782 pr_info("%10u ", st->nr_acquired);
783 pr_info("%10u ", st->nr_contended);
784
785 pr_info("%15llu ", st->wait_time_total);
786 pr_info("%15llu ", st->wait_time_max);
787 pr_info("%15llu ", st->wait_time_min == ULLONG_MAX ?
788 0 : st->wait_time_min);
789 pr_info("\n");
790 }
791
792 print_bad_events(bad, total);
793}
794
/* Set by "perf lock info" -t/--threads and -m/--map respectively. */
static bool info_threads;
static bool info_map;
796
797static void dump_threads(void)
798{
799 struct thread_stat *st;
800 struct rb_node *node;
801 struct thread *t;
802
803 pr_info("%10s: comm\n", "Thread ID");
804
805 node = rb_first(&thread_stats);
806 while (node) {
807 st = container_of(node, struct thread_stat, rb);
808 t = perf_session__findnew(session, st->tid);
809 pr_info("%10d: %s\n", st->tid, t->comm);
810 node = rb_next(node);
811 };
812}
813
814static void dump_map(void)
815{
816 unsigned int i;
817 struct lock_stat *st;
818
819 pr_info("Address of instance: name of class\n");
820 for (i = 0; i < LOCKHASH_SIZE; i++) {
821 list_for_each_entry(st, &lockhash_table[i], hash_entry) {
822 pr_info(" %p: %s\n", st->addr, st->name);
823 }
824 }
825}
826
827static void dump_info(void)
828{
829 if (info_threads)
830 dump_threads();
831 else if (info_map)
832 dump_map();
833 else
834 die("Unknown type of information\n");
835}
836
837static int process_sample_event(event_t *self, struct perf_session *s)
838{
839 struct sample_data data;
840 struct thread *thread;
841
842 bzero(&data, sizeof(data));
843 event__parse_sample(self, s->sample_type, &data);
844
845 thread = perf_session__findnew(s, data.tid);
846 if (thread == NULL) {
847 pr_debug("problem processing %d event, skipping it.\n",
848 self->header.type);
849 return -1;
850 }
851
852 process_raw_event(data.raw_data, data.cpu, data.time, thread);
853
854 return 0;
855}
856
857static struct perf_event_ops eops = {
858 .sample = process_sample_event,
859 .comm = event__process_comm,
860 .ordered_samples = true,
861};
862
863static int read_events(void)
864{
865 session = perf_session__new(input_name, O_RDONLY, 0, false);
866 if (!session)
867 die("Initializing perf session failed\n");
868
869 return perf_session__process_events(session, &eops);
870}
871
872static void sort_result(void)
873{
874 unsigned int i;
875 struct lock_stat *st;
876
877 for (i = 0; i < LOCKHASH_SIZE; i++) {
878 list_for_each_entry(st, &lockhash_table[i], hash_entry) {
879 insert_to_result(st, compare);
880 }
881 }
882}
883
/*
 * "perf lock report": set up the pager, select the sort key, read the
 * recorded events, then sort and print the per-lock statistics.
 */
static void __cmd_report(void)
{
	setup_pager();
	select_key();

	read_events();

	sort_result();
	print_result();
}
892
893static const char * const report_usage[] = {
894 "perf lock report [<options>]",
895 NULL
896};
897
898static const struct option report_options[] = {
899 OPT_STRING('k', "key", &sort_key, "acquired",
900 "key for sorting"),
901 /* TODO: type */
902 OPT_END()
903};
904
905static const char * const info_usage[] = {
906 "perf lock info [<options>]",
907 NULL
908};
909
910static const struct option info_options[] = {
911 OPT_BOOLEAN('t', "threads", &info_threads,
912 "dump thread list in perf.data"),
913 OPT_BOOLEAN('m', "map", &info_map,
914 "map of lock instances (name:address table)"),
915 OPT_END()
916};
917
/*
 * Top-level usage text for "perf lock".  Lists every subcommand that
 * cmd_lock() dispatches on, including "info".
 */
static const char * const lock_usage[] = {
	"perf lock [<options>] {record|trace|report|info}",
	NULL
};
922
923static const struct option lock_options[] = {
924 OPT_STRING('i', "input", &input_name, "file", "input file name"),
925 OPT_INCR('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"),
926 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"),
927 OPT_END()
928};
929
/*
 * Fixed argument vector that __cmd_record() places in front of the
 * user's own arguments when invoking cmd_record(); it selects the four
 * lock tracepoints.
 */
static const char *record_args[] = {
	"record",
	"-R",
	"-f",
	"-m", "1024",
	"-c", "1",
	"-e", "lock:lock_acquire:r",
	"-e", "lock:lock_acquired:r",
	"-e", "lock:lock_contended:r",
	"-e", "lock:lock_release:r",
};
941
942static int __cmd_record(int argc, const char **argv)
943{
944 unsigned int rec_argc, i, j;
945 const char **rec_argv;
946
947 rec_argc = ARRAY_SIZE(record_args) + argc - 1;
948 rec_argv = calloc(rec_argc + 1, sizeof(char *));
949
950 for (i = 0; i < ARRAY_SIZE(record_args); i++)
951 rec_argv[i] = strdup(record_args[i]);
952
953 for (j = 1; j < (unsigned int)argc; j++, i++)
954 rec_argv[i] = argv[j];
955
956 BUG_ON(i != rec_argc);
957
958 return cmd_record(i, rec_argv, NULL);
959}
960
961int cmd_lock(int argc, const char **argv, const char *prefix __used)
962{
963 unsigned int i;
964
965 symbol__init();
966 for (i = 0; i < LOCKHASH_SIZE; i++)
967 INIT_LIST_HEAD(lockhash_table + i);
968
969 argc = parse_options(argc, argv, lock_options, lock_usage,
970 PARSE_OPT_STOP_AT_NON_OPTION);
971 if (!argc)
972 usage_with_options(lock_usage, lock_options);
973
974 if (!strncmp(argv[0], "rec", 3)) {
975 return __cmd_record(argc, argv);
976 } else if (!strncmp(argv[0], "report", 6)) {
977 trace_handler = &report_lock_ops;
978 if (argc) {
979 argc = parse_options(argc, argv,
980 report_options, report_usage, 0);
981 if (argc)
982 usage_with_options(report_usage, report_options);
983 }
984 __cmd_report();
985 } else if (!strcmp(argv[0], "trace")) {
986 /* Aliased to 'perf trace' */
987 return cmd_trace(argc, argv, prefix);
988 } else if (!strcmp(argv[0], "info")) {
989 if (argc) {
990 argc = parse_options(argc, argv,
991 info_options, info_usage, 0);
992 if (argc)
993 usage_with_options(info_usage, info_options);
994 }
995 /* recycling report_lock_ops */
996 trace_handler = &report_lock_ops;
997 setup_pager();
998 read_events();
999 dump_info();
1000 } else {
1001 usage_with_options(lock_usage, lock_options);
1002 }
1003
1004 return 0;
1005}
diff --git a/tools/perf/builtin-probe.c b/tools/perf/builtin-probe.c
index c1e6774fd3ed..e4a4da32a568 100644
--- a/tools/perf/builtin-probe.c
+++ b/tools/perf/builtin-probe.c
@@ -36,51 +36,50 @@
36#include "builtin.h" 36#include "builtin.h"
37#include "util/util.h" 37#include "util/util.h"
38#include "util/strlist.h" 38#include "util/strlist.h"
39#include "util/event.h" 39#include "util/symbol.h"
40#include "util/debug.h" 40#include "util/debug.h"
41#include "util/debugfs.h" 41#include "util/debugfs.h"
42#include "util/symbol.h"
43#include "util/thread.h"
44#include "util/session.h"
45#include "util/parse-options.h" 42#include "util/parse-options.h"
46#include "util/parse-events.h" /* For debugfs_path */
47#include "util/probe-finder.h" 43#include "util/probe-finder.h"
48#include "util/probe-event.h" 44#include "util/probe-event.h"
49 45
50#define MAX_PATH_LEN 256 46#define MAX_PATH_LEN 256
51#define MAX_PROBES 128
52 47
53/* Session management structure */ 48/* Session management structure */
54static struct { 49static struct {
55 bool need_dwarf;
56 bool list_events; 50 bool list_events;
57 bool force_add; 51 bool force_add;
58 int nr_probe; 52 bool show_lines;
59 struct probe_point probes[MAX_PROBES]; 53 int nevents;
54 struct perf_probe_event events[MAX_PROBES];
60 struct strlist *dellist; 55 struct strlist *dellist;
61 struct perf_session *psession; 56 struct line_range line_range;
62 struct map *kmap; 57 int max_probe_points;
63} session; 58} params;
64 59
65 60
66/* Parse an event definition. Note that any error must die. */ 61/* Parse an event definition. Note that any error must die. */
67static void parse_probe_event(const char *str) 62static int parse_probe_event(const char *str)
68{ 63{
69 struct probe_point *pp = &session.probes[session.nr_probe]; 64 struct perf_probe_event *pev = &params.events[params.nevents];
65 int ret;
70 66
71 pr_debug("probe-definition(%d): %s\n", session.nr_probe, str); 67 pr_debug("probe-definition(%d): %s\n", params.nevents, str);
72 if (++session.nr_probe == MAX_PROBES) 68 if (++params.nevents == MAX_PROBES) {
73 die("Too many probes (> %d) are specified.", MAX_PROBES); 69 pr_err("Too many probes (> %d) were specified.", MAX_PROBES);
70 return -1;
71 }
74 72
75 /* Parse perf-probe event into probe_point */ 73 /* Parse a perf-probe command into event */
76 parse_perf_probe_event(str, pp, &session.need_dwarf); 74 ret = parse_perf_probe_command(str, pev);
75 pr_debug("%d arguments\n", pev->nargs);
77 76
78 pr_debug("%d arguments\n", pp->nr_args); 77 return ret;
79} 78}
80 79
81static void parse_probe_event_argv(int argc, const char **argv) 80static int parse_probe_event_argv(int argc, const char **argv)
82{ 81{
83 int i, len; 82 int i, len, ret;
84 char *buf; 83 char *buf;
85 84
86 /* Bind up rest arguments */ 85 /* Bind up rest arguments */
@@ -88,54 +87,48 @@ static void parse_probe_event_argv(int argc, const char **argv)
88 for (i = 0; i < argc; i++) 87 for (i = 0; i < argc; i++)
89 len += strlen(argv[i]) + 1; 88 len += strlen(argv[i]) + 1;
90 buf = zalloc(len + 1); 89 buf = zalloc(len + 1);
91 if (!buf) 90 if (buf == NULL)
92 die("Failed to allocate memory for binding arguments."); 91 return -ENOMEM;
93 len = 0; 92 len = 0;
94 for (i = 0; i < argc; i++) 93 for (i = 0; i < argc; i++)
95 len += sprintf(&buf[len], "%s ", argv[i]); 94 len += sprintf(&buf[len], "%s ", argv[i]);
96 parse_probe_event(buf); 95 ret = parse_probe_event(buf);
97 free(buf); 96 free(buf);
97 return ret;
98} 98}
99 99
100static int opt_add_probe_event(const struct option *opt __used, 100static int opt_add_probe_event(const struct option *opt __used,
101 const char *str, int unset __used) 101 const char *str, int unset __used)
102{ 102{
103 if (str) 103 if (str)
104 parse_probe_event(str); 104 return parse_probe_event(str);
105 return 0; 105 else
106 return 0;
106} 107}
107 108
108static int opt_del_probe_event(const struct option *opt __used, 109static int opt_del_probe_event(const struct option *opt __used,
109 const char *str, int unset __used) 110 const char *str, int unset __used)
110{ 111{
111 if (str) { 112 if (str) {
112 if (!session.dellist) 113 if (!params.dellist)
113 session.dellist = strlist__new(true, NULL); 114 params.dellist = strlist__new(true, NULL);
114 strlist__add(session.dellist, str); 115 strlist__add(params.dellist, str);
115 } 116 }
116 return 0; 117 return 0;
117} 118}
118 119
119/* Currently just checking function name from symbol map */ 120#ifdef DWARF_SUPPORT
120static void evaluate_probe_point(struct probe_point *pp) 121static int opt_show_lines(const struct option *opt __used,
122 const char *str, int unset __used)
121{ 123{
122 struct symbol *sym; 124 int ret = 0;
123 sym = map__find_symbol_by_name(session.kmap, pp->function,
124 session.psession, NULL);
125 if (!sym)
126 die("Kernel symbol \'%s\' not found - probe not added.",
127 pp->function);
128}
129 125
130#ifndef NO_LIBDWARF 126 if (str)
131static int open_vmlinux(void) 127 ret = parse_line_range_desc(str, &params.line_range);
132{ 128 INIT_LIST_HEAD(&params.line_range.line_list);
133 if (map__load(session.kmap, session.psession, NULL) < 0) { 129 params.show_lines = true;
134 pr_debug("Failed to load kernel map.\n"); 130
135 return -EINVAL; 131 return ret;
136 }
137 pr_debug("Try to open %s\n", session.kmap->dso->long_name);
138 return open(session.kmap->dso->long_name, O_RDONLY);
139} 132}
140#endif 133#endif
141 134
@@ -144,54 +137,61 @@ static const char * const probe_usage[] = {
144 "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]", 137 "perf probe [<options>] --add 'PROBEDEF' [--add 'PROBEDEF' ...]",
145 "perf probe [<options>] --del '[GROUP:]EVENT' ...", 138 "perf probe [<options>] --del '[GROUP:]EVENT' ...",
146 "perf probe --list", 139 "perf probe --list",
140#ifdef DWARF_SUPPORT
141 "perf probe --line 'LINEDESC'",
142#endif
147 NULL 143 NULL
148}; 144};
149 145
150static const struct option options[] = { 146static const struct option options[] = {
151 OPT_BOOLEAN('v', "verbose", &verbose, 147 OPT_INCR('v', "verbose", &verbose,
152 "be more verbose (show parsed arguments, etc)"), 148 "be more verbose (show parsed arguments, etc)"),
153#ifndef NO_LIBDWARF 149 OPT_BOOLEAN('l', "list", &params.list_events,
154 OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
155 "file", "vmlinux pathname"),
156#endif
157 OPT_BOOLEAN('l', "list", &session.list_events,
158 "list up current probe events"), 150 "list up current probe events"),
159 OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.", 151 OPT_CALLBACK('d', "del", NULL, "[GROUP:]EVENT", "delete a probe event.",
160 opt_del_probe_event), 152 opt_del_probe_event),
161 OPT_CALLBACK('a', "add", NULL, 153 OPT_CALLBACK('a', "add", NULL,
162#ifdef NO_LIBDWARF 154#ifdef DWARF_SUPPORT
163 "[EVENT=]FUNC[+OFFS|%return] [ARG ...]", 155 "[EVENT=]FUNC[@SRC][+OFF|%return|:RL|;PT]|SRC:AL|SRC;PT"
156 " [[NAME=]ARG ...]",
164#else 157#else
165 "[EVENT=]FUNC[+OFFS|%return|:RLN][@SRC]|SRC:ALN [ARG ...]", 158 "[EVENT=]FUNC[+OFF|%return] [[NAME=]ARG ...]",
166#endif 159#endif
167 "probe point definition, where\n" 160 "probe point definition, where\n"
168 "\t\tGROUP:\tGroup name (optional)\n" 161 "\t\tGROUP:\tGroup name (optional)\n"
169 "\t\tEVENT:\tEvent name\n" 162 "\t\tEVENT:\tEvent name\n"
170 "\t\tFUNC:\tFunction name\n" 163 "\t\tFUNC:\tFunction name\n"
171 "\t\tOFFS:\tOffset from function entry (in byte)\n" 164 "\t\tOFF:\tOffset from function entry (in byte)\n"
172 "\t\t%return:\tPut the probe at function return\n" 165 "\t\t%return:\tPut the probe at function return\n"
173#ifdef NO_LIBDWARF 166#ifdef DWARF_SUPPORT
174 "\t\tARG:\tProbe argument (only \n"
175#else
176 "\t\tSRC:\tSource code path\n" 167 "\t\tSRC:\tSource code path\n"
177 "\t\tRLN:\tRelative line number from function entry.\n" 168 "\t\tRL:\tRelative line number from function entry.\n"
178 "\t\tALN:\tAbsolute line number in file.\n" 169 "\t\tAL:\tAbsolute line number in file.\n"
170 "\t\tPT:\tLazy expression of line code.\n"
179 "\t\tARG:\tProbe argument (local variable name or\n" 171 "\t\tARG:\tProbe argument (local variable name or\n"
180#endif
181 "\t\t\tkprobe-tracer argument format.)\n", 172 "\t\t\tkprobe-tracer argument format.)\n",
173#else
174 "\t\tARG:\tProbe argument (kprobe-tracer argument format.)\n",
175#endif
182 opt_add_probe_event), 176 opt_add_probe_event),
183 OPT_BOOLEAN('f', "force", &session.force_add, "forcibly add events" 177 OPT_BOOLEAN('f', "force", &params.force_add, "forcibly add events"
184 " with existing name"), 178 " with existing name"),
179#ifdef DWARF_SUPPORT
180 OPT_CALLBACK('L', "line", NULL,
181 "FUNC[:RLN[+NUM|-RLN2]]|SRC:ALN[+NUM|-ALN2]",
182 "Show source code lines.", opt_show_lines),
183 OPT_STRING('k', "vmlinux", &symbol_conf.vmlinux_name,
184 "file", "vmlinux pathname"),
185#endif
186 OPT__DRY_RUN(&probe_event_dry_run),
187 OPT_INTEGER('\0', "max-probes", &params.max_probe_points,
188 "Set how many probe points can be found for a probe."),
185 OPT_END() 189 OPT_END()
186}; 190};
187 191
188int cmd_probe(int argc, const char **argv, const char *prefix __used) 192int cmd_probe(int argc, const char **argv, const char *prefix __used)
189{ 193{
190 int i, ret; 194 int ret;
191#ifndef NO_LIBDWARF
192 int fd;
193#endif
194 struct probe_point *pp;
195 195
196 argc = parse_options(argc, argv, options, probe_usage, 196 argc = parse_options(argc, argv, options, probe_usage,
197 PARSE_OPT_STOP_AT_NON_OPTION); 197 PARSE_OPT_STOP_AT_NON_OPTION);
@@ -200,110 +200,69 @@ int cmd_probe(int argc, const char **argv, const char *prefix __used)
200 pr_warning(" Error: '-' is not supported.\n"); 200 pr_warning(" Error: '-' is not supported.\n");
201 usage_with_options(probe_usage, options); 201 usage_with_options(probe_usage, options);
202 } 202 }
203 parse_probe_event_argv(argc, argv); 203 ret = parse_probe_event_argv(argc, argv);
204 if (ret < 0) {
205 pr_err(" Error: Parse Error. (%d)\n", ret);
206 return ret;
207 }
204 } 208 }
205 209
206 if ((!session.nr_probe && !session.dellist && !session.list_events)) 210 if (params.max_probe_points == 0)
207 usage_with_options(probe_usage, options); 211 params.max_probe_points = MAX_PROBES;
208 212
209 if (debugfs_valid_mountpoint(debugfs_path) < 0) 213 if ((!params.nevents && !params.dellist && !params.list_events &&
210 die("Failed to find debugfs path."); 214 !params.show_lines))
215 usage_with_options(probe_usage, options);
211 216
212 if (session.list_events) { 217 if (params.list_events) {
213 if (session.nr_probe != 0 || session.dellist) { 218 if (params.nevents != 0 || params.dellist) {
214 pr_warning(" Error: Don't use --list with" 219 pr_err(" Error: Don't use --list with --add/--del.\n");
215 " --add/--del.\n");
216 usage_with_options(probe_usage, options); 220 usage_with_options(probe_usage, options);
217 } 221 }
218 show_perf_probe_events(); 222 if (params.show_lines) {
219 return 0; 223 pr_err(" Error: Don't use --list with --line.\n");
220 } 224 usage_with_options(probe_usage, options);
221 225 }
222 if (session.dellist) { 226 ret = show_perf_probe_events();
223 del_trace_kprobe_events(session.dellist); 227 if (ret < 0)
224 strlist__delete(session.dellist); 228 pr_err(" Error: Failed to show event list. (%d)\n",
225 if (session.nr_probe == 0) 229 ret);
226 return 0; 230 return ret;
227 } 231 }
228 232
229 /* Initialize symbol maps for vmlinux */ 233#ifdef DWARF_SUPPORT
230 symbol_conf.sort_by_name = true; 234 if (params.show_lines) {
231 if (symbol_conf.vmlinux_name == NULL) 235 if (params.nevents != 0 || params.dellist) {
232 symbol_conf.try_vmlinux_path = true; 236 pr_warning(" Error: Don't use --line with"
233 if (symbol__init() < 0) 237 " --add/--del.\n");
234 die("Failed to init symbol map."); 238 usage_with_options(probe_usage, options);
235 session.psession = perf_session__new(NULL, O_WRONLY, false); 239 }
236 if (session.psession == NULL)
237 die("Failed to init perf_session.");
238 session.kmap = map_groups__find_by_name(&session.psession->kmaps,
239 MAP__FUNCTION,
240 "[kernel.kallsyms]");
241 if (!session.kmap)
242 die("Could not find kernel map.\n");
243
244 if (session.need_dwarf)
245#ifdef NO_LIBDWARF
246 die("Debuginfo-analysis is not supported");
247#else /* !NO_LIBDWARF */
248 pr_debug("Some probes require debuginfo.\n");
249
250 fd = open_vmlinux();
251 if (fd < 0) {
252 if (session.need_dwarf)
253 die("Could not open debuginfo file.");
254 240
255 pr_debug("Could not open vmlinux/module file." 241 ret = show_line_range(&params.line_range);
256 " Try to use symbols.\n"); 242 if (ret < 0)
257 goto end_dwarf; 243 pr_err(" Error: Failed to show lines. (%d)\n", ret);
244 return ret;
258 } 245 }
246#endif
259 247
260 /* Searching probe points */ 248 if (params.dellist) {
261 for (i = 0; i < session.nr_probe; i++) { 249 ret = del_perf_probe_events(params.dellist);
262 pp = &session.probes[i]; 250 strlist__delete(params.dellist);
263 if (pp->found) 251 if (ret < 0) {
264 continue; 252 pr_err(" Error: Failed to delete events. (%d)\n", ret);
265 253 return ret;
266 lseek(fd, SEEK_SET, 0);
267 ret = find_probepoint(fd, pp);
268 if (ret > 0)
269 continue;
270 if (ret == 0) { /* No error but failed to find probe point. */
271 synthesize_perf_probe_point(pp);
272 die("Probe point '%s' not found. - probe not added.",
273 pp->probes[0]);
274 } 254 }
275 /* Error path */
276 if (session.need_dwarf) {
277 if (ret == -ENOENT)
278 pr_warning("No dwarf info found in the vmlinux - please rebuild with CONFIG_DEBUG_INFO=y.\n");
279 die("Could not analyze debuginfo.");
280 }
281 pr_debug("An error occurred in debuginfo analysis."
282 " Try to use symbols.\n");
283 break;
284 } 255 }
285 close(fd);
286
287end_dwarf:
288#endif /* !NO_LIBDWARF */
289
290 /* Synthesize probes without dwarf */
291 for (i = 0; i < session.nr_probe; i++) {
292 pp = &session.probes[i];
293 if (pp->found) /* This probe is already found. */
294 continue;
295 256
296 evaluate_probe_point(pp); 257 if (params.nevents) {
297 ret = synthesize_trace_kprobe_event(pp); 258 ret = add_perf_probe_events(params.events, params.nevents,
298 if (ret == -E2BIG) 259 params.force_add,
299 die("probe point definition becomes too long."); 260 params.max_probe_points);
300 else if (ret < 0) 261 if (ret < 0) {
301 die("Failed to synthesize a probe point."); 262 pr_err(" Error: Failed to add events. (%d)\n", ret);
263 return ret;
264 }
302 } 265 }
303
304 /* Settng up probe points */
305 add_trace_kprobe_events(session.probes, session.nr_probe,
306 session.force_add);
307 return 0; 266 return 0;
308} 267}
309 268
diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c
index 265425322734..711745f56bba 100644
--- a/tools/perf/builtin-record.c
+++ b/tools/perf/builtin-record.c
@@ -5,63 +5,73 @@
5 * (or a CPU, or a PID) into the perf.data output file - for 5 * (or a CPU, or a PID) into the perf.data output file - for
6 * later analysis via perf report. 6 * later analysis via perf report.
7 */ 7 */
8#define _FILE_OFFSET_BITS 64
9
8#include "builtin.h" 10#include "builtin.h"
9 11
10#include "perf.h" 12#include "perf.h"
11 13
14#include "util/build-id.h"
12#include "util/util.h" 15#include "util/util.h"
13#include "util/parse-options.h" 16#include "util/parse-options.h"
14#include "util/parse-events.h" 17#include "util/parse-events.h"
15#include "util/string.h"
16 18
17#include "util/header.h" 19#include "util/header.h"
18#include "util/event.h" 20#include "util/event.h"
19#include "util/debug.h" 21#include "util/debug.h"
20#include "util/session.h" 22#include "util/session.h"
21#include "util/symbol.h" 23#include "util/symbol.h"
24#include "util/cpumap.h"
22 25
23#include <unistd.h> 26#include <unistd.h>
24#include <sched.h> 27#include <sched.h>
28#include <sys/mman.h>
29
30enum write_mode_t {
31 WRITE_FORCE,
32 WRITE_APPEND
33};
25 34
26static int fd[MAX_NR_CPUS][MAX_COUNTERS]; 35static int *fd[MAX_NR_CPUS][MAX_COUNTERS];
27 36
28static long default_interval = 0; 37static u64 user_interval = ULLONG_MAX;
38static u64 default_interval = 0;
29 39
30static int nr_cpus = 0; 40static int nr_cpus = 0;
31static unsigned int page_size; 41static unsigned int page_size;
32static unsigned int mmap_pages = 128; 42static unsigned int mmap_pages = 128;
43static unsigned int user_freq = UINT_MAX;
33static int freq = 1000; 44static int freq = 1000;
34static int output; 45static int output;
46static int pipe_output = 0;
35static const char *output_name = "perf.data"; 47static const char *output_name = "perf.data";
36static int group = 0; 48static int group = 0;
37static unsigned int realtime_prio = 0; 49static int realtime_prio = 0;
38static int raw_samples = 0; 50static bool raw_samples = false;
39static int system_wide = 0; 51static bool system_wide = false;
40static int profile_cpu = -1; 52static int profile_cpu = -1;
41static pid_t target_pid = -1; 53static pid_t target_pid = -1;
54static pid_t target_tid = -1;
55static pid_t *all_tids = NULL;
56static int thread_num = 0;
42static pid_t child_pid = -1; 57static pid_t child_pid = -1;
43static int inherit = 1; 58static bool no_inherit = false;
44static int force = 0; 59static enum write_mode_t write_mode = WRITE_FORCE;
45static int append_file = 0; 60static bool call_graph = false;
46static int call_graph = 0; 61static bool inherit_stat = false;
47static int inherit_stat = 0; 62static bool no_samples = false;
48static int no_samples = 0; 63static bool sample_address = false;
49static int sample_address = 0;
50static int multiplex = 0;
51static int multiplex_fd = -1;
52 64
53static long samples = 0; 65static long samples = 0;
54static struct timeval last_read;
55static struct timeval this_read;
56
57static u64 bytes_written = 0; 66static u64 bytes_written = 0;
58 67
59static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; 68static struct pollfd *event_array;
60 69
61static int nr_poll = 0; 70static int nr_poll = 0;
62static int nr_cpu = 0; 71static int nr_cpu = 0;
63 72
64static int file_new = 1; 73static int file_new = 1;
74static off_t post_processing_offset;
65 75
66static struct perf_session *session; 76static struct perf_session *session;
67 77
@@ -72,7 +82,7 @@ struct mmap_data {
72 unsigned int prev; 82 unsigned int prev;
73}; 83};
74 84
75static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; 85static struct mmap_data mmap_array[MAX_NR_CPUS];
76 86
77static unsigned long mmap_read_head(struct mmap_data *md) 87static unsigned long mmap_read_head(struct mmap_data *md)
78{ 88{
@@ -96,6 +106,11 @@ static void mmap_write_tail(struct mmap_data *md, unsigned long tail)
96 pc->data_tail = tail; 106 pc->data_tail = tail;
97} 107}
98 108
109static void advance_output(size_t size)
110{
111 bytes_written += size;
112}
113
99static void write_output(void *buf, size_t size) 114static void write_output(void *buf, size_t size)
100{ 115{
101 while (size) { 116 while (size) {
@@ -111,22 +126,10 @@ static void write_output(void *buf, size_t size)
111 } 126 }
112} 127}
113 128
114static void write_event(event_t *buf, size_t size)
115{
116 /*
117 * Add it to the list of DSOs, so that when we finish this
118 * record session we can pick the available build-ids.
119 */
120 if (buf->header.type == PERF_RECORD_MMAP)
121 dsos__findnew(buf->mmap.filename);
122
123 write_output(buf, size);
124}
125
126static int process_synthesized_event(event_t *event, 129static int process_synthesized_event(event_t *event,
127 struct perf_session *self __used) 130 struct perf_session *self __used)
128{ 131{
129 write_event(event, event->header.size); 132 write_output(event, event->header.size);
130 return 0; 133 return 0;
131} 134}
132 135
@@ -139,8 +142,6 @@ static void mmap_read(struct mmap_data *md)
139 void *buf; 142 void *buf;
140 int diff; 143 int diff;
141 144
142 gettimeofday(&this_read, NULL);
143
144 /* 145 /*
145 * If we're further behind than half the buffer, there's a chance 146 * If we're further behind than half the buffer, there's a chance
146 * the writer will bite our tail and mess up the samples under us. 147 * the writer will bite our tail and mess up the samples under us.
@@ -151,23 +152,13 @@ static void mmap_read(struct mmap_data *md)
151 */ 152 */
152 diff = head - old; 153 diff = head - old;
153 if (diff < 0) { 154 if (diff < 0) {
154 struct timeval iv; 155 fprintf(stderr, "WARNING: failed to keep up with mmap data\n");
155 unsigned long msecs;
156
157 timersub(&this_read, &last_read, &iv);
158 msecs = iv.tv_sec*1000 + iv.tv_usec/1000;
159
160 fprintf(stderr, "WARNING: failed to keep up with mmap data."
161 " Last read %lu msecs ago.\n", msecs);
162
163 /* 156 /*
164 * head points to a known good entry, start there. 157 * head points to a known good entry, start there.
165 */ 158 */
166 old = head; 159 old = head;
167 } 160 }
168 161
169 last_read = this_read;
170
171 if (old != head) 162 if (old != head)
172 samples++; 163 samples++;
173 164
@@ -178,14 +169,14 @@ static void mmap_read(struct mmap_data *md)
178 size = md->mask + 1 - (old & md->mask); 169 size = md->mask + 1 - (old & md->mask);
179 old += size; 170 old += size;
180 171
181 write_event(buf, size); 172 write_output(buf, size);
182 } 173 }
183 174
184 buf = &data[old & md->mask]; 175 buf = &data[old & md->mask];
185 size = head - old; 176 size = head - old;
186 old += size; 177 old += size;
187 178
188 write_event(buf, size); 179 write_output(buf, size);
189 180
190 md->prev = old; 181 md->prev = old;
191 mmap_write_tail(md, old); 182 mmap_write_tail(md, old);
@@ -202,7 +193,7 @@ static void sig_handler(int sig)
202 193
203static void sig_atexit(void) 194static void sig_atexit(void)
204{ 195{
205 if (child_pid != -1) 196 if (child_pid > 0)
206 kill(child_pid, SIGTERM); 197 kill(child_pid, SIGTERM);
207 198
208 if (signr == -1) 199 if (signr == -1)
@@ -232,12 +223,13 @@ static struct perf_header_attr *get_header_attr(struct perf_event_attr *a, int n
232 return h_attr; 223 return h_attr;
233} 224}
234 225
235static void create_counter(int counter, int cpu, pid_t pid) 226static void create_counter(int counter, int cpu)
236{ 227{
237 char *filter = filters[counter]; 228 char *filter = filters[counter];
238 struct perf_event_attr *attr = attrs + counter; 229 struct perf_event_attr *attr = attrs + counter;
239 struct perf_header_attr *h_attr; 230 struct perf_header_attr *h_attr;
240 int track = !counter; /* only the first counter needs these */ 231 int track = !counter; /* only the first counter needs these */
232 int thread_index;
241 int ret; 233 int ret;
242 struct { 234 struct {
243 u64 count; 235 u64 count;
@@ -252,10 +244,22 @@ static void create_counter(int counter, int cpu, pid_t pid)
252 244
253 attr->sample_type |= PERF_SAMPLE_IP | PERF_SAMPLE_TID; 245 attr->sample_type |= PERF_SAMPLE_IP | PERF_SAMPLE_TID;
254 246
255 if (freq) { 247 if (nr_counters > 1)
256 attr->sample_type |= PERF_SAMPLE_PERIOD; 248 attr->sample_type |= PERF_SAMPLE_ID;
257 attr->freq = 1; 249
258 attr->sample_freq = freq; 250 /*
251 * We default some events to a 1 default interval. But keep
252 * it a weak assumption overridable by the user.
253 */
254 if (!attr->sample_period || (user_freq != UINT_MAX &&
255 user_interval != ULLONG_MAX)) {
256 if (freq) {
257 attr->sample_type |= PERF_SAMPLE_PERIOD;
258 attr->freq = 1;
259 attr->sample_freq = freq;
260 } else {
261 attr->sample_period = default_interval;
262 }
259 } 263 }
260 264
261 if (no_samples) 265 if (no_samples)
@@ -278,146 +282,236 @@ static void create_counter(int counter, int cpu, pid_t pid)
278 282
279 attr->mmap = track; 283 attr->mmap = track;
280 attr->comm = track; 284 attr->comm = track;
281 attr->inherit = inherit; 285 attr->inherit = !no_inherit;
282 attr->disabled = 1; 286 if (target_pid == -1 && target_tid == -1 && !system_wide) {
287 attr->disabled = 1;
288 attr->enable_on_exec = 1;
289 }
283 290
291 for (thread_index = 0; thread_index < thread_num; thread_index++) {
284try_again: 292try_again:
285 fd[nr_cpu][counter] = sys_perf_event_open(attr, pid, cpu, group_fd, 0); 293 fd[nr_cpu][counter][thread_index] = sys_perf_event_open(attr,
286 294 all_tids[thread_index], cpu, group_fd, 0);
287 if (fd[nr_cpu][counter] < 0) { 295
288 int err = errno; 296 if (fd[nr_cpu][counter][thread_index] < 0) {
289 297 int err = errno;
290 if (err == EPERM || err == EACCES) 298
291 die("Permission error - are you root?\n"); 299 if (err == EPERM || err == EACCES)
292 else if (err == ENODEV && profile_cpu != -1) 300 die("Permission error - are you root?\n"
293 die("No such device - did you specify an out-of-range profile CPU?\n"); 301 "\t Consider tweaking"
302 " /proc/sys/kernel/perf_event_paranoid.\n");
303 else if (err == ENODEV && profile_cpu != -1) {
304 die("No such device - did you specify"
305 " an out-of-range profile CPU?\n");
306 }
294 307
295 /* 308 /*
296 * If it's cycles then fall back to hrtimer 309 * If it's cycles then fall back to hrtimer
297 * based cpu-clock-tick sw counter, which 310 * based cpu-clock-tick sw counter, which
298 * is always available even if no PMU support: 311 * is always available even if no PMU support:
299 */ 312 */
300 if (attr->type == PERF_TYPE_HARDWARE 313 if (attr->type == PERF_TYPE_HARDWARE
301 && attr->config == PERF_COUNT_HW_CPU_CYCLES) { 314 && attr->config == PERF_COUNT_HW_CPU_CYCLES) {
302 315
303 if (verbose) 316 if (verbose)
304 warning(" ... trying to fall back to cpu-clock-ticks\n"); 317 warning(" ... trying to fall back to cpu-clock-ticks\n");
305 attr->type = PERF_TYPE_SOFTWARE; 318 attr->type = PERF_TYPE_SOFTWARE;
306 attr->config = PERF_COUNT_SW_CPU_CLOCK; 319 attr->config = PERF_COUNT_SW_CPU_CLOCK;
307 goto try_again; 320 goto try_again;
308 } 321 }
309 printf("\n"); 322 printf("\n");
310 error("perfcounter syscall returned with %d (%s)\n", 323 error("perfcounter syscall returned with %d (%s)\n",
311 fd[nr_cpu][counter], strerror(err)); 324 fd[nr_cpu][counter][thread_index], strerror(err));
312 325
313#if defined(__i386__) || defined(__x86_64__) 326#if defined(__i386__) || defined(__x86_64__)
314 if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP) 327 if (attr->type == PERF_TYPE_HARDWARE && err == EOPNOTSUPP)
315 die("No hardware sampling interrupt available. No APIC? If so then you can boot the kernel with the \"lapic\" boot parameter to force-enable it.\n"); 328 die("No hardware sampling interrupt available."
329 " No APIC? If so then you can boot the kernel"
330 " with the \"lapic\" boot parameter to"
331 " force-enable it.\n");
316#endif 332#endif
317 333
318 die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); 334 die("No CONFIG_PERF_EVENTS=y kernel support configured?\n");
319 exit(-1);
320 }
321
322 h_attr = get_header_attr(attr, counter);
323 if (h_attr == NULL)
324 die("nomem\n");
325
326 if (!file_new) {
327 if (memcmp(&h_attr->attr, attr, sizeof(*attr))) {
328 fprintf(stderr, "incompatible append\n");
329 exit(-1); 335 exit(-1);
330 } 336 }
331 }
332 337
333 if (read(fd[nr_cpu][counter], &read_data, sizeof(read_data)) == -1) { 338 h_attr = get_header_attr(attr, counter);
334 perror("Unable to read perf file descriptor\n"); 339 if (h_attr == NULL)
335 exit(-1); 340 die("nomem\n");
336 }
337 341
338 if (perf_header_attr__add_id(h_attr, read_data.id) < 0) { 342 if (!file_new) {
339 pr_warning("Not enough memory to add id\n"); 343 if (memcmp(&h_attr->attr, attr, sizeof(*attr))) {
340 exit(-1); 344 fprintf(stderr, "incompatible append\n");
341 } 345 exit(-1);
346 }
347 }
342 348
343 assert(fd[nr_cpu][counter] >= 0); 349 if (read(fd[nr_cpu][counter][thread_index], &read_data, sizeof(read_data)) == -1) {
344 fcntl(fd[nr_cpu][counter], F_SETFL, O_NONBLOCK); 350 perror("Unable to read perf file descriptor\n");
351 exit(-1);
352 }
345 353
346 /* 354 if (perf_header_attr__add_id(h_attr, read_data.id) < 0) {
347 * First counter acts as the group leader: 355 pr_warning("Not enough memory to add id\n");
348 */ 356 exit(-1);
349 if (group && group_fd == -1) 357 }
350 group_fd = fd[nr_cpu][counter];
351 if (multiplex && multiplex_fd == -1)
352 multiplex_fd = fd[nr_cpu][counter];
353 358
354 if (multiplex && fd[nr_cpu][counter] != multiplex_fd) { 359 assert(fd[nr_cpu][counter][thread_index] >= 0);
360 fcntl(fd[nr_cpu][counter][thread_index], F_SETFL, O_NONBLOCK);
355 361
356 ret = ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_SET_OUTPUT, multiplex_fd); 362 /*
357 assert(ret != -1); 363 * First counter acts as the group leader:
358 } else { 364 */
359 event_array[nr_poll].fd = fd[nr_cpu][counter]; 365 if (group && group_fd == -1)
360 event_array[nr_poll].events = POLLIN; 366 group_fd = fd[nr_cpu][counter][thread_index];
361 nr_poll++; 367
362 368 if (counter || thread_index) {
363 mmap_array[nr_cpu][counter].counter = counter; 369 ret = ioctl(fd[nr_cpu][counter][thread_index],
364 mmap_array[nr_cpu][counter].prev = 0; 370 PERF_EVENT_IOC_SET_OUTPUT,
365 mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1; 371 fd[nr_cpu][0][0]);
366 mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size, 372 if (ret) {
367 PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter], 0); 373 error("failed to set output: %d (%s)\n", errno,
368 if (mmap_array[nr_cpu][counter].base == MAP_FAILED) { 374 strerror(errno));
369 error("failed to mmap with %d (%s)\n", errno, strerror(errno)); 375 exit(-1);
370 exit(-1); 376 }
377 } else {
378 mmap_array[nr_cpu].counter = counter;
379 mmap_array[nr_cpu].prev = 0;
380 mmap_array[nr_cpu].mask = mmap_pages*page_size - 1;
381 mmap_array[nr_cpu].base = mmap(NULL, (mmap_pages+1)*page_size,
382 PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter][thread_index], 0);
383 if (mmap_array[nr_cpu].base == MAP_FAILED) {
384 error("failed to mmap with %d (%s)\n", errno, strerror(errno));
385 exit(-1);
386 }
387
388 event_array[nr_poll].fd = fd[nr_cpu][counter][thread_index];
389 event_array[nr_poll].events = POLLIN;
390 nr_poll++;
371 } 391 }
372 }
373 392
374 if (filter != NULL) { 393 if (filter != NULL) {
375 ret = ioctl(fd[nr_cpu][counter], 394 ret = ioctl(fd[nr_cpu][counter][thread_index],
376 PERF_EVENT_IOC_SET_FILTER, filter); 395 PERF_EVENT_IOC_SET_FILTER, filter);
377 if (ret) { 396 if (ret) {
378 error("failed to set filter with %d (%s)\n", errno, 397 error("failed to set filter with %d (%s)\n", errno,
379 strerror(errno)); 398 strerror(errno));
380 exit(-1); 399 exit(-1);
400 }
381 } 401 }
382 } 402 }
383
384 ioctl(fd[nr_cpu][counter], PERF_EVENT_IOC_ENABLE);
385} 403}
386 404
387static void open_counters(int cpu, pid_t pid) 405static void open_counters(int cpu)
388{ 406{
389 int counter; 407 int counter;
390 408
391 group_fd = -1; 409 group_fd = -1;
392 for (counter = 0; counter < nr_counters; counter++) 410 for (counter = 0; counter < nr_counters; counter++)
393 create_counter(counter, cpu, pid); 411 create_counter(counter, cpu);
394 412
395 nr_cpu++; 413 nr_cpu++;
396} 414}
397 415
416static int process_buildids(void)
417{
418 u64 size = lseek(output, 0, SEEK_CUR);
419
420 if (size == 0)
421 return 0;
422
423 session->fd = output;
424 return __perf_session__process_events(session, post_processing_offset,
425 size - post_processing_offset,
426 size, &build_id__mark_dso_hit_ops);
427}
428
398static void atexit_header(void) 429static void atexit_header(void)
399{ 430{
400 session->header.data_size += bytes_written; 431 if (!pipe_output) {
432 session->header.data_size += bytes_written;
401 433
402 perf_header__write(&session->header, output, true); 434 process_buildids();
435 perf_header__write(&session->header, output, true);
436 }
437}
438
439static void event__synthesize_guest_os(struct machine *machine, void *data)
440{
441 int err;
442 char *guest_kallsyms;
443 char path[PATH_MAX];
444 struct perf_session *psession = data;
445
446 if (machine__is_host(machine))
447 return;
448
449 /*
450 *As for guest kernel when processing subcommand record&report,
451 *we arrange module mmap prior to guest kernel mmap and trigger
452 *a preload dso because default guest module symbols are loaded
453 *from guest kallsyms instead of /lib/modules/XXX/XXX. This
454 *method is used to avoid symbol missing when the first addr is
455 *in module instead of in guest kernel.
456 */
457 err = event__synthesize_modules(process_synthesized_event,
458 psession, machine);
459 if (err < 0)
460 pr_err("Couldn't record guest kernel [%d]'s reference"
461 " relocation symbol.\n", machine->pid);
462
463 if (machine__is_default_guest(machine))
464 guest_kallsyms = (char *) symbol_conf.default_guest_kallsyms;
465 else {
466 sprintf(path, "%s/proc/kallsyms", machine->root_dir);
467 guest_kallsyms = path;
468 }
469
470 /*
471 * We use _stext for guest kernel because guest kernel's /proc/kallsyms
472 * have no _text sometimes.
473 */
474 err = event__synthesize_kernel_mmap(process_synthesized_event,
475 psession, machine, "_text");
476 if (err < 0)
477 err = event__synthesize_kernel_mmap(process_synthesized_event,
478 psession, machine, "_stext");
479 if (err < 0)
480 pr_err("Couldn't record guest kernel [%d]'s reference"
481 " relocation symbol.\n", machine->pid);
482}
483
484static struct perf_event_header finished_round_event = {
485 .size = sizeof(struct perf_event_header),
486 .type = PERF_RECORD_FINISHED_ROUND,
487};
488
489static void mmap_read_all(void)
490{
491 int i;
492
493 for (i = 0; i < nr_cpu; i++) {
494 if (mmap_array[i].base)
495 mmap_read(&mmap_array[i]);
496 }
497
498 if (perf_header__has_feat(&session->header, HEADER_TRACE_INFO))
499 write_output(&finished_round_event, sizeof(finished_round_event));
403} 500}
404 501
405static int __cmd_record(int argc, const char **argv) 502static int __cmd_record(int argc, const char **argv)
406{ 503{
407 int i, counter; 504 int i, counter;
408 struct stat st; 505 struct stat st;
409 pid_t pid = 0;
410 int flags; 506 int flags;
411 int err; 507 int err;
412 unsigned long waking = 0; 508 unsigned long waking = 0;
413 int child_ready_pipe[2], go_pipe[2]; 509 int child_ready_pipe[2], go_pipe[2];
414 const bool forks = target_pid == -1 && argc > 0; 510 const bool forks = argc > 0;
415 char buf; 511 char buf;
512 struct machine *machine;
416 513
417 page_size = sysconf(_SC_PAGE_SIZE); 514 page_size = sysconf(_SC_PAGE_SIZE);
418 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
419 assert(nr_cpus <= MAX_NR_CPUS);
420 assert(nr_cpus >= 0);
421 515
422 atexit(sig_atexit); 516 atexit(sig_atexit);
423 signal(SIGCHLD, sig_handler); 517 signal(SIGCHLD, sig_handler);
@@ -428,70 +522,63 @@ static int __cmd_record(int argc, const char **argv)
428 exit(-1); 522 exit(-1);
429 } 523 }
430 524
431 if (!stat(output_name, &st) && st.st_size) { 525 if (!strcmp(output_name, "-"))
432 if (!force) { 526 pipe_output = 1;
433 if (!append_file) { 527 else if (!stat(output_name, &st) && st.st_size) {
434 pr_err("Error, output file %s exists, use -A " 528 if (write_mode == WRITE_FORCE) {
435 "to append or -f to overwrite.\n",
436 output_name);
437 exit(-1);
438 }
439 } else {
440 char oldname[PATH_MAX]; 529 char oldname[PATH_MAX];
441 snprintf(oldname, sizeof(oldname), "%s.old", 530 snprintf(oldname, sizeof(oldname), "%s.old",
442 output_name); 531 output_name);
443 unlink(oldname); 532 unlink(oldname);
444 rename(output_name, oldname); 533 rename(output_name, oldname);
445 } 534 }
446 } else { 535 } else if (write_mode == WRITE_APPEND) {
447 append_file = 0; 536 write_mode = WRITE_FORCE;
448 } 537 }
449 538
450 flags = O_CREAT|O_RDWR; 539 flags = O_CREAT|O_RDWR;
451 if (append_file) 540 if (write_mode == WRITE_APPEND)
452 file_new = 0; 541 file_new = 0;
453 else 542 else
454 flags |= O_TRUNC; 543 flags |= O_TRUNC;
455 544
456 output = open(output_name, flags, S_IRUSR|S_IWUSR); 545 if (pipe_output)
546 output = STDOUT_FILENO;
547 else
548 output = open(output_name, flags, S_IRUSR | S_IWUSR);
457 if (output < 0) { 549 if (output < 0) {
458 perror("failed to create output file"); 550 perror("failed to create output file");
459 exit(-1); 551 exit(-1);
460 } 552 }
461 553
462 session = perf_session__new(output_name, O_WRONLY, force); 554 session = perf_session__new(output_name, O_WRONLY,
555 write_mode == WRITE_FORCE, false);
463 if (session == NULL) { 556 if (session == NULL) {
464 pr_err("Not enough memory for reading perf file header\n"); 557 pr_err("Not enough memory for reading perf file header\n");
465 return -1; 558 return -1;
466 } 559 }
467 560
468 if (!file_new) { 561 if (!file_new) {
469 err = perf_header__read(&session->header, output); 562 err = perf_header__read(session, output);
470 if (err < 0) 563 if (err < 0)
471 return err; 564 return err;
472 } 565 }
473 566
474 if (raw_samples) { 567 if (have_tracepoints(attrs, nr_counters))
475 perf_header__set_feat(&session->header, HEADER_TRACE_INFO); 568 perf_header__set_feat(&session->header, HEADER_TRACE_INFO);
476 } else {
477 for (i = 0; i < nr_counters; i++) {
478 if (attrs[i].sample_type & PERF_SAMPLE_RAW) {
479 perf_header__set_feat(&session->header, HEADER_TRACE_INFO);
480 break;
481 }
482 }
483 }
484 569
485 atexit(atexit_header); 570 atexit(atexit_header);
486 571
487 if (forks) { 572 if (forks) {
488 pid = fork(); 573 child_pid = fork();
489 if (pid < 0) { 574 if (child_pid < 0) {
490 perror("failed to fork"); 575 perror("failed to fork");
491 exit(-1); 576 exit(-1);
492 } 577 }
493 578
494 if (!pid) { 579 if (!child_pid) {
580 if (pipe_output)
581 dup2(2, 1);
495 close(child_ready_pipe[0]); 582 close(child_ready_pipe[0]);
496 close(go_pipe[1]); 583 close(go_pipe[1]);
497 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); 584 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
@@ -520,10 +607,8 @@ static int __cmd_record(int argc, const char **argv)
520 exit(-1); 607 exit(-1);
521 } 608 }
522 609
523 child_pid = pid; 610 if (!system_wide && target_tid == -1 && target_pid == -1)
524 611 all_tids[0] = child_pid;
525 if (!system_wide)
526 target_pid = pid;
527 612
528 close(child_ready_pipe[1]); 613 close(child_ready_pipe[1]);
529 close(go_pipe[0]); 614 close(go_pipe[0]);
@@ -537,22 +622,90 @@ static int __cmd_record(int argc, const char **argv)
537 close(child_ready_pipe[0]); 622 close(child_ready_pipe[0]);
538 } 623 }
539 624
540 625 if ((!system_wide && no_inherit) || profile_cpu != -1) {
541 if ((!system_wide && !inherit) || profile_cpu != -1) { 626 open_counters(profile_cpu);
542 open_counters(profile_cpu, target_pid);
543 } else { 627 } else {
628 nr_cpus = read_cpu_map();
544 for (i = 0; i < nr_cpus; i++) 629 for (i = 0; i < nr_cpus; i++)
545 open_counters(i, target_pid); 630 open_counters(cpumap[i]);
546 } 631 }
547 632
548 if (file_new) { 633 if (pipe_output) {
634 err = perf_header__write_pipe(output);
635 if (err < 0)
636 return err;
637 } else if (file_new) {
549 err = perf_header__write(&session->header, output, false); 638 err = perf_header__write(&session->header, output, false);
550 if (err < 0) 639 if (err < 0)
551 return err; 640 return err;
552 } 641 }
553 642
643 post_processing_offset = lseek(output, 0, SEEK_CUR);
644
645 if (pipe_output) {
646 err = event__synthesize_attrs(&session->header,
647 process_synthesized_event,
648 session);
649 if (err < 0) {
650 pr_err("Couldn't synthesize attrs.\n");
651 return err;
652 }
653
654 err = event__synthesize_event_types(process_synthesized_event,
655 session);
656 if (err < 0) {
657 pr_err("Couldn't synthesize event_types.\n");
658 return err;
659 }
660
661 if (have_tracepoints(attrs, nr_counters)) {
662 /*
663 * FIXME err <= 0 here actually means that
664 * there were no tracepoints so its not really
665 * an error, just that we don't need to
666 * synthesize anything. We really have to
667 * return this more properly and also
668 * propagate errors that now are calling die()
669 */
670 err = event__synthesize_tracing_data(output, attrs,
671 nr_counters,
672 process_synthesized_event,
673 session);
674 if (err <= 0) {
675 pr_err("Couldn't record tracing data.\n");
676 return err;
677 }
678 advance_output(err);
679 }
680 }
681
682 machine = perf_session__find_host_machine(session);
683 if (!machine) {
684 pr_err("Couldn't find native kernel information.\n");
685 return -1;
686 }
687
688 err = event__synthesize_kernel_mmap(process_synthesized_event,
689 session, machine, "_text");
690 if (err < 0)
691 err = event__synthesize_kernel_mmap(process_synthesized_event,
692 session, machine, "_stext");
693 if (err < 0) {
694 pr_err("Couldn't record kernel reference relocation symbol.\n");
695 return err;
696 }
697
698 err = event__synthesize_modules(process_synthesized_event,
699 session, machine);
700 if (err < 0) {
701 pr_err("Couldn't record kernel reference relocation symbol.\n");
702 return err;
703 }
704 if (perf_guest)
705 perf_session__process_machines(session, event__synthesize_guest_os);
706
554 if (!system_wide && profile_cpu == -1) 707 if (!system_wide && profile_cpu == -1)
555 event__synthesize_thread(pid, process_synthesized_event, 708 event__synthesize_thread(target_tid, process_synthesized_event,
556 session); 709 session);
557 else 710 else
558 event__synthesize_threads(process_synthesized_event, session); 711 event__synthesize_threads(process_synthesized_event, session);
@@ -575,13 +728,9 @@ static int __cmd_record(int argc, const char **argv)
575 728
576 for (;;) { 729 for (;;) {
577 int hits = samples; 730 int hits = samples;
731 int thread;
578 732
579 for (i = 0; i < nr_cpu; i++) { 733 mmap_read_all();
580 for (counter = 0; counter < nr_counters; counter++) {
581 if (mmap_array[i][counter].base)
582 mmap_read(&mmap_array[i][counter]);
583 }
584 }
585 734
586 if (hits == samples) { 735 if (hits == samples) {
587 if (done) 736 if (done)
@@ -592,8 +741,15 @@ static int __cmd_record(int argc, const char **argv)
592 741
593 if (done) { 742 if (done) {
594 for (i = 0; i < nr_cpu; i++) { 743 for (i = 0; i < nr_cpu; i++) {
595 for (counter = 0; counter < nr_counters; counter++) 744 for (counter = 0;
596 ioctl(fd[i][counter], PERF_EVENT_IOC_DISABLE); 745 counter < nr_counters;
746 counter++) {
747 for (thread = 0;
748 thread < thread_num;
749 thread++)
750 ioctl(fd[i][counter][thread],
751 PERF_EVENT_IOC_DISABLE);
752 }
597 } 753 }
598 } 754 }
599 } 755 }
@@ -618,6 +774,8 @@ static const char * const record_usage[] = {
618 NULL 774 NULL
619}; 775};
620 776
777static bool force, append_file;
778
621static const struct option options[] = { 779static const struct option options[] = {
622 OPT_CALLBACK('e', "event", NULL, "event", 780 OPT_CALLBACK('e', "event", NULL, "event",
623 "event selector. use 'perf list' to list available events", 781 "event selector. use 'perf list' to list available events",
@@ -625,7 +783,9 @@ static const struct option options[] = {
625 OPT_CALLBACK(0, "filter", NULL, "filter", 783 OPT_CALLBACK(0, "filter", NULL, "filter",
626 "event filter", parse_filter), 784 "event filter", parse_filter),
627 OPT_INTEGER('p', "pid", &target_pid, 785 OPT_INTEGER('p', "pid", &target_pid,
628 "record events on existing pid"), 786 "record events on existing process id"),
787 OPT_INTEGER('t', "tid", &target_tid,
788 "record events on existing thread id"),
629 OPT_INTEGER('r', "realtime", &realtime_prio, 789 OPT_INTEGER('r', "realtime", &realtime_prio,
630 "collect data with this RT SCHED_FIFO priority"), 790 "collect data with this RT SCHED_FIFO priority"),
631 OPT_BOOLEAN('R', "raw-samples", &raw_samples, 791 OPT_BOOLEAN('R', "raw-samples", &raw_samples,
@@ -637,20 +797,17 @@ static const struct option options[] = {
637 OPT_INTEGER('C', "profile_cpu", &profile_cpu, 797 OPT_INTEGER('C', "profile_cpu", &profile_cpu,
638 "CPU to profile on"), 798 "CPU to profile on"),
639 OPT_BOOLEAN('f', "force", &force, 799 OPT_BOOLEAN('f', "force", &force,
640 "overwrite existing data file"), 800 "overwrite existing data file (deprecated)"),
641 OPT_LONG('c', "count", &default_interval, 801 OPT_U64('c', "count", &user_interval, "event period to sample"),
642 "event period to sample"),
643 OPT_STRING('o', "output", &output_name, "file", 802 OPT_STRING('o', "output", &output_name, "file",
644 "output file name"), 803 "output file name"),
645 OPT_BOOLEAN('i', "inherit", &inherit, 804 OPT_BOOLEAN('i', "no-inherit", &no_inherit,
646 "child tasks inherit counters"), 805 "child tasks do not inherit counters"),
647 OPT_INTEGER('F', "freq", &freq, 806 OPT_UINTEGER('F', "freq", &user_freq, "profile at this frequency"),
648 "profile at this frequency"), 807 OPT_UINTEGER('m', "mmap-pages", &mmap_pages, "number of mmap data pages"),
649 OPT_INTEGER('m', "mmap-pages", &mmap_pages,
650 "number of mmap data pages"),
651 OPT_BOOLEAN('g', "call-graph", &call_graph, 808 OPT_BOOLEAN('g', "call-graph", &call_graph,
652 "do call-graph (stack chain/backtrace) recording"), 809 "do call-graph (stack chain/backtrace) recording"),
653 OPT_BOOLEAN('v', "verbose", &verbose, 810 OPT_INCR('v', "verbose", &verbose,
654 "be more verbose (show counter open errors, etc)"), 811 "be more verbose (show counter open errors, etc)"),
655 OPT_BOOLEAN('s', "stat", &inherit_stat, 812 OPT_BOOLEAN('s', "stat", &inherit_stat,
656 "per thread counts"), 813 "per thread counts"),
@@ -658,20 +815,29 @@ static const struct option options[] = {
658 "Sample addresses"), 815 "Sample addresses"),
659 OPT_BOOLEAN('n', "no-samples", &no_samples, 816 OPT_BOOLEAN('n', "no-samples", &no_samples,
660 "don't sample"), 817 "don't sample"),
661 OPT_BOOLEAN('M', "multiplex", &multiplex,
662 "multiplex counter output in a single channel"),
663 OPT_END() 818 OPT_END()
664}; 819};
665 820
666int cmd_record(int argc, const char **argv, const char *prefix __used) 821int cmd_record(int argc, const char **argv, const char *prefix __used)
667{ 822{
668 int counter; 823 int i,j;
669 824
670 argc = parse_options(argc, argv, options, record_usage, 825 argc = parse_options(argc, argv, options, record_usage,
671 PARSE_OPT_STOP_AT_NON_OPTION); 826 PARSE_OPT_STOP_AT_NON_OPTION);
672 if (!argc && target_pid == -1 && !system_wide && profile_cpu == -1) 827 if (!argc && target_pid == -1 && target_tid == -1 &&
828 !system_wide && profile_cpu == -1)
673 usage_with_options(record_usage, options); 829 usage_with_options(record_usage, options);
674 830
831 if (force && append_file) {
832 fprintf(stderr, "Can't overwrite and append at the same time."
833 " You need to choose between -f and -A");
834 usage_with_options(record_usage, options);
835 } else if (append_file) {
836 write_mode = WRITE_APPEND;
837 } else {
838 write_mode = WRITE_FORCE;
839 }
840
675 symbol__init(); 841 symbol__init();
676 842
677 if (!nr_counters) { 843 if (!nr_counters) {
@@ -680,6 +846,40 @@ int cmd_record(int argc, const char **argv, const char *prefix __used)
680 attrs[0].config = PERF_COUNT_HW_CPU_CYCLES; 846 attrs[0].config = PERF_COUNT_HW_CPU_CYCLES;
681 } 847 }
682 848
849 if (target_pid != -1) {
850 target_tid = target_pid;
851 thread_num = find_all_tid(target_pid, &all_tids);
852 if (thread_num <= 0) {
853 fprintf(stderr, "Can't find all threads of pid %d\n",
854 target_pid);
855 usage_with_options(record_usage, options);
856 }
857 } else {
858 all_tids=malloc(sizeof(pid_t));
859 if (!all_tids)
860 return -ENOMEM;
861
862 all_tids[0] = target_tid;
863 thread_num = 1;
864 }
865
866 for (i = 0; i < MAX_NR_CPUS; i++) {
867 for (j = 0; j < MAX_COUNTERS; j++) {
868 fd[i][j] = malloc(sizeof(int)*thread_num);
869 if (!fd[i][j])
870 return -ENOMEM;
871 }
872 }
873 event_array = malloc(
874 sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num);
875 if (!event_array)
876 return -ENOMEM;
877
878 if (user_interval != ULLONG_MAX)
879 default_interval = user_interval;
880 if (user_freq != UINT_MAX)
881 freq = user_freq;
882
683 /* 883 /*
684 * User specified count overrides default frequency. 884 * User specified count overrides default frequency.
685 */ 885 */
@@ -692,12 +892,5 @@ int cmd_record(int argc, const char **argv, const char *prefix __used)
692 exit(EXIT_FAILURE); 892 exit(EXIT_FAILURE);
693 } 893 }
694 894
695 for (counter = 0; counter < nr_counters; counter++) {
696 if (attrs[counter].sample_period)
697 continue;
698
699 attrs[counter].sample_period = default_interval;
700 }
701
702 return __cmd_record(argc, argv); 895 return __cmd_record(argc, argv);
703} 896}
diff --git a/tools/perf/builtin-report.c b/tools/perf/builtin-report.c
index 860f1eeeea7d..fd7407c7205c 100644
--- a/tools/perf/builtin-report.c
+++ b/tools/perf/builtin-report.c
@@ -14,7 +14,6 @@
14#include "util/cache.h" 14#include "util/cache.h"
15#include <linux/rbtree.h> 15#include <linux/rbtree.h>
16#include "util/symbol.h" 16#include "util/symbol.h"
17#include "util/string.h"
18#include "util/callchain.h" 17#include "util/callchain.h"
19#include "util/strlist.h" 18#include "util/strlist.h"
20#include "util/values.h" 19#include "util/values.h"
@@ -33,54 +32,120 @@
33 32
34static char const *input_name = "perf.data"; 33static char const *input_name = "perf.data";
35 34
36static int force; 35static bool force;
36static bool hide_unresolved;
37static bool dont_use_callchains;
37 38
38static int show_threads; 39static bool show_threads;
39static struct perf_read_values show_threads_values; 40static struct perf_read_values show_threads_values;
40 41
41static char default_pretty_printing_style[] = "normal"; 42static const char default_pretty_printing_style[] = "normal";
42static char *pretty_printing_style = default_pretty_printing_style; 43static const char *pretty_printing_style = default_pretty_printing_style;
43 44
44static char callchain_default_opt[] = "fractal,0.5"; 45static char callchain_default_opt[] = "fractal,0.5";
45 46
47static struct hists *perf_session__hists_findnew(struct perf_session *self,
48 u64 event_stream, u32 type,
49 u64 config)
50{
51 struct rb_node **p = &self->hists_tree.rb_node;
52 struct rb_node *parent = NULL;
53 struct hists *iter, *new;
54
55 while (*p != NULL) {
56 parent = *p;
57 iter = rb_entry(parent, struct hists, rb_node);
58 if (iter->config == config)
59 return iter;
60
61
62 if (config > iter->config)
63 p = &(*p)->rb_right;
64 else
65 p = &(*p)->rb_left;
66 }
67
68 new = malloc(sizeof(struct hists));
69 if (new == NULL)
70 return NULL;
71 memset(new, 0, sizeof(struct hists));
72 new->event_stream = event_stream;
73 new->config = config;
74 new->type = type;
75 rb_link_node(&new->rb_node, parent, p);
76 rb_insert_color(&new->rb_node, &self->hists_tree);
77 return new;
78}
79
46static int perf_session__add_hist_entry(struct perf_session *self, 80static int perf_session__add_hist_entry(struct perf_session *self,
47 struct addr_location *al, 81 struct addr_location *al,
48 struct ip_callchain *chain, u64 count) 82 struct sample_data *data)
49{ 83{
50 struct symbol **syms = NULL, *parent = NULL; 84 struct map_symbol *syms = NULL;
51 bool hit; 85 struct symbol *parent = NULL;
86 int err = -ENOMEM;
52 struct hist_entry *he; 87 struct hist_entry *he;
88 struct hists *hists;
89 struct perf_event_attr *attr;
53 90
54 if ((sort__has_parent || symbol_conf.use_callchain) && chain) 91 if ((sort__has_parent || symbol_conf.use_callchain) && data->callchain) {
55 syms = perf_session__resolve_callchain(self, al->thread, 92 syms = perf_session__resolve_callchain(self, al->thread,
56 chain, &parent); 93 data->callchain, &parent);
57 he = __perf_session__add_hist_entry(self, al, parent, count, &hit); 94 if (syms == NULL)
58 if (he == NULL) 95 return -ENOMEM;
59 return -ENOMEM; 96 }
60
61 if (hit)
62 he->count += count;
63 97
98 attr = perf_header__find_attr(data->id, &self->header);
99 if (attr)
100 hists = perf_session__hists_findnew(self, data->id, attr->type, attr->config);
101 else
102 hists = perf_session__hists_findnew(self, data->id, 0, 0);
103 if (hists == NULL)
104 goto out_free_syms;
105 he = __hists__add_entry(hists, al, parent, data->period);
106 if (he == NULL)
107 goto out_free_syms;
108 err = 0;
64 if (symbol_conf.use_callchain) { 109 if (symbol_conf.use_callchain) {
65 if (!hit) 110 err = append_chain(he->callchain, data->callchain, syms, data->period);
66 callchain_init(&he->callchain); 111 if (err)
67 append_chain(&he->callchain, chain, syms); 112 goto out_free_syms;
68 free(syms);
69 } 113 }
70 114 /*
71 return 0; 115 * Only in the newt browser we are doing integrated annotation,
116 * so we don't allocated the extra space needed because the stdio
117 * code will not use it.
118 */
119 if (use_browser > 0)
120 err = hist_entry__inc_addr_samples(he, al->addr);
121out_free_syms:
122 free(syms);
123 return err;
72} 124}
73 125
74static int validate_chain(struct ip_callchain *chain, event_t *event) 126static int add_event_total(struct perf_session *session,
127 struct sample_data *data,
128 struct perf_event_attr *attr)
75{ 129{
76 unsigned int chain_size; 130 struct hists *hists;
77 131
78 chain_size = event->header.size; 132 if (attr)
79 chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event; 133 hists = perf_session__hists_findnew(session, data->id,
134 attr->type, attr->config);
135 else
136 hists = perf_session__hists_findnew(session, data->id, 0, 0);
80 137
81 if (chain->nr*sizeof(u64) > chain_size) 138 if (!hists)
82 return -1; 139 return -ENOMEM;
83 140
141 hists->stats.total_period += data->period;
142 /*
143 * FIXME: add_event_total should be moved from here to
144 * perf_session__process_event so that the proper hist is passed to
145 * the event_op methods.
146 */
147 hists__inc_nr_events(hists, PERF_RECORD_SAMPLE);
148 session->hists.stats.total_period += data->period;
84 return 0; 149 return 0;
85} 150}
86 151
@@ -88,21 +153,19 @@ static int process_sample_event(event_t *event, struct perf_session *session)
88{ 153{
89 struct sample_data data = { .period = 1, }; 154 struct sample_data data = { .period = 1, };
90 struct addr_location al; 155 struct addr_location al;
156 struct perf_event_attr *attr;
91 157
92 event__parse_sample(event, session->sample_type, &data); 158 event__parse_sample(event, session->sample_type, &data);
93 159
94 dump_printf("(IP, %d): %d/%d: %p period: %Ld\n", 160 dump_printf("(IP, %d): %d/%d: %#Lx period: %Ld\n", event->header.misc,
95 event->header.misc, 161 data.pid, data.tid, data.ip, data.period);
96 data.pid, data.tid,
97 (void *)(long)data.ip,
98 (long long)data.period);
99 162
100 if (session->sample_type & PERF_SAMPLE_CALLCHAIN) { 163 if (session->sample_type & PERF_SAMPLE_CALLCHAIN) {
101 unsigned int i; 164 unsigned int i;
102 165
103 dump_printf("... chain: nr:%Lu\n", data.callchain->nr); 166 dump_printf("... chain: nr:%Lu\n", data.callchain->nr);
104 167
105 if (validate_chain(data.callchain, event) < 0) { 168 if (!ip_callchain__valid(data.callchain, event)) {
106 pr_debug("call-chain problem with event, " 169 pr_debug("call-chain problem with event, "
107 "skipping it.\n"); 170 "skipping it.\n");
108 return 0; 171 return 0;
@@ -121,15 +184,21 @@ static int process_sample_event(event_t *event, struct perf_session *session)
121 return -1; 184 return -1;
122 } 185 }
123 186
124 if (al.filtered) 187 if (al.filtered || (hide_unresolved && al.sym == NULL))
125 return 0; 188 return 0;
126 189
127 if (perf_session__add_hist_entry(session, &al, data.callchain, data.period)) { 190 if (perf_session__add_hist_entry(session, &al, &data)) {
128 pr_debug("problem incrementing symbol count, skipping event\n"); 191 pr_debug("problem incrementing symbol period, skipping event\n");
192 return -1;
193 }
194
195 attr = perf_header__find_attr(data.id, &session->header);
196
197 if (add_event_total(session, &data, attr)) {
198 pr_debug("problem adding event period\n");
129 return -1; 199 return -1;
130 } 200 }
131 201
132 session->events_stats.total += data.period;
133 return 0; 202 return 0;
134} 203}
135 204
@@ -156,14 +225,14 @@ static int process_read_event(event_t *event, struct perf_session *session __use
156 return 0; 225 return 0;
157} 226}
158 227
159static int sample_type_check(struct perf_session *session) 228static int perf_session__setup_sample_type(struct perf_session *self)
160{ 229{
161 if (!(session->sample_type & PERF_SAMPLE_CALLCHAIN)) { 230 if (!(self->sample_type & PERF_SAMPLE_CALLCHAIN)) {
162 if (sort__has_parent) { 231 if (sort__has_parent) {
163 fprintf(stderr, "selected --sort parent, but no" 232 fprintf(stderr, "selected --sort parent, but no"
164 " callchain data. Did you call" 233 " callchain data. Did you call"
165 " perf record without -g?\n"); 234 " perf record without -g?\n");
166 return -1; 235 return -EINVAL;
167 } 236 }
168 if (symbol_conf.use_callchain) { 237 if (symbol_conf.use_callchain) {
169 fprintf(stderr, "selected -g but no callchain data." 238 fprintf(stderr, "selected -g but no callchain data."
@@ -171,12 +240,13 @@ static int sample_type_check(struct perf_session *session)
171 " -g?\n"); 240 " -g?\n");
172 return -1; 241 return -1;
173 } 242 }
174 } else if (callchain_param.mode != CHAIN_NONE && !symbol_conf.use_callchain) { 243 } else if (!dont_use_callchains && callchain_param.mode != CHAIN_NONE &&
244 !symbol_conf.use_callchain) {
175 symbol_conf.use_callchain = true; 245 symbol_conf.use_callchain = true;
176 if (register_callchain_param(&callchain_param) < 0) { 246 if (register_callchain_param(&callchain_param) < 0) {
177 fprintf(stderr, "Can't register callchain" 247 fprintf(stderr, "Can't register callchain"
178 " params\n"); 248 " params\n");
179 return -1; 249 return -EINVAL;
180 } 250 }
181 } 251 }
182 252
@@ -184,35 +254,98 @@ static int sample_type_check(struct perf_session *session)
184} 254}
185 255
186static struct perf_event_ops event_ops = { 256static struct perf_event_ops event_ops = {
187 .process_sample_event = process_sample_event, 257 .sample = process_sample_event,
188 .process_mmap_event = event__process_mmap, 258 .mmap = event__process_mmap,
189 .process_comm_event = event__process_comm, 259 .comm = event__process_comm,
190 .process_exit_event = event__process_task, 260 .exit = event__process_task,
191 .process_fork_event = event__process_task, 261 .fork = event__process_task,
192 .process_lost_event = event__process_lost, 262 .lost = event__process_lost,
193 .process_read_event = process_read_event, 263 .read = process_read_event,
194 .sample_type_check = sample_type_check, 264 .attr = event__process_attr,
265 .event_type = event__process_event_type,
266 .tracing_data = event__process_tracing_data,
267 .build_id = event__process_build_id,
195}; 268};
196 269
270extern volatile int session_done;
271
272static void sig_handler(int sig __used)
273{
274 session_done = 1;
275}
276
277static size_t hists__fprintf_nr_sample_events(struct hists *self,
278 const char *evname, FILE *fp)
279{
280 size_t ret;
281 char unit;
282 unsigned long nr_events = self->stats.nr_events[PERF_RECORD_SAMPLE];
283
284 nr_events = convert_unit(nr_events, &unit);
285 ret = fprintf(fp, "# Events: %lu%c", nr_events, unit);
286 if (evname != NULL)
287 ret += fprintf(fp, " %s", evname);
288 return ret + fprintf(fp, "\n#\n");
289}
290
291static int hists__tty_browse_tree(struct rb_root *tree, const char *help)
292{
293 struct rb_node *next = rb_first(tree);
294
295 while (next) {
296 struct hists *hists = rb_entry(next, struct hists, rb_node);
297 const char *evname = NULL;
298
299 if (rb_first(&hists->entries) != rb_last(&hists->entries))
300 evname = __event_name(hists->type, hists->config);
301
302 hists__fprintf_nr_sample_events(hists, evname, stdout);
303 hists__fprintf(hists, NULL, false, stdout);
304 fprintf(stdout, "\n\n");
305 next = rb_next(&hists->rb_node);
306 }
307
308 if (sort_order == default_sort_order &&
309 parent_pattern == default_parent_pattern) {
310 fprintf(stdout, "#\n# (%s)\n#\n", help);
311
312 if (show_threads) {
313 bool style = !strcmp(pretty_printing_style, "raw");
314 perf_read_values_display(stdout, &show_threads_values,
315 style);
316 perf_read_values_destroy(&show_threads_values);
317 }
318 }
319
320 return 0;
321}
197 322
198static int __cmd_report(void) 323static int __cmd_report(void)
199{ 324{
200 int ret; 325 int ret = -EINVAL;
201 struct perf_session *session; 326 struct perf_session *session;
327 struct rb_node *next;
328 const char *help = "For a higher level overview, try: perf report --sort comm,dso";
329
330 signal(SIGINT, sig_handler);
202 331
203 session = perf_session__new(input_name, O_RDONLY, force); 332 session = perf_session__new(input_name, O_RDONLY, force, false);
204 if (session == NULL) 333 if (session == NULL)
205 return -ENOMEM; 334 return -ENOMEM;
206 335
207 if (show_threads) 336 if (show_threads)
208 perf_read_values_init(&show_threads_values); 337 perf_read_values_init(&show_threads_values);
209 338
339 ret = perf_session__setup_sample_type(session);
340 if (ret)
341 goto out_delete;
342
210 ret = perf_session__process_events(session, &event_ops); 343 ret = perf_session__process_events(session, &event_ops);
211 if (ret) 344 if (ret)
212 goto out_delete; 345 goto out_delete;
213 346
214 if (dump_trace) { 347 if (dump_trace) {
215 event__print_totals(); 348 perf_session__fprintf_nr_events(session, stdout);
216 goto out_delete; 349 goto out_delete;
217 } 350 }
218 351
@@ -220,22 +353,23 @@ static int __cmd_report(void)
220 perf_session__fprintf(session, stdout); 353 perf_session__fprintf(session, stdout);
221 354
222 if (verbose > 2) 355 if (verbose > 2)
223 dsos__fprintf(stdout); 356 perf_session__fprintf_dsos(session, stdout);
224 357
225 perf_session__collapse_resort(session); 358 next = rb_first(&session->hists_tree);
226 perf_session__output_resort(session, session->events_stats.total); 359 while (next) {
227 fprintf(stdout, "# Samples: %Ld\n#\n", session->events_stats.total); 360 struct hists *hists;
228 perf_session__fprintf_hists(session, NULL, false, stdout);
229 if (sort_order == default_sort_order &&
230 parent_pattern == default_parent_pattern)
231 fprintf(stdout, "#\n# (For a higher level overview, try: perf report --sort comm,dso)\n#\n");
232 361
233 if (show_threads) { 362 hists = rb_entry(next, struct hists, rb_node);
234 bool raw_printing_style = !strcmp(pretty_printing_style, "raw"); 363 hists__collapse_resort(hists);
235 perf_read_values_display(stdout, &show_threads_values, 364 hists__output_resort(hists);
236 raw_printing_style); 365 next = rb_next(&hists->rb_node);
237 perf_read_values_destroy(&show_threads_values);
238 } 366 }
367
368 if (use_browser > 0)
369 hists__tui_browse_tree(&session->hists_tree, help);
370 else
371 hists__tty_browse_tree(&session->hists_tree, help);
372
239out_delete: 373out_delete:
240 perf_session__delete(session); 374 perf_session__delete(session);
241 return ret; 375 return ret;
@@ -243,11 +377,19 @@ out_delete:
243 377
244static int 378static int
245parse_callchain_opt(const struct option *opt __used, const char *arg, 379parse_callchain_opt(const struct option *opt __used, const char *arg,
246 int unset __used) 380 int unset)
247{ 381{
248 char *tok; 382 char *tok, *tok2;
249 char *endptr; 383 char *endptr;
250 384
385 /*
386 * --no-call-graph
387 */
388 if (unset) {
389 dont_use_callchains = true;
390 return 0;
391 }
392
251 symbol_conf.use_callchain = true; 393 symbol_conf.use_callchain = true;
252 394
253 if (!arg) 395 if (!arg)
@@ -282,10 +424,13 @@ parse_callchain_opt(const struct option *opt __used, const char *arg,
282 if (!tok) 424 if (!tok)
283 goto setup; 425 goto setup;
284 426
427 tok2 = strtok(NULL, ",");
285 callchain_param.min_percent = strtod(tok, &endptr); 428 callchain_param.min_percent = strtod(tok, &endptr);
286 if (tok == endptr) 429 if (tok == endptr)
287 return -1; 430 return -1;
288 431
432 if (tok2)
433 callchain_param.print_limit = strtod(tok2, &endptr);
289setup: 434setup:
290 if (register_callchain_param(&callchain_param) < 0) { 435 if (register_callchain_param(&callchain_param) < 0) {
291 fprintf(stderr, "Can't register callchain params\n"); 436 fprintf(stderr, "Can't register callchain params\n");
@@ -302,7 +447,7 @@ static const char * const report_usage[] = {
302static const struct option options[] = { 447static const struct option options[] = {
303 OPT_STRING('i', "input", &input_name, "file", 448 OPT_STRING('i', "input", &input_name, "file",
304 "input file name"), 449 "input file name"),
305 OPT_BOOLEAN('v', "verbose", &verbose, 450 OPT_INCR('v', "verbose", &verbose,
306 "be more verbose (show symbol address, etc)"), 451 "be more verbose (show symbol address, etc)"),
307 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, 452 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
308 "dump raw trace in ASCII"), 453 "dump raw trace in ASCII"),
@@ -319,14 +464,16 @@ static const struct option options[] = {
319 "pretty printing style key: normal raw"), 464 "pretty printing style key: normal raw"),
320 OPT_STRING('s', "sort", &sort_order, "key[,key2...]", 465 OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
321 "sort by key(s): pid, comm, dso, symbol, parent"), 466 "sort by key(s): pid, comm, dso, symbol, parent"),
322 OPT_BOOLEAN('P', "full-paths", &event_ops.full_paths, 467 OPT_BOOLEAN('P', "full-paths", &symbol_conf.full_paths,
323 "Don't shorten the pathnames taking into account the cwd"), 468 "Don't shorten the pathnames taking into account the cwd"),
469 OPT_BOOLEAN(0, "showcpuutilization", &symbol_conf.show_cpu_utilization,
470 "Show sample percentage for different cpu modes"),
324 OPT_STRING('p', "parent", &parent_pattern, "regex", 471 OPT_STRING('p', "parent", &parent_pattern, "regex",
325 "regex filter to identify parent, see: '--sort parent'"), 472 "regex filter to identify parent, see: '--sort parent'"),
326 OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other, 473 OPT_BOOLEAN('x', "exclude-other", &symbol_conf.exclude_other,
327 "Only display entries with parent-match"), 474 "Only display entries with parent-match"),
328 OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent", 475 OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent",
329 "Display callchains using output_type and min percent threshold. " 476 "Display callchains using output_type (graph, flat, fractal, or none) and min percent threshold. "
330 "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt), 477 "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt),
331 OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]", 478 OPT_STRING('d', "dsos", &symbol_conf.dso_list_str, "dso[,dso...]",
332 "only consider symbols in these dsos"), 479 "only consider symbols in these dsos"),
@@ -340,6 +487,8 @@ static const struct option options[] = {
340 OPT_STRING('t', "field-separator", &symbol_conf.field_sep, "separator", 487 OPT_STRING('t', "field-separator", &symbol_conf.field_sep, "separator",
341 "separator for columns, no spaces will be added between " 488 "separator for columns, no spaces will be added between "
342 "columns '.' is reserved."), 489 "columns '.' is reserved."),
490 OPT_BOOLEAN('U', "hide-unresolved", &hide_unresolved,
491 "Only display entries resolved to a symbol"),
343 OPT_END() 492 OPT_END()
344}; 493};
345 494
@@ -347,7 +496,15 @@ int cmd_report(int argc, const char **argv, const char *prefix __used)
347{ 496{
348 argc = parse_options(argc, argv, options, report_usage, 0); 497 argc = parse_options(argc, argv, options, report_usage, 0);
349 498
350 setup_pager(); 499 if (strcmp(input_name, "-") != 0)
500 setup_browser();
501 /*
502 * Only in the newt browser we are doing integrated annotation,
503 * so don't allocate extra space that won't be used in the stdio
504 * implementation.
505 */
506 if (use_browser > 0)
507 symbol_conf.priv_size = sizeof(struct sym_priv);
351 508
352 if (symbol__init() < 0) 509 if (symbol__init() < 0)
353 return -1; 510 return -1;
@@ -355,7 +512,8 @@ int cmd_report(int argc, const char **argv, const char *prefix __used)
355 setup_sorting(report_usage, options); 512 setup_sorting(report_usage, options);
356 513
357 if (parent_pattern != default_parent_pattern) { 514 if (parent_pattern != default_parent_pattern) {
358 sort_dimension__add("parent"); 515 if (sort_dimension__add("parent") < 0)
516 return -1;
359 sort_parent.elide = 1; 517 sort_parent.elide = 1;
360 } else 518 } else
361 symbol_conf.exclude_other = false; 519 symbol_conf.exclude_other = false;
diff --git a/tools/perf/builtin-sched.c b/tools/perf/builtin-sched.c
index 80209df6cfe8..55f3b5dcc731 100644
--- a/tools/perf/builtin-sched.c
+++ b/tools/perf/builtin-sched.c
@@ -22,7 +22,7 @@
22static char const *input_name = "perf.data"; 22static char const *input_name = "perf.data";
23 23
24static char default_sort_order[] = "avg, max, switch, runtime"; 24static char default_sort_order[] = "avg, max, switch, runtime";
25static char *sort_order = default_sort_order; 25static const char *sort_order = default_sort_order;
26 26
27static int profile_cpu = -1; 27static int profile_cpu = -1;
28 28
@@ -68,10 +68,10 @@ enum sched_event_type {
68 68
69struct sched_atom { 69struct sched_atom {
70 enum sched_event_type type; 70 enum sched_event_type type;
71 int specific_wait;
71 u64 timestamp; 72 u64 timestamp;
72 u64 duration; 73 u64 duration;
73 unsigned long nr; 74 unsigned long nr;
74 int specific_wait;
75 sem_t *wait_sem; 75 sem_t *wait_sem;
76 struct task_desc *wakee; 76 struct task_desc *wakee;
77}; 77};
@@ -105,7 +105,7 @@ static u64 sum_runtime;
105static u64 sum_fluct; 105static u64 sum_fluct;
106static u64 run_avg; 106static u64 run_avg;
107 107
108static unsigned long replay_repeat = 10; 108static unsigned int replay_repeat = 10;
109static unsigned long nr_timestamps; 109static unsigned long nr_timestamps;
110static unsigned long nr_unordered_timestamps; 110static unsigned long nr_unordered_timestamps;
111static unsigned long nr_state_machine_bugs; 111static unsigned long nr_state_machine_bugs;
@@ -1621,11 +1621,8 @@ static int process_sample_event(event_t *event, struct perf_session *session)
1621 1621
1622 event__parse_sample(event, session->sample_type, &data); 1622 event__parse_sample(event, session->sample_type, &data);
1623 1623
1624 dump_printf("(IP, %d): %d/%d: %p period: %Ld\n", 1624 dump_printf("(IP, %d): %d/%d: %#Lx period: %Ld\n", event->header.misc,
1625 event->header.misc, 1625 data.pid, data.tid, data.ip, data.period);
1626 data.pid, data.tid,
1627 (void *)(long)data.ip,
1628 (long long)data.period);
1629 1626
1630 thread = perf_session__findnew(session, data.pid); 1627 thread = perf_session__findnew(session, data.pid);
1631 if (thread == NULL) { 1628 if (thread == NULL) {
@@ -1644,42 +1641,28 @@ static int process_sample_event(event_t *event, struct perf_session *session)
1644 return 0; 1641 return 0;
1645} 1642}
1646 1643
1647static int process_lost_event(event_t *event __used,
1648 struct perf_session *session __used)
1649{
1650 nr_lost_chunks++;
1651 nr_lost_events += event->lost.lost;
1652
1653 return 0;
1654}
1655
1656static int sample_type_check(struct perf_session *session __used)
1657{
1658 if (!(session->sample_type & PERF_SAMPLE_RAW)) {
1659 fprintf(stderr,
1660 "No trace sample to read. Did you call perf record "
1661 "without -R?");
1662 return -1;
1663 }
1664
1665 return 0;
1666}
1667
1668static struct perf_event_ops event_ops = { 1644static struct perf_event_ops event_ops = {
1669 .process_sample_event = process_sample_event, 1645 .sample = process_sample_event,
1670 .process_comm_event = event__process_comm, 1646 .comm = event__process_comm,
1671 .process_lost_event = process_lost_event, 1647 .lost = event__process_lost,
1672 .sample_type_check = sample_type_check, 1648 .fork = event__process_task,
1649 .ordered_samples = true,
1673}; 1650};
1674 1651
1675static int read_events(void) 1652static int read_events(void)
1676{ 1653{
1677 int err; 1654 int err = -EINVAL;
1678 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); 1655 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false);
1679 if (session == NULL) 1656 if (session == NULL)
1680 return -ENOMEM; 1657 return -ENOMEM;
1681 1658
1682 err = perf_session__process_events(session, &event_ops); 1659 if (perf_session__has_traces(session, "record -R")) {
1660 err = perf_session__process_events(session, &event_ops);
1661 nr_events = session->hists.stats.nr_events[0];
1662 nr_lost_events = session->hists.stats.total_lost;
1663 nr_lost_chunks = session->hists.stats.nr_events[PERF_RECORD_LOST];
1664 }
1665
1683 perf_session__delete(session); 1666 perf_session__delete(session);
1684 return err; 1667 return err;
1685} 1668}
@@ -1804,7 +1787,7 @@ static const char * const sched_usage[] = {
1804static const struct option sched_options[] = { 1787static const struct option sched_options[] = {
1805 OPT_STRING('i', "input", &input_name, "file", 1788 OPT_STRING('i', "input", &input_name, "file",
1806 "input file name"), 1789 "input file name"),
1807 OPT_BOOLEAN('v', "verbose", &verbose, 1790 OPT_INCR('v', "verbose", &verbose,
1808 "be more verbose (show symbol address, etc)"), 1791 "be more verbose (show symbol address, etc)"),
1809 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, 1792 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
1810 "dump raw trace in ASCII"), 1793 "dump raw trace in ASCII"),
@@ -1819,7 +1802,7 @@ static const char * const latency_usage[] = {
1819static const struct option latency_options[] = { 1802static const struct option latency_options[] = {
1820 OPT_STRING('s', "sort", &sort_order, "key[,key2...]", 1803 OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
1821 "sort by key(s): runtime, switch, avg, max"), 1804 "sort by key(s): runtime, switch, avg, max"),
1822 OPT_BOOLEAN('v', "verbose", &verbose, 1805 OPT_INCR('v', "verbose", &verbose,
1823 "be more verbose (show symbol address, etc)"), 1806 "be more verbose (show symbol address, etc)"),
1824 OPT_INTEGER('C', "CPU", &profile_cpu, 1807 OPT_INTEGER('C', "CPU", &profile_cpu,
1825 "CPU to profile on"), 1808 "CPU to profile on"),
@@ -1834,9 +1817,9 @@ static const char * const replay_usage[] = {
1834}; 1817};
1835 1818
1836static const struct option replay_options[] = { 1819static const struct option replay_options[] = {
1837 OPT_INTEGER('r', "repeat", &replay_repeat, 1820 OPT_UINTEGER('r', "repeat", &replay_repeat,
1838 "repeat the workload replay N times (-1: infinite)"), 1821 "repeat the workload replay N times (-1: infinite)"),
1839 OPT_BOOLEAN('v', "verbose", &verbose, 1822 OPT_INCR('v', "verbose", &verbose,
1840 "be more verbose (show symbol address, etc)"), 1823 "be more verbose (show symbol address, etc)"),
1841 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, 1824 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
1842 "dump raw trace in ASCII"), 1825 "dump raw trace in ASCII"),
@@ -1864,7 +1847,6 @@ static const char *record_args[] = {
1864 "record", 1847 "record",
1865 "-a", 1848 "-a",
1866 "-R", 1849 "-R",
1867 "-M",
1868 "-f", 1850 "-f",
1869 "-m", "1024", 1851 "-m", "1024",
1870 "-c", "1", 1852 "-c", "1",
diff --git a/tools/perf/builtin-stat.c b/tools/perf/builtin-stat.c
index c70d72003557..9a39ca3c3ac4 100644
--- a/tools/perf/builtin-stat.c
+++ b/tools/perf/builtin-stat.c
@@ -44,9 +44,13 @@
44#include "util/parse-events.h" 44#include "util/parse-events.h"
45#include "util/event.h" 45#include "util/event.h"
46#include "util/debug.h" 46#include "util/debug.h"
47#include "util/header.h"
48#include "util/cpumap.h"
49#include "util/thread.h"
47 50
48#include <sys/prctl.h> 51#include <sys/prctl.h>
49#include <math.h> 52#include <math.h>
53#include <locale.h>
50 54
51static struct perf_event_attr default_attrs[] = { 55static struct perf_event_attr default_attrs[] = {
52 56
@@ -64,21 +68,28 @@ static struct perf_event_attr default_attrs[] = {
64 68
65}; 69};
66 70
67static int system_wide = 0; 71static bool system_wide = false;
68static unsigned int nr_cpus = 0; 72static unsigned int nr_cpus = 0;
69static int run_idx = 0; 73static int run_idx = 0;
70 74
71static int run_count = 1; 75static int run_count = 1;
72static int inherit = 1; 76static bool no_inherit = false;
73static int scale = 1; 77static bool scale = true;
74static pid_t target_pid = -1; 78static pid_t target_pid = -1;
79static pid_t target_tid = -1;
80static pid_t *all_tids = NULL;
81static int thread_num = 0;
75static pid_t child_pid = -1; 82static pid_t child_pid = -1;
76static int null_run = 0; 83static bool null_run = false;
84static bool big_num = false;
77 85
78static int fd[MAX_NR_CPUS][MAX_COUNTERS]; 86
87static int *fd[MAX_NR_CPUS][MAX_COUNTERS];
79 88
80static int event_scaled[MAX_COUNTERS]; 89static int event_scaled[MAX_COUNTERS];
81 90
91static volatile int done = 0;
92
82struct stats 93struct stats
83{ 94{
84 double n, mean, M2; 95 double n, mean, M2;
@@ -136,9 +147,11 @@ struct stats runtime_branches_stats;
136#define ERR_PERF_OPEN \ 147#define ERR_PERF_OPEN \
137"Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n" 148"Error: counter %d, sys_perf_event_open() syscall returned with %d (%s)\n"
138 149
139static void create_perf_stat_counter(int counter, int pid) 150static int create_perf_stat_counter(int counter)
140{ 151{
141 struct perf_event_attr *attr = attrs + counter; 152 struct perf_event_attr *attr = attrs + counter;
153 int thread;
154 int ncreated = 0;
142 155
143 if (scale) 156 if (scale)
144 attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED | 157 attr->read_format = PERF_FORMAT_TOTAL_TIME_ENABLED |
@@ -148,21 +161,33 @@ static void create_perf_stat_counter(int counter, int pid)
148 unsigned int cpu; 161 unsigned int cpu;
149 162
150 for (cpu = 0; cpu < nr_cpus; cpu++) { 163 for (cpu = 0; cpu < nr_cpus; cpu++) {
151 fd[cpu][counter] = sys_perf_event_open(attr, -1, cpu, -1, 0); 164 fd[cpu][counter][0] = sys_perf_event_open(attr,
152 if (fd[cpu][counter] < 0 && verbose) 165 -1, cpumap[cpu], -1, 0);
153 fprintf(stderr, ERR_PERF_OPEN, counter, 166 if (fd[cpu][counter][0] < 0)
154 fd[cpu][counter], strerror(errno)); 167 pr_debug(ERR_PERF_OPEN, counter,
168 fd[cpu][counter][0], strerror(errno));
169 else
170 ++ncreated;
155 } 171 }
156 } else { 172 } else {
157 attr->inherit = inherit; 173 attr->inherit = !no_inherit;
158 attr->disabled = 1; 174 if (target_pid == -1 && target_tid == -1) {
159 attr->enable_on_exec = 1; 175 attr->disabled = 1;
160 176 attr->enable_on_exec = 1;
161 fd[0][counter] = sys_perf_event_open(attr, pid, -1, -1, 0); 177 }
162 if (fd[0][counter] < 0 && verbose) 178 for (thread = 0; thread < thread_num; thread++) {
163 fprintf(stderr, ERR_PERF_OPEN, counter, 179 fd[0][counter][thread] = sys_perf_event_open(attr,
164 fd[0][counter], strerror(errno)); 180 all_tids[thread], -1, -1, 0);
181 if (fd[0][counter][thread] < 0)
182 pr_debug(ERR_PERF_OPEN, counter,
183 fd[0][counter][thread],
184 strerror(errno));
185 else
186 ++ncreated;
187 }
165 } 188 }
189
190 return ncreated;
166} 191}
167 192
168/* 193/*
@@ -186,25 +211,28 @@ static void read_counter(int counter)
186 unsigned int cpu; 211 unsigned int cpu;
187 size_t res, nv; 212 size_t res, nv;
188 int scaled; 213 int scaled;
189 int i; 214 int i, thread;
190 215
191 count[0] = count[1] = count[2] = 0; 216 count[0] = count[1] = count[2] = 0;
192 217
193 nv = scale ? 3 : 1; 218 nv = scale ? 3 : 1;
194 for (cpu = 0; cpu < nr_cpus; cpu++) { 219 for (cpu = 0; cpu < nr_cpus; cpu++) {
195 if (fd[cpu][counter] < 0) 220 for (thread = 0; thread < thread_num; thread++) {
196 continue; 221 if (fd[cpu][counter][thread] < 0)
197 222 continue;
198 res = read(fd[cpu][counter], single_count, nv * sizeof(u64)); 223
199 assert(res == nv * sizeof(u64)); 224 res = read(fd[cpu][counter][thread],
200 225 single_count, nv * sizeof(u64));
201 close(fd[cpu][counter]); 226 assert(res == nv * sizeof(u64));
202 fd[cpu][counter] = -1; 227
203 228 close(fd[cpu][counter][thread]);
204 count[0] += single_count[0]; 229 fd[cpu][counter][thread] = -1;
205 if (scale) { 230
206 count[1] += single_count[1]; 231 count[0] += single_count[0];
207 count[2] += single_count[2]; 232 if (scale) {
233 count[1] += single_count[1];
234 count[2] += single_count[2];
235 }
208 } 236 }
209 } 237 }
210 238
@@ -246,72 +274,88 @@ static int run_perf_stat(int argc __used, const char **argv)
246{ 274{
247 unsigned long long t0, t1; 275 unsigned long long t0, t1;
248 int status = 0; 276 int status = 0;
249 int counter; 277 int counter, ncreated = 0;
250 int pid;
251 int child_ready_pipe[2], go_pipe[2]; 278 int child_ready_pipe[2], go_pipe[2];
279 const bool forks = (argc > 0);
252 char buf; 280 char buf;
253 281
254 if (!system_wide) 282 if (!system_wide)
255 nr_cpus = 1; 283 nr_cpus = 1;
256 284
257 if (pipe(child_ready_pipe) < 0 || pipe(go_pipe) < 0) { 285 if (forks && (pipe(child_ready_pipe) < 0 || pipe(go_pipe) < 0)) {
258 perror("failed to create pipes"); 286 perror("failed to create pipes");
259 exit(1); 287 exit(1);
260 } 288 }
261 289
262 if ((pid = fork()) < 0) 290 if (forks) {
263 perror("failed to fork"); 291 if ((child_pid = fork()) < 0)
264 292 perror("failed to fork");
265 if (!pid) { 293
266 close(child_ready_pipe[0]); 294 if (!child_pid) {
267 close(go_pipe[1]); 295 close(child_ready_pipe[0]);
268 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC); 296 close(go_pipe[1]);
297 fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
298
299 /*
300 * Do a dummy execvp to get the PLT entry resolved,
301 * so we avoid the resolver overhead on the real
302 * execvp call.
303 */
304 execvp("", (char **)argv);
305
306 /*
307 * Tell the parent we're ready to go
308 */
309 close(child_ready_pipe[1]);
310
311 /*
312 * Wait until the parent tells us to go.
313 */
314 if (read(go_pipe[0], &buf, 1) == -1)
315 perror("unable to read pipe");
316
317 execvp(argv[0], (char **)argv);
318
319 perror(argv[0]);
320 exit(-1);
321 }
269 322
270 /* 323 if (target_tid == -1 && target_pid == -1 && !system_wide)
271 * Do a dummy execvp to get the PLT entry resolved, 324 all_tids[0] = child_pid;
272 * so we avoid the resolver overhead on the real
273 * execvp call.
274 */
275 execvp("", (char **)argv);
276 325
277 /* 326 /*
278 * Tell the parent we're ready to go 327 * Wait for the child to be ready to exec.
279 */ 328 */
280 close(child_ready_pipe[1]); 329 close(child_ready_pipe[1]);
281 330 close(go_pipe[0]);
282 /* 331 if (read(child_ready_pipe[0], &buf, 1) == -1)
283 * Wait until the parent tells us to go.
284 */
285 if (read(go_pipe[0], &buf, 1) == -1)
286 perror("unable to read pipe"); 332 perror("unable to read pipe");
287 333 close(child_ready_pipe[0]);
288 execvp(argv[0], (char **)argv);
289
290 perror(argv[0]);
291 exit(-1);
292 } 334 }
293 335
294 child_pid = pid;
295
296 /*
297 * Wait for the child to be ready to exec.
298 */
299 close(child_ready_pipe[1]);
300 close(go_pipe[0]);
301 if (read(child_ready_pipe[0], &buf, 1) == -1)
302 perror("unable to read pipe");
303 close(child_ready_pipe[0]);
304
305 for (counter = 0; counter < nr_counters; counter++) 336 for (counter = 0; counter < nr_counters; counter++)
306 create_perf_stat_counter(counter, pid); 337 ncreated += create_perf_stat_counter(counter);
338
339 if (ncreated == 0) {
340 pr_err("No permission to collect %sstats.\n"
341 "Consider tweaking /proc/sys/kernel/perf_event_paranoid.\n",
342 system_wide ? "system-wide " : "");
343 if (child_pid != -1)
344 kill(child_pid, SIGTERM);
345 return -1;
346 }
307 347
308 /* 348 /*
309 * Enable counters and exec the command: 349 * Enable counters and exec the command:
310 */ 350 */
311 t0 = rdclock(); 351 t0 = rdclock();
312 352
313 close(go_pipe[1]); 353 if (forks) {
314 wait(&status); 354 close(go_pipe[1]);
355 wait(&status);
356 } else {
357 while(!done) sleep(1);
358 }
315 359
316 t1 = rdclock(); 360 t1 = rdclock();
317 361
@@ -336,7 +380,7 @@ static void nsec_printout(int counter, double avg)
336{ 380{
337 double msecs = avg / 1e6; 381 double msecs = avg / 1e6;
338 382
339 fprintf(stderr, " %14.6f %-24s", msecs, event_name(counter)); 383 fprintf(stderr, " %18.6f %-24s", msecs, event_name(counter));
340 384
341 if (MATCH_EVENT(SOFTWARE, SW_TASK_CLOCK, counter)) { 385 if (MATCH_EVENT(SOFTWARE, SW_TASK_CLOCK, counter)) {
342 fprintf(stderr, " # %10.3f CPUs ", 386 fprintf(stderr, " # %10.3f CPUs ",
@@ -348,7 +392,10 @@ static void abs_printout(int counter, double avg)
348{ 392{
349 double total, ratio = 0.0; 393 double total, ratio = 0.0;
350 394
351 fprintf(stderr, " %14.0f %-24s", avg, event_name(counter)); 395 if (big_num)
396 fprintf(stderr, " %'18.0f %-24s", avg, event_name(counter));
397 else
398 fprintf(stderr, " %18.0f %-24s", avg, event_name(counter));
352 399
353 if (MATCH_EVENT(HARDWARE, HW_INSTRUCTIONS, counter)) { 400 if (MATCH_EVENT(HARDWARE, HW_INSTRUCTIONS, counter)) {
354 total = avg_stats(&runtime_cycles_stats); 401 total = avg_stats(&runtime_cycles_stats);
@@ -385,7 +432,7 @@ static void print_counter(int counter)
385 int scaled = event_scaled[counter]; 432 int scaled = event_scaled[counter];
386 433
387 if (scaled == -1) { 434 if (scaled == -1) {
388 fprintf(stderr, " %14s %-24s\n", 435 fprintf(stderr, " %18s %-24s\n",
389 "<not counted>", event_name(counter)); 436 "<not counted>", event_name(counter));
390 return; 437 return;
391 } 438 }
@@ -417,10 +464,15 @@ static void print_stat(int argc, const char **argv)
417 fflush(stdout); 464 fflush(stdout);
418 465
419 fprintf(stderr, "\n"); 466 fprintf(stderr, "\n");
420 fprintf(stderr, " Performance counter stats for \'%s", argv[0]); 467 fprintf(stderr, " Performance counter stats for ");
421 468 if(target_pid == -1 && target_tid == -1) {
422 for (i = 1; i < argc; i++) 469 fprintf(stderr, "\'%s", argv[0]);
423 fprintf(stderr, " %s", argv[i]); 470 for (i = 1; i < argc; i++)
471 fprintf(stderr, " %s", argv[i]);
472 } else if (target_pid != -1)
473 fprintf(stderr, "process id \'%d", target_pid);
474 else
475 fprintf(stderr, "thread id \'%d", target_tid);
424 476
425 fprintf(stderr, "\'"); 477 fprintf(stderr, "\'");
426 if (run_count > 1) 478 if (run_count > 1)
@@ -431,7 +483,7 @@ static void print_stat(int argc, const char **argv)
431 print_counter(counter); 483 print_counter(counter);
432 484
433 fprintf(stderr, "\n"); 485 fprintf(stderr, "\n");
434 fprintf(stderr, " %14.9f seconds time elapsed", 486 fprintf(stderr, " %18.9f seconds time elapsed",
435 avg_stats(&walltime_nsecs_stats)/1e9); 487 avg_stats(&walltime_nsecs_stats)/1e9);
436 if (run_count > 1) { 488 if (run_count > 1) {
437 fprintf(stderr, " ( +- %7.3f%% )", 489 fprintf(stderr, " ( +- %7.3f%% )",
@@ -445,6 +497,9 @@ static volatile int signr = -1;
445 497
446static void skip_signal(int signo) 498static void skip_signal(int signo)
447{ 499{
500 if(child_pid == -1)
501 done = 1;
502
448 signr = signo; 503 signr = signo;
449} 504}
450 505
@@ -461,7 +516,7 @@ static void sig_atexit(void)
461} 516}
462 517
463static const char * const stat_usage[] = { 518static const char * const stat_usage[] = {
464 "perf stat [<options>] <command>", 519 "perf stat [<options>] [<command>]",
465 NULL 520 NULL
466}; 521};
467 522
@@ -469,30 +524,37 @@ static const struct option options[] = {
469 OPT_CALLBACK('e', "event", NULL, "event", 524 OPT_CALLBACK('e', "event", NULL, "event",
470 "event selector. use 'perf list' to list available events", 525 "event selector. use 'perf list' to list available events",
471 parse_events), 526 parse_events),
472 OPT_BOOLEAN('i', "inherit", &inherit, 527 OPT_BOOLEAN('i', "no-inherit", &no_inherit,
473 "child tasks inherit counters"), 528 "child tasks do not inherit counters"),
474 OPT_INTEGER('p', "pid", &target_pid, 529 OPT_INTEGER('p', "pid", &target_pid,
475 "stat events on existing pid"), 530 "stat events on existing process id"),
531 OPT_INTEGER('t', "tid", &target_tid,
532 "stat events on existing thread id"),
476 OPT_BOOLEAN('a', "all-cpus", &system_wide, 533 OPT_BOOLEAN('a', "all-cpus", &system_wide,
477 "system-wide collection from all CPUs"), 534 "system-wide collection from all CPUs"),
478 OPT_BOOLEAN('c', "scale", &scale, 535 OPT_BOOLEAN('c', "scale", &scale,
479 "scale/normalize counters"), 536 "scale/normalize counters"),
480 OPT_BOOLEAN('v', "verbose", &verbose, 537 OPT_INCR('v', "verbose", &verbose,
481 "be more verbose (show counter open errors, etc)"), 538 "be more verbose (show counter open errors, etc)"),
482 OPT_INTEGER('r', "repeat", &run_count, 539 OPT_INTEGER('r', "repeat", &run_count,
483 "repeat command and print average + stddev (max: 100)"), 540 "repeat command and print average + stddev (max: 100)"),
484 OPT_BOOLEAN('n', "null", &null_run, 541 OPT_BOOLEAN('n', "null", &null_run,
485 "null run - dont start any counters"), 542 "null run - dont start any counters"),
543 OPT_BOOLEAN('B', "big-num", &big_num,
544 "print large numbers with thousands\' separators"),
486 OPT_END() 545 OPT_END()
487}; 546};
488 547
489int cmd_stat(int argc, const char **argv, const char *prefix __used) 548int cmd_stat(int argc, const char **argv, const char *prefix __used)
490{ 549{
491 int status; 550 int status;
551 int i,j;
552
553 setlocale(LC_ALL, "");
492 554
493 argc = parse_options(argc, argv, options, stat_usage, 555 argc = parse_options(argc, argv, options, stat_usage,
494 PARSE_OPT_STOP_AT_NON_OPTION); 556 PARSE_OPT_STOP_AT_NON_OPTION);
495 if (!argc) 557 if (!argc && target_pid == -1 && target_tid == -1)
496 usage_with_options(stat_usage, options); 558 usage_with_options(stat_usage, options);
497 if (run_count <= 0) 559 if (run_count <= 0)
498 usage_with_options(stat_usage, options); 560 usage_with_options(stat_usage, options);
@@ -503,9 +565,35 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used)
503 nr_counters = ARRAY_SIZE(default_attrs); 565 nr_counters = ARRAY_SIZE(default_attrs);
504 } 566 }
505 567
506 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN); 568 if (system_wide)
507 assert(nr_cpus <= MAX_NR_CPUS); 569 nr_cpus = read_cpu_map();
508 assert((int)nr_cpus >= 0); 570 else
571 nr_cpus = 1;
572
573 if (target_pid != -1) {
574 target_tid = target_pid;
575 thread_num = find_all_tid(target_pid, &all_tids);
576 if (thread_num <= 0) {
577 fprintf(stderr, "Can't find all threads of pid %d\n",
578 target_pid);
579 usage_with_options(stat_usage, options);
580 }
581 } else {
582 all_tids=malloc(sizeof(pid_t));
583 if (!all_tids)
584 return -ENOMEM;
585
586 all_tids[0] = target_tid;
587 thread_num = 1;
588 }
589
590 for (i = 0; i < MAX_NR_CPUS; i++) {
591 for (j = 0; j < MAX_COUNTERS; j++) {
592 fd[i][j] = malloc(sizeof(int)*thread_num);
593 if (!fd[i][j])
594 return -ENOMEM;
595 }
596 }
509 597
510 /* 598 /*
511 * We dont want to block the signals - that would cause 599 * We dont want to block the signals - that would cause
@@ -525,7 +613,8 @@ int cmd_stat(int argc, const char **argv, const char *prefix __used)
525 status = run_perf_stat(argc, argv); 613 status = run_perf_stat(argc, argv);
526 } 614 }
527 615
528 print_stat(argc, argv); 616 if (status != -1)
617 print_stat(argc, argv);
529 618
530 return status; 619 return status;
531} 620}
diff --git a/tools/perf/builtin-test.c b/tools/perf/builtin-test.c
new file mode 100644
index 000000000000..035b9fa063a9
--- /dev/null
+++ b/tools/perf/builtin-test.c
@@ -0,0 +1,281 @@
1/*
2 * builtin-test.c
3 *
4 * Builtin regression testing command: ever growing number of sanity tests
5 */
6#include "builtin.h"
7
8#include "util/cache.h"
9#include "util/debug.h"
10#include "util/parse-options.h"
11#include "util/session.h"
12#include "util/symbol.h"
13#include "util/thread.h"
14
15static long page_size;
16
17static int vmlinux_matches_kallsyms_filter(struct map *map __used, struct symbol *sym)
18{
19 bool *visited = symbol__priv(sym);
20 *visited = true;
21 return 0;
22}
23
24static int test__vmlinux_matches_kallsyms(void)
25{
26 int err = -1;
27 struct rb_node *nd;
28 struct symbol *sym;
29 struct map *kallsyms_map, *vmlinux_map;
30 struct machine kallsyms, vmlinux;
31 enum map_type type = MAP__FUNCTION;
32 struct ref_reloc_sym ref_reloc_sym = { .name = "_stext", };
33
34 /*
35 * Step 1:
36 *
37 * Init the machines that will hold kernel, modules obtained from
38 * both vmlinux + .ko files and from /proc/kallsyms split by modules.
39 */
40 machine__init(&kallsyms, "", HOST_KERNEL_ID);
41 machine__init(&vmlinux, "", HOST_KERNEL_ID);
42
43 /*
44 * Step 2:
45 *
46 * Create the kernel maps for kallsyms and the DSO where we will then
47 * load /proc/kallsyms. Also create the modules maps from /proc/modules
48 * and find the .ko files that match them in /lib/modules/`uname -r`/.
49 */
50 if (machine__create_kernel_maps(&kallsyms) < 0) {
51 pr_debug("machine__create_kernel_maps ");
52 return -1;
53 }
54
55 /*
56 * Step 3:
57 *
58 * Load and split /proc/kallsyms into multiple maps, one per module.
59 */
60 if (machine__load_kallsyms(&kallsyms, "/proc/kallsyms", type, NULL) <= 0) {
61 pr_debug("dso__load_kallsyms ");
62 goto out;
63 }
64
65 /*
66 * Step 4:
67 *
68 * kallsyms will be internally on demand sorted by name so that we can
69 * find the reference relocation * symbol, i.e. the symbol we will use
70 * to see if the running kernel was relocated by checking if it has the
71 * same value in the vmlinux file we load.
72 */
73 kallsyms_map = machine__kernel_map(&kallsyms, type);
74
75 sym = map__find_symbol_by_name(kallsyms_map, ref_reloc_sym.name, NULL);
76 if (sym == NULL) {
77 pr_debug("dso__find_symbol_by_name ");
78 goto out;
79 }
80
81 ref_reloc_sym.addr = sym->start;
82
83 /*
84 * Step 5:
85 *
86 * Now repeat step 2, this time for the vmlinux file we'll auto-locate.
87 */
88 if (machine__create_kernel_maps(&vmlinux) < 0) {
89 pr_debug("machine__create_kernel_maps ");
90 goto out;
91 }
92
93 vmlinux_map = machine__kernel_map(&vmlinux, type);
94 map__kmap(vmlinux_map)->ref_reloc_sym = &ref_reloc_sym;
95
96 /*
97 * Step 6:
98 *
99 * Locate a vmlinux file in the vmlinux path that has a buildid that
100 * matches the one of the running kernel.
101 *
102 * While doing that look if we find the ref reloc symbol, if we find it
103 * we'll have its ref_reloc_symbol.unrelocated_addr and then
104 * maps__reloc_vmlinux will notice and set proper ->[un]map_ip routines
105 * to fixup the symbols.
106 */
107 if (machine__load_vmlinux_path(&vmlinux, type,
108 vmlinux_matches_kallsyms_filter) <= 0) {
109 pr_debug("machine__load_vmlinux_path ");
110 goto out;
111 }
112
113 err = 0;
114 /*
115 * Step 7:
116 *
117 * Now look at the symbols in the vmlinux DSO and check if we find all of them
118 * in the kallsyms dso. For the ones that are in both, check its names and
119 * end addresses too.
120 */
121 for (nd = rb_first(&vmlinux_map->dso->symbols[type]); nd; nd = rb_next(nd)) {
122 struct symbol *pair;
123
124 sym = rb_entry(nd, struct symbol, rb_node);
125 pair = machine__find_kernel_symbol(&kallsyms, type, sym->start, NULL, NULL);
126
127 if (pair && pair->start == sym->start) {
128next_pair:
129 if (strcmp(sym->name, pair->name) == 0) {
130 /*
131 * kallsyms don't have the symbol end, so we
132 * set that by using the next symbol start - 1,
133 * in some cases we get this up to a page
134 * wrong, trace_kmalloc when I was developing
135 * this code was one such example, 2106 bytes
136 * off the real size. More than that and we
137 * _really_ have a problem.
138 */
139 s64 skew = sym->end - pair->end;
140 if (llabs(skew) < page_size)
141 continue;
142
143 pr_debug("%#Lx: diff end addr for %s v: %#Lx k: %#Lx\n",
144 sym->start, sym->name, sym->end, pair->end);
145 } else {
146 struct rb_node *nnd = rb_prev(&pair->rb_node);
147
148 if (nnd) {
149 struct symbol *next = rb_entry(nnd, struct symbol, rb_node);
150
151 if (next->start == sym->start) {
152 pair = next;
153 goto next_pair;
154 }
155 }
156 pr_debug("%#Lx: diff name v: %s k: %s\n",
157 sym->start, sym->name, pair->name);
158 }
159 } else
160 pr_debug("%#Lx: %s not on kallsyms\n", sym->start, sym->name);
161
162 err = -1;
163 }
164
165 if (!verbose)
166 goto out;
167
168 pr_info("Maps only in vmlinux:\n");
169
170 for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) {
171 struct map *pos = rb_entry(nd, struct map, rb_node), *pair;
172 /*
173 * If it is the kernel, kallsyms is always "[kernel.kallsyms]", while
174 * the kernel will have the path for the vmlinux file being used,
175 * so use the short name, less descriptive but the same ("[kernel]" in
176 * both cases.
177 */
178 pair = map_groups__find_by_name(&kallsyms.kmaps, type,
179 (pos->dso->kernel ?
180 pos->dso->short_name :
181 pos->dso->name));
182 if (pair)
183 pair->priv = 1;
184 else
185 map__fprintf(pos, stderr);
186 }
187
188 pr_info("Maps in vmlinux with a different name in kallsyms:\n");
189
190 for (nd = rb_first(&vmlinux.kmaps.maps[type]); nd; nd = rb_next(nd)) {
191 struct map *pos = rb_entry(nd, struct map, rb_node), *pair;
192
193 pair = map_groups__find(&kallsyms.kmaps, type, pos->start);
194 if (pair == NULL || pair->priv)
195 continue;
196
197 if (pair->start == pos->start) {
198 pair->priv = 1;
199 pr_info(" %Lx-%Lx %Lx %s in kallsyms as",
200 pos->start, pos->end, pos->pgoff, pos->dso->name);
201 if (pos->pgoff != pair->pgoff || pos->end != pair->end)
202 pr_info(": \n*%Lx-%Lx %Lx",
203 pair->start, pair->end, pair->pgoff);
204 pr_info(" %s\n", pair->dso->name);
205 pair->priv = 1;
206 }
207 }
208
209 pr_info("Maps only in kallsyms:\n");
210
211 for (nd = rb_first(&kallsyms.kmaps.maps[type]);
212 nd; nd = rb_next(nd)) {
213 struct map *pos = rb_entry(nd, struct map, rb_node);
214
215 if (!pos->priv)
216 map__fprintf(pos, stderr);
217 }
218out:
219 return err;
220}
221
222static struct test {
223 const char *desc;
224 int (*func)(void);
225} tests[] = {
226 {
227 .desc = "vmlinux symtab matches kallsyms",
228 .func = test__vmlinux_matches_kallsyms,
229 },
230 {
231 .func = NULL,
232 },
233};
234
235static int __cmd_test(void)
236{
237 int i = 0;
238
239 page_size = sysconf(_SC_PAGE_SIZE);
240
241 while (tests[i].func) {
242 int err;
243 pr_info("%2d: %s:", i + 1, tests[i].desc);
244 pr_debug("\n--- start ---\n");
245 err = tests[i].func();
246 pr_debug("---- end ----\n%s:", tests[i].desc);
247 pr_info(" %s\n", err ? "FAILED!\n" : "Ok");
248 ++i;
249 }
250
251 return 0;
252}
253
/* NULL-terminated usage lines for 'perf test', used by usage_with_options(). */
static const char * const test_usage[] = {
	"perf test [<options>]",
	NULL
};
258
259static const struct option test_options[] = {
260 OPT_INTEGER('v', "verbose", &verbose,
261 "be more verbose (show symbol address, etc)"),
262 OPT_END()
263};
264
265int cmd_test(int argc, const char **argv, const char *prefix __used)
266{
267 argc = parse_options(argc, argv, test_options, test_usage, 0);
268 if (argc)
269 usage_with_options(test_usage, test_options);
270
271 symbol_conf.priv_size = sizeof(int);
272 symbol_conf.sort_by_name = true;
273 symbol_conf.try_vmlinux_path = true;
274
275 if (symbol__init() < 0)
276 return -1;
277
278 setup_pager();
279
280 return __cmd_test();
281}
diff --git a/tools/perf/builtin-timechart.c b/tools/perf/builtin-timechart.c
index 3f8bbcfb1e9b..5a52ed9fc10b 100644
--- a/tools/perf/builtin-timechart.c
+++ b/tools/perf/builtin-timechart.c
@@ -21,7 +21,6 @@
21#include "util/cache.h" 21#include "util/cache.h"
22#include <linux/rbtree.h> 22#include <linux/rbtree.h>
23#include "util/symbol.h" 23#include "util/symbol.h"
24#include "util/string.h"
25#include "util/callchain.h" 24#include "util/callchain.h"
26#include "util/strlist.h" 25#include "util/strlist.h"
27 26
@@ -43,7 +42,7 @@ static u64 turbo_frequency;
43 42
44static u64 first_time, last_time; 43static u64 first_time, last_time;
45 44
46static int power_only; 45static bool power_only;
47 46
48 47
49struct per_pid; 48struct per_pid;
@@ -78,8 +77,6 @@ struct per_pid {
78 77
79 struct per_pidcomm *all; 78 struct per_pidcomm *all;
80 struct per_pidcomm *current; 79 struct per_pidcomm *current;
81
82 int painted;
83}; 80};
84 81
85 82
@@ -146,9 +143,6 @@ struct wake_event {
146static struct power_event *power_events; 143static struct power_event *power_events;
147static struct wake_event *wake_events; 144static struct wake_event *wake_events;
148 145
149struct sample_wrapper *all_samples;
150
151
152struct process_filter; 146struct process_filter;
153struct process_filter { 147struct process_filter {
154 char *name; 148 char *name;
@@ -569,88 +563,6 @@ static void end_sample_processing(void)
569 } 563 }
570} 564}
571 565
572static u64 sample_time(event_t *event, const struct perf_session *session)
573{
574 int cursor;
575
576 cursor = 0;
577 if (session->sample_type & PERF_SAMPLE_IP)
578 cursor++;
579 if (session->sample_type & PERF_SAMPLE_TID)
580 cursor++;
581 if (session->sample_type & PERF_SAMPLE_TIME)
582 return event->sample.array[cursor];
583 return 0;
584}
585
586
587/*
588 * We first queue all events, sorted backwards by insertion.
589 * The order will get flipped later.
590 */
591static int queue_sample_event(event_t *event, struct perf_session *session)
592{
593 struct sample_wrapper *copy, *prev;
594 int size;
595
596 size = event->sample.header.size + sizeof(struct sample_wrapper) + 8;
597
598 copy = malloc(size);
599 if (!copy)
600 return 1;
601
602 memset(copy, 0, size);
603
604 copy->next = NULL;
605 copy->timestamp = sample_time(event, session);
606
607 memcpy(&copy->data, event, event->sample.header.size);
608
609 /* insert in the right place in the list */
610
611 if (!all_samples) {
612 /* first sample ever */
613 all_samples = copy;
614 return 0;
615 }
616
617 if (all_samples->timestamp < copy->timestamp) {
618 /* insert at the head of the list */
619 copy->next = all_samples;
620 all_samples = copy;
621 return 0;
622 }
623
624 prev = all_samples;
625 while (prev->next) {
626 if (prev->next->timestamp < copy->timestamp) {
627 copy->next = prev->next;
628 prev->next = copy;
629 return 0;
630 }
631 prev = prev->next;
632 }
633 /* insert at the end of the list */
634 prev->next = copy;
635
636 return 0;
637}
638
639static void sort_queued_samples(void)
640{
641 struct sample_wrapper *cursor, *next;
642
643 cursor = all_samples;
644 all_samples = NULL;
645
646 while (cursor) {
647 next = cursor->next;
648 cursor->next = all_samples;
649 all_samples = cursor;
650 cursor = next;
651 }
652}
653
654/* 566/*
655 * Sort the pid datastructure 567 * Sort the pid datastructure
656 */ 568 */
@@ -1014,54 +926,29 @@ static void write_svg_file(const char *filename)
1014 svg_close(); 926 svg_close();
1015} 927}
1016 928
1017static void process_samples(struct perf_session *session)
1018{
1019 struct sample_wrapper *cursor;
1020 event_t *event;
1021
1022 sort_queued_samples();
1023
1024 cursor = all_samples;
1025 while (cursor) {
1026 event = (void *)&cursor->data;
1027 cursor = cursor->next;
1028 process_sample_event(event, session);
1029 }
1030}
1031
1032static int sample_type_check(struct perf_session *session)
1033{
1034 if (!(session->sample_type & PERF_SAMPLE_RAW)) {
1035 fprintf(stderr, "No trace samples found in the file.\n"
1036 "Have you used 'perf timechart record' to record it?\n");
1037 return -1;
1038 }
1039
1040 return 0;
1041}
1042
1043static struct perf_event_ops event_ops = { 929static struct perf_event_ops event_ops = {
1044 .process_comm_event = process_comm_event, 930 .comm = process_comm_event,
1045 .process_fork_event = process_fork_event, 931 .fork = process_fork_event,
1046 .process_exit_event = process_exit_event, 932 .exit = process_exit_event,
1047 .process_sample_event = queue_sample_event, 933 .sample = process_sample_event,
1048 .sample_type_check = sample_type_check, 934 .ordered_samples = true,
1049}; 935};
1050 936
1051static int __cmd_timechart(void) 937static int __cmd_timechart(void)
1052{ 938{
1053 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0); 939 struct perf_session *session = perf_session__new(input_name, O_RDONLY, 0, false);
1054 int ret; 940 int ret = -EINVAL;
1055 941
1056 if (session == NULL) 942 if (session == NULL)
1057 return -ENOMEM; 943 return -ENOMEM;
1058 944
945 if (!perf_session__has_traces(session, "timechart record"))
946 goto out_delete;
947
1059 ret = perf_session__process_events(session, &event_ops); 948 ret = perf_session__process_events(session, &event_ops);
1060 if (ret) 949 if (ret)
1061 goto out_delete; 950 goto out_delete;
1062 951
1063 process_samples(session);
1064
1065 end_sample_processing(); 952 end_sample_processing();
1066 953
1067 sort_pids(); 954 sort_pids();
@@ -1084,7 +971,6 @@ static const char *record_args[] = {
1084 "record", 971 "record",
1085 "-a", 972 "-a",
1086 "-R", 973 "-R",
1087 "-M",
1088 "-f", 974 "-f",
1089 "-c", "1", 975 "-c", "1",
1090 "-e", "power:power_start", 976 "-e", "power:power_start",
diff --git a/tools/perf/builtin-top.c b/tools/perf/builtin-top.c
index 4b91d8cf00ec..a66f4272b994 100644
--- a/tools/perf/builtin-top.c
+++ b/tools/perf/builtin-top.c
@@ -28,6 +28,7 @@
28#include <linux/rbtree.h> 28#include <linux/rbtree.h>
29#include "util/parse-options.h" 29#include "util/parse-options.h"
30#include "util/parse-events.h" 30#include "util/parse-events.h"
31#include "util/cpumap.h"
31 32
32#include "util/debug.h" 33#include "util/debug.h"
33 34
@@ -54,9 +55,9 @@
54#include <linux/unistd.h> 55#include <linux/unistd.h>
55#include <linux/types.h> 56#include <linux/types.h>
56 57
57static int fd[MAX_NR_CPUS][MAX_COUNTERS]; 58static int *fd[MAX_NR_CPUS][MAX_COUNTERS];
58 59
59static int system_wide = 0; 60static bool system_wide = false;
60 61
61static int default_interval = 0; 62static int default_interval = 0;
62 63
@@ -64,18 +65,21 @@ static int count_filter = 5;
64static int print_entries; 65static int print_entries;
65 66
66static int target_pid = -1; 67static int target_pid = -1;
67static int inherit = 0; 68static int target_tid = -1;
69static pid_t *all_tids = NULL;
70static int thread_num = 0;
71static bool inherit = false;
68static int profile_cpu = -1; 72static int profile_cpu = -1;
69static int nr_cpus = 0; 73static int nr_cpus = 0;
70static unsigned int realtime_prio = 0; 74static int realtime_prio = 0;
71static int group = 0; 75static bool group = false;
72static unsigned int page_size; 76static unsigned int page_size;
73static unsigned int mmap_pages = 16; 77static unsigned int mmap_pages = 16;
74static int freq = 1000; /* 1 KHz */ 78static int freq = 1000; /* 1 KHz */
75 79
76static int delay_secs = 2; 80static int delay_secs = 2;
77static int zero = 0; 81static bool zero = false;
78static int dump_symtab = 0; 82static bool dump_symtab = false;
79 83
80static bool hide_kernel_symbols = false; 84static bool hide_kernel_symbols = false;
81static bool hide_user_symbols = false; 85static bool hide_user_symbols = false;
@@ -92,8 +96,9 @@ struct source_line {
92 struct source_line *next; 96 struct source_line *next;
93}; 97};
94 98
95static char *sym_filter = NULL; 99static const char *sym_filter = NULL;
96struct sym_entry *sym_filter_entry = NULL; 100struct sym_entry *sym_filter_entry = NULL;
101struct sym_entry *sym_filter_entry_sched = NULL;
97static int sym_pcnt_filter = 5; 102static int sym_pcnt_filter = 5;
98static int sym_counter = 0; 103static int sym_counter = 0;
99static int display_weighted = -1; 104static int display_weighted = -1;
@@ -131,7 +136,7 @@ static inline struct symbol *sym_entry__symbol(struct sym_entry *self)
131 return ((void *)self) + symbol_conf.priv_size; 136 return ((void *)self) + symbol_conf.priv_size;
132} 137}
133 138
134static void get_term_dimensions(struct winsize *ws) 139void get_term_dimensions(struct winsize *ws)
135{ 140{
136 char *s = getenv("LINES"); 141 char *s = getenv("LINES");
137 142
@@ -167,7 +172,7 @@ static void sig_winch_handler(int sig __used)
167 update_print_entries(&winsize); 172 update_print_entries(&winsize);
168} 173}
169 174
170static void parse_source(struct sym_entry *syme) 175static int parse_source(struct sym_entry *syme)
171{ 176{
172 struct symbol *sym; 177 struct symbol *sym;
173 struct sym_entry_source *source; 178 struct sym_entry_source *source;
@@ -178,12 +183,21 @@ static void parse_source(struct sym_entry *syme)
178 u64 len; 183 u64 len;
179 184
180 if (!syme) 185 if (!syme)
181 return; 186 return -1;
187
188 sym = sym_entry__symbol(syme);
189 map = syme->map;
190
191 /*
192 * We can't annotate with just /proc/kallsyms
193 */
194 if (map->dso->origin == DSO__ORIG_KERNEL)
195 return -1;
182 196
183 if (syme->src == NULL) { 197 if (syme->src == NULL) {
184 syme->src = zalloc(sizeof(*source)); 198 syme->src = zalloc(sizeof(*source));
185 if (syme->src == NULL) 199 if (syme->src == NULL)
186 return; 200 return -1;
187 pthread_mutex_init(&syme->src->lock, NULL); 201 pthread_mutex_init(&syme->src->lock, NULL);
188 } 202 }
189 203
@@ -193,29 +207,25 @@ static void parse_source(struct sym_entry *syme)
193 pthread_mutex_lock(&source->lock); 207 pthread_mutex_lock(&source->lock);
194 goto out_assign; 208 goto out_assign;
195 } 209 }
196
197 sym = sym_entry__symbol(syme);
198 map = syme->map;
199 path = map->dso->long_name; 210 path = map->dso->long_name;
200 211
201 len = sym->end - sym->start; 212 len = sym->end - sym->start;
202 213
203 sprintf(command, 214 sprintf(command,
204 "objdump --start-address=0x%016Lx " 215 "objdump --start-address=%#0*Lx --stop-address=%#0*Lx -dS %s",
205 "--stop-address=0x%016Lx -dS %s", 216 BITS_PER_LONG / 4, map__rip_2objdump(map, sym->start),
206 map->unmap_ip(map, sym->start), 217 BITS_PER_LONG / 4, map__rip_2objdump(map, sym->end), path);
207 map->unmap_ip(map, sym->end), path);
208 218
209 file = popen(command, "r"); 219 file = popen(command, "r");
210 if (!file) 220 if (!file)
211 return; 221 return -1;
212 222
213 pthread_mutex_lock(&source->lock); 223 pthread_mutex_lock(&source->lock);
214 source->lines_tail = &source->lines; 224 source->lines_tail = &source->lines;
215 while (!feof(file)) { 225 while (!feof(file)) {
216 struct source_line *src; 226 struct source_line *src;
217 size_t dummy = 0; 227 size_t dummy = 0;
218 char *c; 228 char *c, *sep;
219 229
220 src = malloc(sizeof(struct source_line)); 230 src = malloc(sizeof(struct source_line));
221 assert(src != NULL); 231 assert(src != NULL);
@@ -234,19 +244,17 @@ static void parse_source(struct sym_entry *syme)
234 *source->lines_tail = src; 244 *source->lines_tail = src;
235 source->lines_tail = &src->next; 245 source->lines_tail = &src->next;
236 246
237 if (strlen(src->line)>8 && src->line[8] == ':') { 247 src->eip = strtoull(src->line, &sep, 16);
238 src->eip = strtoull(src->line, NULL, 16); 248 if (*sep == ':')
239 src->eip = map->unmap_ip(map, src->eip); 249 src->eip = map__objdump_2ip(map, src->eip);
240 } 250 else /* this line has no ip info (e.g. source line) */
241 if (strlen(src->line)>8 && src->line[16] == ':') { 251 src->eip = 0;
242 src->eip = strtoull(src->line, NULL, 16);
243 src->eip = map->unmap_ip(map, src->eip);
244 }
245 } 252 }
246 pclose(file); 253 pclose(file);
247out_assign: 254out_assign:
248 sym_filter_entry = syme; 255 sym_filter_entry = syme;
249 pthread_mutex_unlock(&source->lock); 256 pthread_mutex_unlock(&source->lock);
257 return 0;
250} 258}
251 259
252static void __zero_source_counters(struct sym_entry *syme) 260static void __zero_source_counters(struct sym_entry *syme)
@@ -276,6 +284,9 @@ static void record_precise_ip(struct sym_entry *syme, int counter, u64 ip)
276 goto out_unlock; 284 goto out_unlock;
277 285
278 for (line = syme->src->lines; line; line = line->next) { 286 for (line = syme->src->lines; line; line = line->next) {
287 /* skip lines without IP info */
288 if (line->eip == 0)
289 continue;
279 if (line->eip == ip) { 290 if (line->eip == ip) {
280 line->count[counter]++; 291 line->count[counter]++;
281 break; 292 break;
@@ -287,17 +298,20 @@ out_unlock:
287 pthread_mutex_unlock(&syme->src->lock); 298 pthread_mutex_unlock(&syme->src->lock);
288} 299}
289 300
301#define PATTERN_LEN (BITS_PER_LONG / 4 + 2)
302
290static void lookup_sym_source(struct sym_entry *syme) 303static void lookup_sym_source(struct sym_entry *syme)
291{ 304{
292 struct symbol *symbol = sym_entry__symbol(syme); 305 struct symbol *symbol = sym_entry__symbol(syme);
293 struct source_line *line; 306 struct source_line *line;
294 char pattern[PATH_MAX]; 307 char pattern[PATTERN_LEN + 1];
295 308
296 sprintf(pattern, "<%s>:", symbol->name); 309 sprintf(pattern, "%0*Lx <", BITS_PER_LONG / 4,
310 map__rip_2objdump(syme->map, symbol->start));
297 311
298 pthread_mutex_lock(&syme->src->lock); 312 pthread_mutex_lock(&syme->src->lock);
299 for (line = syme->src->lines; line; line = line->next) { 313 for (line = syme->src->lines; line; line = line->next) {
300 if (strstr(line->line, pattern)) { 314 if (memcmp(line->line, pattern, PATTERN_LEN) == 0) {
301 syme->src->source = line; 315 syme->src->source = line;
302 break; 316 break;
303 } 317 }
@@ -406,7 +420,9 @@ static double sym_weight(const struct sym_entry *sym)
406} 420}
407 421
408static long samples; 422static long samples;
409static long userspace_samples; 423static long kernel_samples, us_samples;
424static long exact_samples;
425static long guest_us_samples, guest_kernel_samples;
410static const char CONSOLE_CLEAR[] = ""; 426static const char CONSOLE_CLEAR[] = "";
411 427
412static void __list_insert_active_sym(struct sym_entry *syme) 428static void __list_insert_active_sym(struct sym_entry *syme)
@@ -446,15 +462,20 @@ static void print_sym_table(void)
446 int printed = 0, j; 462 int printed = 0, j;
447 int counter, snap = !display_weighted ? sym_counter : 0; 463 int counter, snap = !display_weighted ? sym_counter : 0;
448 float samples_per_sec = samples/delay_secs; 464 float samples_per_sec = samples/delay_secs;
449 float ksamples_per_sec = (samples-userspace_samples)/delay_secs; 465 float ksamples_per_sec = kernel_samples/delay_secs;
466 float us_samples_per_sec = (us_samples)/delay_secs;
467 float guest_kernel_samples_per_sec = (guest_kernel_samples)/delay_secs;
468 float guest_us_samples_per_sec = (guest_us_samples)/delay_secs;
469 float esamples_percent = (100.0*exact_samples)/samples;
450 float sum_ksamples = 0.0; 470 float sum_ksamples = 0.0;
451 struct sym_entry *syme, *n; 471 struct sym_entry *syme, *n;
452 struct rb_root tmp = RB_ROOT; 472 struct rb_root tmp = RB_ROOT;
453 struct rb_node *nd; 473 struct rb_node *nd;
454 int sym_width = 0, dso_width = 0, max_dso_width; 474 int sym_width = 0, dso_width = 0, dso_short_width = 0;
455 const int win_width = winsize.ws_col - 1; 475 const int win_width = winsize.ws_col - 1;
456 476
457 samples = userspace_samples = 0; 477 samples = us_samples = kernel_samples = exact_samples = 0;
478 guest_kernel_samples = guest_us_samples = 0;
458 479
459 /* Sort the active symbols */ 480 /* Sort the active symbols */
460 pthread_mutex_lock(&active_symbols_lock); 481 pthread_mutex_lock(&active_symbols_lock);
@@ -485,9 +506,30 @@ static void print_sym_table(void)
485 puts(CONSOLE_CLEAR); 506 puts(CONSOLE_CLEAR);
486 507
487 printf("%-*.*s\n", win_width, win_width, graph_dotted_line); 508 printf("%-*.*s\n", win_width, win_width, graph_dotted_line);
488 printf( " PerfTop:%8.0f irqs/sec kernel:%4.1f%% [", 509 if (!perf_guest) {
489 samples_per_sec, 510 printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%%"
490 100.0 - (100.0*((samples_per_sec-ksamples_per_sec)/samples_per_sec))); 511 " exact: %4.1f%% [",
512 samples_per_sec,
513 100.0 - (100.0 * ((samples_per_sec - ksamples_per_sec) /
514 samples_per_sec)),
515 esamples_percent);
516 } else {
517 printf(" PerfTop:%8.0f irqs/sec kernel:%4.1f%% us:%4.1f%%"
518 " guest kernel:%4.1f%% guest us:%4.1f%%"
519 " exact: %4.1f%% [",
520 samples_per_sec,
521 100.0 - (100.0 * ((samples_per_sec-ksamples_per_sec) /
522 samples_per_sec)),
523 100.0 - (100.0 * ((samples_per_sec-us_samples_per_sec) /
524 samples_per_sec)),
525 100.0 - (100.0 * ((samples_per_sec -
526 guest_kernel_samples_per_sec) /
527 samples_per_sec)),
528 100.0 - (100.0 * ((samples_per_sec -
529 guest_us_samples_per_sec) /
530 samples_per_sec)),
531 esamples_percent);
532 }
491 533
492 if (nr_counters == 1 || !display_weighted) { 534 if (nr_counters == 1 || !display_weighted) {
493 printf("%Ld", (u64)attrs[0].sample_period); 535 printf("%Ld", (u64)attrs[0].sample_period);
@@ -510,13 +552,15 @@ static void print_sym_table(void)
510 552
511 if (target_pid != -1) 553 if (target_pid != -1)
512 printf(" (target_pid: %d", target_pid); 554 printf(" (target_pid: %d", target_pid);
555 else if (target_tid != -1)
556 printf(" (target_tid: %d", target_tid);
513 else 557 else
514 printf(" (all"); 558 printf(" (all");
515 559
516 if (profile_cpu != -1) 560 if (profile_cpu != -1)
517 printf(", cpu: %d)\n", profile_cpu); 561 printf(", cpu: %d)\n", profile_cpu);
518 else { 562 else {
519 if (target_pid != -1) 563 if (target_tid != -1)
520 printf(")\n"); 564 printf(")\n");
521 else 565 else
522 printf(", %d CPUs)\n", nr_cpus); 566 printf(", %d CPUs)\n", nr_cpus);
@@ -541,15 +585,20 @@ static void print_sym_table(void)
541 if (syme->map->dso->long_name_len > dso_width) 585 if (syme->map->dso->long_name_len > dso_width)
542 dso_width = syme->map->dso->long_name_len; 586 dso_width = syme->map->dso->long_name_len;
543 587
588 if (syme->map->dso->short_name_len > dso_short_width)
589 dso_short_width = syme->map->dso->short_name_len;
590
544 if (syme->name_len > sym_width) 591 if (syme->name_len > sym_width)
545 sym_width = syme->name_len; 592 sym_width = syme->name_len;
546 } 593 }
547 594
548 printed = 0; 595 printed = 0;
549 596
550 max_dso_width = winsize.ws_col - sym_width - 29; 597 if (sym_width + dso_width > winsize.ws_col - 29) {
551 if (dso_width > max_dso_width) 598 dso_width = dso_short_width;
552 dso_width = max_dso_width; 599 if (sym_width + dso_width > winsize.ws_col - 29)
600 sym_width = winsize.ws_col - dso_width - 29;
601 }
553 putchar('\n'); 602 putchar('\n');
554 if (nr_counters == 1) 603 if (nr_counters == 1)
555 printf(" samples pcnt"); 604 printf(" samples pcnt");
@@ -573,7 +622,6 @@ static void print_sym_table(void)
573 622
574 syme = rb_entry(nd, struct sym_entry, rb_node); 623 syme = rb_entry(nd, struct sym_entry, rb_node);
575 sym = sym_entry__symbol(syme); 624 sym = sym_entry__symbol(syme);
576
577 if (++printed > print_entries || (int)syme->snap_count < count_filter) 625 if (++printed > print_entries || (int)syme->snap_count < count_filter)
578 continue; 626 continue;
579 627
@@ -667,7 +715,7 @@ static void prompt_symbol(struct sym_entry **target, const char *msg)
667 } 715 }
668 716
669 if (!found) { 717 if (!found) {
670 fprintf(stderr, "Sorry, %s is not active.\n", sym_filter); 718 fprintf(stderr, "Sorry, %s is not active.\n", buf);
671 sleep(1); 719 sleep(1);
672 return; 720 return;
673 } else 721 } else
@@ -695,11 +743,9 @@ static void print_mapped_keys(void)
695 743
696 fprintf(stdout, "\t[f] profile display filter (count). \t(%d)\n", count_filter); 744 fprintf(stdout, "\t[f] profile display filter (count). \t(%d)\n", count_filter);
697 745
698 if (symbol_conf.vmlinux_name) { 746 fprintf(stdout, "\t[F] annotate display filter (percent). \t(%d%%)\n", sym_pcnt_filter);
699 fprintf(stdout, "\t[F] annotate display filter (percent). \t(%d%%)\n", sym_pcnt_filter); 747 fprintf(stdout, "\t[s] annotate symbol. \t(%s)\n", name?: "NULL");
700 fprintf(stdout, "\t[s] annotate symbol. \t(%s)\n", name?: "NULL"); 748 fprintf(stdout, "\t[S] stop annotation.\n");
701 fprintf(stdout, "\t[S] stop annotation.\n");
702 }
703 749
704 if (nr_counters > 1) 750 if (nr_counters > 1)
705 fprintf(stdout, "\t[w] toggle display weighted/count[E]r. \t(%d)\n", display_weighted ? 1 : 0); 751 fprintf(stdout, "\t[w] toggle display weighted/count[E]r. \t(%d)\n", display_weighted ? 1 : 0);
@@ -725,14 +771,13 @@ static int key_mapped(int c)
725 case 'Q': 771 case 'Q':
726 case 'K': 772 case 'K':
727 case 'U': 773 case 'U':
774 case 'F':
775 case 's':
776 case 'S':
728 return 1; 777 return 1;
729 case 'E': 778 case 'E':
730 case 'w': 779 case 'w':
731 return nr_counters > 1 ? 1 : 0; 780 return nr_counters > 1 ? 1 : 0;
732 case 'F':
733 case 's':
734 case 'S':
735 return symbol_conf.vmlinux_name ? 1 : 0;
736 default: 781 default:
737 break; 782 break;
738 } 783 }
@@ -740,7 +785,7 @@ static int key_mapped(int c)
740 return 0; 785 return 0;
741} 786}
742 787
743static void handle_keypress(int c) 788static void handle_keypress(struct perf_session *session, int c)
744{ 789{
745 if (!key_mapped(c)) { 790 if (!key_mapped(c)) {
746 struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; 791 struct pollfd stdin_poll = { .fd = 0, .events = POLLIN };
@@ -809,7 +854,7 @@ static void handle_keypress(int c)
809 case 'Q': 854 case 'Q':
810 printf("exiting.\n"); 855 printf("exiting.\n");
811 if (dump_symtab) 856 if (dump_symtab)
812 dsos__fprintf(stderr); 857 perf_session__fprintf_dsos(session, stderr);
813 exit(0); 858 exit(0);
814 case 's': 859 case 's':
815 prompt_symbol(&sym_filter_entry, "Enter details symbol"); 860 prompt_symbol(&sym_filter_entry, "Enter details symbol");
@@ -833,7 +878,7 @@ static void handle_keypress(int c)
833 display_weighted = ~display_weighted; 878 display_weighted = ~display_weighted;
834 break; 879 break;
835 case 'z': 880 case 'z':
836 zero = ~zero; 881 zero = !zero;
837 break; 882 break;
838 default: 883 default:
839 break; 884 break;
@@ -845,6 +890,7 @@ static void *display_thread(void *arg __used)
845 struct pollfd stdin_poll = { .fd = 0, .events = POLLIN }; 890 struct pollfd stdin_poll = { .fd = 0, .events = POLLIN };
846 struct termios tc, save; 891 struct termios tc, save;
847 int delay_msecs, c; 892 int delay_msecs, c;
893 struct perf_session *session = (struct perf_session *) arg;
848 894
849 tcgetattr(0, &save); 895 tcgetattr(0, &save);
850 tc = save; 896 tc = save;
@@ -865,7 +911,7 @@ repeat:
865 c = getc(stdin); 911 c = getc(stdin);
866 tcsetattr(0, TCSAFLUSH, &save); 912 tcsetattr(0, TCSAFLUSH, &save);
867 913
868 handle_keypress(c); 914 handle_keypress(session, c);
869 goto repeat; 915 goto repeat;
870 916
871 return NULL; 917 return NULL;
@@ -910,8 +956,12 @@ static int symbol_filter(struct map *map, struct symbol *sym)
910 syme = symbol__priv(sym); 956 syme = symbol__priv(sym);
911 syme->map = map; 957 syme->map = map;
912 syme->src = NULL; 958 syme->src = NULL;
913 if (!sym_filter_entry && sym_filter && !strcmp(name, sym_filter)) 959
914 sym_filter_entry = syme; 960 if (!sym_filter_entry && sym_filter && !strcmp(name, sym_filter)) {
961 /* schedule initial sym_filter_entry setup */
962 sym_filter_entry_sched = syme;
963 sym_filter = NULL;
964 }
915 965
916 for (i = 0; skip_symbols[i]; i++) { 966 for (i = 0; skip_symbols[i]; i++) {
917 if (!strcmp(skip_symbols[i], name)) { 967 if (!strcmp(skip_symbols[i], name)) {
@@ -932,25 +982,91 @@ static void event__process_sample(const event_t *self,
932 u64 ip = self->ip.ip; 982 u64 ip = self->ip.ip;
933 struct sym_entry *syme; 983 struct sym_entry *syme;
934 struct addr_location al; 984 struct addr_location al;
985 struct machine *machine;
935 u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK; 986 u8 origin = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
936 987
988 ++samples;
989
937 switch (origin) { 990 switch (origin) {
938 case PERF_RECORD_MISC_USER: 991 case PERF_RECORD_MISC_USER:
992 ++us_samples;
939 if (hide_user_symbols) 993 if (hide_user_symbols)
940 return; 994 return;
995 machine = perf_session__find_host_machine(session);
941 break; 996 break;
942 case PERF_RECORD_MISC_KERNEL: 997 case PERF_RECORD_MISC_KERNEL:
998 ++kernel_samples;
943 if (hide_kernel_symbols) 999 if (hide_kernel_symbols)
944 return; 1000 return;
1001 machine = perf_session__find_host_machine(session);
1002 break;
1003 case PERF_RECORD_MISC_GUEST_KERNEL:
1004 ++guest_kernel_samples;
1005 machine = perf_session__find_machine(session, self->ip.pid);
945 break; 1006 break;
1007 case PERF_RECORD_MISC_GUEST_USER:
1008 ++guest_us_samples;
1009 /*
1010 * TODO: we don't process guest user from host side
1011 * except simple counting.
1012 */
1013 return;
946 default: 1014 default:
947 return; 1015 return;
948 } 1016 }
949 1017
1018 if (!machine && perf_guest) {
1019 pr_err("Can't find guest [%d]'s kernel information\n",
1020 self->ip.pid);
1021 return;
1022 }
1023
1024 if (self->header.misc & PERF_RECORD_MISC_EXACT_IP)
1025 exact_samples++;
1026
950 if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 || 1027 if (event__preprocess_sample(self, session, &al, symbol_filter) < 0 ||
951 al.sym == NULL || al.filtered) 1028 al.filtered)
952 return; 1029 return;
953 1030
1031 if (al.sym == NULL) {
1032 /*
1033 * As we do lazy loading of symtabs we only will know if the
1034 * specified vmlinux file is invalid when we actually have a
1035 * hit in kernel space and then try to load it. So if we get
1036 * here and there are _no_ symbols in the DSO backing the
1037 * kernel map, bail out.
1038 *
1039 * We may never get here, for instance, if we use -K/
1040 * --hide-kernel-symbols, even if the user specifies an
1041 * invalid --vmlinux ;-)
1042 */
1043 if (al.map == machine->vmlinux_maps[MAP__FUNCTION] &&
1044 RB_EMPTY_ROOT(&al.map->dso->symbols[MAP__FUNCTION])) {
1045 pr_err("The %s file can't be used\n",
1046 symbol_conf.vmlinux_name);
1047 exit(1);
1048 }
1049
1050 return;
1051 }
1052
1053 /* let's see, whether we need to install initial sym_filter_entry */
1054 if (sym_filter_entry_sched) {
1055 sym_filter_entry = sym_filter_entry_sched;
1056 sym_filter_entry_sched = NULL;
1057 if (parse_source(sym_filter_entry) < 0) {
1058 struct symbol *sym = sym_entry__symbol(sym_filter_entry);
1059
1060 pr_err("Can't annotate %s", sym->name);
1061 if (sym_filter_entry->map->dso->origin == DSO__ORIG_KERNEL) {
1062 pr_err(": No vmlinux file was found in the path:\n");
1063 machine__fprintf_vmlinux_path(machine, stderr);
1064 } else
1065 pr_err(".\n");
1066 exit(1);
1067 }
1068 }
1069
954 syme = symbol__priv(al.sym); 1070 syme = symbol__priv(al.sym);
955 if (!syme->skip) { 1071 if (!syme->skip) {
956 syme->count[counter]++; 1072 syme->count[counter]++;
@@ -960,9 +1076,6 @@ static void event__process_sample(const event_t *self,
960 if (list_empty(&syme->node) || !syme->node.next) 1076 if (list_empty(&syme->node) || !syme->node.next)
961 __list_insert_active_sym(syme); 1077 __list_insert_active_sym(syme);
962 pthread_mutex_unlock(&active_symbols_lock); 1078 pthread_mutex_unlock(&active_symbols_lock);
963 if (origin == PERF_RECORD_MISC_USER)
964 ++userspace_samples;
965 ++samples;
966 } 1079 }
967} 1080}
968 1081
@@ -975,6 +1088,10 @@ static int event__process(event_t *event, struct perf_session *session)
975 case PERF_RECORD_MMAP: 1088 case PERF_RECORD_MMAP:
976 event__process_mmap(event, session); 1089 event__process_mmap(event, session);
977 break; 1090 break;
1091 case PERF_RECORD_FORK:
1092 case PERF_RECORD_EXIT:
1093 event__process_task(event, session);
1094 break;
978 default: 1095 default:
979 break; 1096 break;
980 } 1097 }
@@ -1063,16 +1180,21 @@ static void perf_session__mmap_read_counter(struct perf_session *self,
1063 md->prev = old; 1180 md->prev = old;
1064} 1181}
1065 1182
1066static struct pollfd event_array[MAX_NR_CPUS * MAX_COUNTERS]; 1183static struct pollfd *event_array;
1067static struct mmap_data mmap_array[MAX_NR_CPUS][MAX_COUNTERS]; 1184static struct mmap_data *mmap_array[MAX_NR_CPUS][MAX_COUNTERS];
1068 1185
1069static void perf_session__mmap_read(struct perf_session *self) 1186static void perf_session__mmap_read(struct perf_session *self)
1070{ 1187{
1071 int i, counter; 1188 int i, counter, thread_index;
1072 1189
1073 for (i = 0; i < nr_cpus; i++) { 1190 for (i = 0; i < nr_cpus; i++) {
1074 for (counter = 0; counter < nr_counters; counter++) 1191 for (counter = 0; counter < nr_counters; counter++)
1075 perf_session__mmap_read_counter(self, &mmap_array[i][counter]); 1192 for (thread_index = 0;
1193 thread_index < thread_num;
1194 thread_index++) {
1195 perf_session__mmap_read_counter(self,
1196 &mmap_array[i][counter][thread_index]);
1197 }
1076 } 1198 }
1077} 1199}
1078 1200
@@ -1083,10 +1205,11 @@ static void start_counter(int i, int counter)
1083{ 1205{
1084 struct perf_event_attr *attr; 1206 struct perf_event_attr *attr;
1085 int cpu; 1207 int cpu;
1208 int thread_index;
1086 1209
1087 cpu = profile_cpu; 1210 cpu = profile_cpu;
1088 if (target_pid == -1 && profile_cpu == -1) 1211 if (target_tid == -1 && profile_cpu == -1)
1089 cpu = i; 1212 cpu = cpumap[i];
1090 1213
1091 attr = attrs + counter; 1214 attr = attrs + counter;
1092 1215
@@ -1101,55 +1224,58 @@ static void start_counter(int i, int counter)
1101 attr->inherit = (cpu < 0) && inherit; 1224 attr->inherit = (cpu < 0) && inherit;
1102 attr->mmap = 1; 1225 attr->mmap = 1;
1103 1226
1227 for (thread_index = 0; thread_index < thread_num; thread_index++) {
1104try_again: 1228try_again:
1105 fd[i][counter] = sys_perf_event_open(attr, target_pid, cpu, group_fd, 0); 1229 fd[i][counter][thread_index] = sys_perf_event_open(attr,
1106 1230 all_tids[thread_index], cpu, group_fd, 0);
1107 if (fd[i][counter] < 0) { 1231
1108 int err = errno; 1232 if (fd[i][counter][thread_index] < 0) {
1233 int err = errno;
1234
1235 if (err == EPERM || err == EACCES)
1236 die("No permission - are you root?\n");
1237 /*
1238 * If it's cycles then fall back to hrtimer
1239 * based cpu-clock-tick sw counter, which
1240 * is always available even if no PMU support:
1241 */
1242 if (attr->type == PERF_TYPE_HARDWARE
1243 && attr->config == PERF_COUNT_HW_CPU_CYCLES) {
1244
1245 if (verbose)
1246 warning(" ... trying to fall back to cpu-clock-ticks\n");
1247
1248 attr->type = PERF_TYPE_SOFTWARE;
1249 attr->config = PERF_COUNT_SW_CPU_CLOCK;
1250 goto try_again;
1251 }
1252 printf("\n");
1253 error("perfcounter syscall returned with %d (%s)\n",
1254 fd[i][counter][thread_index], strerror(err));
1255 die("No CONFIG_PERF_EVENTS=y kernel support configured?\n");
1256 exit(-1);
1257 }
1258 assert(fd[i][counter][thread_index] >= 0);
1259 fcntl(fd[i][counter][thread_index], F_SETFL, O_NONBLOCK);
1109 1260
1110 if (err == EPERM || err == EACCES)
1111 die("No permission - are you root?\n");
1112 /* 1261 /*
1113 * If it's cycles then fall back to hrtimer 1262 * First counter acts as the group leader:
1114 * based cpu-clock-tick sw counter, which
1115 * is always available even if no PMU support:
1116 */ 1263 */
1117 if (attr->type == PERF_TYPE_HARDWARE 1264 if (group && group_fd == -1)
1118 && attr->config == PERF_COUNT_HW_CPU_CYCLES) { 1265 group_fd = fd[i][counter][thread_index];
1119 1266
1120 if (verbose) 1267 event_array[nr_poll].fd = fd[i][counter][thread_index];
1121 warning(" ... trying to fall back to cpu-clock-ticks\n"); 1268 event_array[nr_poll].events = POLLIN;
1122 1269 nr_poll++;
1123 attr->type = PERF_TYPE_SOFTWARE; 1270
1124 attr->config = PERF_COUNT_SW_CPU_CLOCK; 1271 mmap_array[i][counter][thread_index].counter = counter;
1125 goto try_again; 1272 mmap_array[i][counter][thread_index].prev = 0;
1126 } 1273 mmap_array[i][counter][thread_index].mask = mmap_pages*page_size - 1;
1127 printf("\n"); 1274 mmap_array[i][counter][thread_index].base = mmap(NULL, (mmap_pages+1)*page_size,
1128 error("perfcounter syscall returned with %d (%s)\n", 1275 PROT_READ, MAP_SHARED, fd[i][counter][thread_index], 0);
1129 fd[i][counter], strerror(err)); 1276 if (mmap_array[i][counter][thread_index].base == MAP_FAILED)
1130 die("No CONFIG_PERF_EVENTS=y kernel support configured?\n"); 1277 die("failed to mmap with %d (%s)\n", errno, strerror(errno));
1131 exit(-1);
1132 } 1278 }
1133 assert(fd[i][counter] >= 0);
1134 fcntl(fd[i][counter], F_SETFL, O_NONBLOCK);
1135
1136 /*
1137 * First counter acts as the group leader:
1138 */
1139 if (group && group_fd == -1)
1140 group_fd = fd[i][counter];
1141
1142 event_array[nr_poll].fd = fd[i][counter];
1143 event_array[nr_poll].events = POLLIN;
1144 nr_poll++;
1145
1146 mmap_array[i][counter].counter = counter;
1147 mmap_array[i][counter].prev = 0;
1148 mmap_array[i][counter].mask = mmap_pages*page_size - 1;
1149 mmap_array[i][counter].base = mmap(NULL, (mmap_pages+1)*page_size,
1150 PROT_READ, MAP_SHARED, fd[i][counter], 0);
1151 if (mmap_array[i][counter].base == MAP_FAILED)
1152 die("failed to mmap with %d (%s)\n", errno, strerror(errno));
1153} 1279}
1154 1280
1155static int __cmd_top(void) 1281static int __cmd_top(void)
@@ -1161,12 +1287,12 @@ static int __cmd_top(void)
1161 * FIXME: perf_session__new should allow passing a O_MMAP, so that all this 1287 * FIXME: perf_session__new should allow passing a O_MMAP, so that all this
1162 * mmap reading, etc is encapsulated in it. Use O_WRONLY for now. 1288 * mmap reading, etc is encapsulated in it. Use O_WRONLY for now.
1163 */ 1289 */
1164 struct perf_session *session = perf_session__new(NULL, O_WRONLY, false); 1290 struct perf_session *session = perf_session__new(NULL, O_WRONLY, false, false);
1165 if (session == NULL) 1291 if (session == NULL)
1166 return -ENOMEM; 1292 return -ENOMEM;
1167 1293
1168 if (target_pid != -1) 1294 if (target_tid != -1)
1169 event__synthesize_thread(target_pid, event__process, session); 1295 event__synthesize_thread(target_tid, event__process, session);
1170 else 1296 else
1171 event__synthesize_threads(event__process, session); 1297 event__synthesize_threads(event__process, session);
1172 1298
@@ -1177,11 +1303,11 @@ static int __cmd_top(void)
1177 } 1303 }
1178 1304
1179 /* Wait for a minimal set of events before starting the snapshot */ 1305 /* Wait for a minimal set of events before starting the snapshot */
1180 poll(event_array, nr_poll, 100); 1306 poll(&event_array[0], nr_poll, 100);
1181 1307
1182 perf_session__mmap_read(session); 1308 perf_session__mmap_read(session);
1183 1309
1184 if (pthread_create(&thread, NULL, display_thread, NULL)) { 1310 if (pthread_create(&thread, NULL, display_thread, session)) {
1185 printf("Could not create display thread.\n"); 1311 printf("Could not create display thread.\n");
1186 exit(-1); 1312 exit(-1);
1187 } 1313 }
@@ -1220,7 +1346,9 @@ static const struct option options[] = {
1220 OPT_INTEGER('c', "count", &default_interval, 1346 OPT_INTEGER('c', "count", &default_interval,
1221 "event period to sample"), 1347 "event period to sample"),
1222 OPT_INTEGER('p', "pid", &target_pid, 1348 OPT_INTEGER('p', "pid", &target_pid,
1223 "profile events on existing pid"), 1349 "profile events on existing process id"),
1350 OPT_INTEGER('t', "tid", &target_tid,
1351 "profile events on existing thread id"),
1224 OPT_BOOLEAN('a', "all-cpus", &system_wide, 1352 OPT_BOOLEAN('a', "all-cpus", &system_wide,
1225 "system-wide collection from all CPUs"), 1353 "system-wide collection from all CPUs"),
1226 OPT_INTEGER('C', "CPU", &profile_cpu, 1354 OPT_INTEGER('C', "CPU", &profile_cpu,
@@ -1229,8 +1357,7 @@ static const struct option options[] = {
1229 "file", "vmlinux pathname"), 1357 "file", "vmlinux pathname"),
1230 OPT_BOOLEAN('K', "hide_kernel_symbols", &hide_kernel_symbols, 1358 OPT_BOOLEAN('K', "hide_kernel_symbols", &hide_kernel_symbols,
1231 "hide kernel symbols"), 1359 "hide kernel symbols"),
1232 OPT_INTEGER('m', "mmap-pages", &mmap_pages, 1360 OPT_UINTEGER('m', "mmap-pages", &mmap_pages, "number of mmap data pages"),
1233 "number of mmap data pages"),
1234 OPT_INTEGER('r', "realtime", &realtime_prio, 1361 OPT_INTEGER('r', "realtime", &realtime_prio,
1235 "collect data with this RT SCHED_FIFO priority"), 1362 "collect data with this RT SCHED_FIFO priority"),
1236 OPT_INTEGER('d', "delay", &delay_secs, 1363 OPT_INTEGER('d', "delay", &delay_secs,
@@ -1244,7 +1371,7 @@ static const struct option options[] = {
1244 OPT_BOOLEAN('i', "inherit", &inherit, 1371 OPT_BOOLEAN('i', "inherit", &inherit,
1245 "child tasks inherit counters"), 1372 "child tasks inherit counters"),
1246 OPT_STRING('s', "sym-annotate", &sym_filter, "symbol name", 1373 OPT_STRING('s', "sym-annotate", &sym_filter, "symbol name",
1247 "symbol to annotate - requires -k option"), 1374 "symbol to annotate"),
1248 OPT_BOOLEAN('z', "zero", &zero, 1375 OPT_BOOLEAN('z', "zero", &zero,
1249 "zero history across updates"), 1376 "zero history across updates"),
1250 OPT_INTEGER('F', "freq", &freq, 1377 OPT_INTEGER('F', "freq", &freq,
@@ -1253,7 +1380,7 @@ static const struct option options[] = {
1253 "display this many functions"), 1380 "display this many functions"),
1254 OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols, 1381 OPT_BOOLEAN('U', "hide_user_symbols", &hide_user_symbols,
1255 "hide user symbols"), 1382 "hide user symbols"),
1256 OPT_BOOLEAN('v', "verbose", &verbose, 1383 OPT_INCR('v', "verbose", &verbose,
1257 "be more verbose (show counter open errors, etc)"), 1384 "be more verbose (show counter open errors, etc)"),
1258 OPT_END() 1385 OPT_END()
1259}; 1386};
@@ -1261,6 +1388,7 @@ static const struct option options[] = {
1261int cmd_top(int argc, const char **argv, const char *prefix __used) 1388int cmd_top(int argc, const char **argv, const char *prefix __used)
1262{ 1389{
1263 int counter; 1390 int counter;
1391 int i,j;
1264 1392
1265 page_size = sysconf(_SC_PAGE_SIZE); 1393 page_size = sysconf(_SC_PAGE_SIZE);
1266 1394
@@ -1268,8 +1396,39 @@ int cmd_top(int argc, const char **argv, const char *prefix __used)
1268 if (argc) 1396 if (argc)
1269 usage_with_options(top_usage, options); 1397 usage_with_options(top_usage, options);
1270 1398
1399 if (target_pid != -1) {
1400 target_tid = target_pid;
1401 thread_num = find_all_tid(target_pid, &all_tids);
1402 if (thread_num <= 0) {
1403 fprintf(stderr, "Can't find all threads of pid %d\n",
1404 target_pid);
1405 usage_with_options(top_usage, options);
1406 }
1407 } else {
1408 all_tids=malloc(sizeof(pid_t));
1409 if (!all_tids)
1410 return -ENOMEM;
1411
1412 all_tids[0] = target_tid;
1413 thread_num = 1;
1414 }
1415
1416 for (i = 0; i < MAX_NR_CPUS; i++) {
1417 for (j = 0; j < MAX_COUNTERS; j++) {
1418 fd[i][j] = malloc(sizeof(int)*thread_num);
1419 mmap_array[i][j] = zalloc(
1420 sizeof(struct mmap_data)*thread_num);
1421 if (!fd[i][j] || !mmap_array[i][j])
1422 return -ENOMEM;
1423 }
1424 }
1425 event_array = malloc(
1426 sizeof(struct pollfd)*MAX_NR_CPUS*MAX_COUNTERS*thread_num);
1427 if (!event_array)
1428 return -ENOMEM;
1429
1271 /* CPU and PID are mutually exclusive */ 1430 /* CPU and PID are mutually exclusive */
1272 if (target_pid != -1 && profile_cpu != -1) { 1431 if (target_tid > 0 && profile_cpu != -1) {
1273 printf("WARNING: PID switch overriding CPU\n"); 1432 printf("WARNING: PID switch overriding CPU\n");
1274 sleep(1); 1433 sleep(1);
1275 profile_cpu = -1; 1434 profile_cpu = -1;
@@ -1280,16 +1439,14 @@ int cmd_top(int argc, const char **argv, const char *prefix __used)
1280 1439
1281 symbol_conf.priv_size = (sizeof(struct sym_entry) + 1440 symbol_conf.priv_size = (sizeof(struct sym_entry) +
1282 (nr_counters + 1) * sizeof(unsigned long)); 1441 (nr_counters + 1) * sizeof(unsigned long));
1283 if (symbol_conf.vmlinux_name == NULL) 1442
1284 symbol_conf.try_vmlinux_path = true; 1443 symbol_conf.try_vmlinux_path = (symbol_conf.vmlinux_name == NULL);
1285 if (symbol__init() < 0) 1444 if (symbol__init() < 0)
1286 return -1; 1445 return -1;
1287 1446
1288 if (delay_secs < 1) 1447 if (delay_secs < 1)
1289 delay_secs = 1; 1448 delay_secs = 1;
1290 1449
1291 parse_source(sym_filter_entry);
1292
1293 /* 1450 /*
1294 * User specified count overrides default frequency. 1451 * User specified count overrides default frequency.
1295 */ 1452 */
@@ -1312,12 +1469,10 @@ int cmd_top(int argc, const char **argv, const char *prefix __used)
1312 attrs[counter].sample_period = default_interval; 1469 attrs[counter].sample_period = default_interval;
1313 } 1470 }
1314 1471
1315 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN); 1472 if (target_tid != -1 || profile_cpu != -1)
1316 assert(nr_cpus <= MAX_NR_CPUS);
1317 assert(nr_cpus >= 0);
1318
1319 if (target_pid != -1 || profile_cpu != -1)
1320 nr_cpus = 1; 1473 nr_cpus = 1;
1474 else
1475 nr_cpus = read_cpu_map();
1321 1476
1322 get_term_dimensions(&winsize); 1477 get_term_dimensions(&winsize);
1323 if (print_entries == 0) { 1478 if (print_entries == 0) {
diff --git a/tools/perf/builtin-trace.c b/tools/perf/builtin-trace.c
index 574a215e800b..dddf3f01b5ab 100644
--- a/tools/perf/builtin-trace.c
+++ b/tools/perf/builtin-trace.c
@@ -11,6 +11,8 @@
11 11
12static char const *script_name; 12static char const *script_name;
13static char const *generate_script_lang; 13static char const *generate_script_lang;
14static bool debug_ordering;
15static u64 last_timestamp;
14 16
15static int default_start_script(const char *script __unused, 17static int default_start_script(const char *script __unused,
16 int argc __unused, 18 int argc __unused,
@@ -44,12 +46,15 @@ static void setup_scripting(void)
44 perf_set_argv_exec_path(perf_exec_path()); 46 perf_set_argv_exec_path(perf_exec_path());
45 47
46 setup_perl_scripting(); 48 setup_perl_scripting();
49 setup_python_scripting();
47 50
48 scripting_ops = &default_scripting_ops; 51 scripting_ops = &default_scripting_ops;
49} 52}
50 53
51static int cleanup_scripting(void) 54static int cleanup_scripting(void)
52{ 55{
56 pr_debug("\nperf trace script stopped\n");
57
53 return scripting_ops->stop_script(); 58 return scripting_ops->stop_script();
54} 59}
55 60
@@ -75,11 +80,8 @@ static int process_sample_event(event_t *event, struct perf_session *session)
75 80
76 event__parse_sample(event, session->sample_type, &data); 81 event__parse_sample(event, session->sample_type, &data);
77 82
78 dump_printf("(IP, %d): %d/%d: %p period: %Ld\n", 83 dump_printf("(IP, %d): %d/%d: %#Lx period: %Ld\n", event->header.misc,
79 event->header.misc, 84 data.pid, data.tid, data.ip, data.period);
80 data.pid, data.tid,
81 (void *)(long)data.ip,
82 (long long)data.period);
83 85
84 thread = perf_session__findnew(session, event->ip.pid); 86 thread = perf_session__findnew(session, event->ip.pid);
85 if (thread == NULL) { 87 if (thread == NULL) {
@@ -89,6 +91,14 @@ static int process_sample_event(event_t *event, struct perf_session *session)
89 } 91 }
90 92
91 if (session->sample_type & PERF_SAMPLE_RAW) { 93 if (session->sample_type & PERF_SAMPLE_RAW) {
94 if (debug_ordering) {
95 if (data.time < last_timestamp) {
96 pr_err("Samples misordered, previous: %llu "
97 "this: %llu\n", last_timestamp,
98 data.time);
99 }
100 last_timestamp = data.time;
101 }
92 /* 102 /*
93 * FIXME: better resolve from pid from the struct trace_entry 103 * FIXME: better resolve from pid from the struct trace_entry
94 * field, although it should be the same than this perf 104 * field, although it should be the same than this perf
@@ -99,30 +109,31 @@ static int process_sample_event(event_t *event, struct perf_session *session)
99 data.time, thread->comm); 109 data.time, thread->comm);
100 } 110 }
101 111
102 session->events_stats.total += data.period; 112 session->hists.stats.total_period += data.period;
103 return 0;
104}
105
106static int sample_type_check(struct perf_session *session)
107{
108 if (!(session->sample_type & PERF_SAMPLE_RAW)) {
109 fprintf(stderr,
110 "No trace sample to read. Did you call perf record "
111 "without -R?");
112 return -1;
113 }
114
115 return 0; 113 return 0;
116} 114}
117 115
118static struct perf_event_ops event_ops = { 116static struct perf_event_ops event_ops = {
119 .process_sample_event = process_sample_event, 117 .sample = process_sample_event,
120 .process_comm_event = event__process_comm, 118 .comm = event__process_comm,
121 .sample_type_check = sample_type_check, 119 .attr = event__process_attr,
120 .event_type = event__process_event_type,
121 .tracing_data = event__process_tracing_data,
122 .build_id = event__process_build_id,
123 .ordered_samples = true,
122}; 124};
123 125
126extern volatile int session_done;
127
128static void sig_handler(int sig __unused)
129{
130 session_done = 1;
131}
132
124static int __cmd_trace(struct perf_session *session) 133static int __cmd_trace(struct perf_session *session)
125{ 134{
135 signal(SIGINT, sig_handler);
136
126 return perf_session__process_events(session, &event_ops); 137 return perf_session__process_events(session, &event_ops);
127} 138}
128 139
@@ -235,9 +246,9 @@ static int parse_scriptname(const struct option *opt __used,
235 const char *script, *ext; 246 const char *script, *ext;
236 int len; 247 int len;
237 248
238 if (strcmp(str, "list") == 0) { 249 if (strcmp(str, "lang") == 0) {
239 list_available_languages(); 250 list_available_languages();
240 return 0; 251 exit(0);
241 } 252 }
242 253
243 script = strchr(str, ':'); 254 script = strchr(str, ':');
@@ -520,7 +531,7 @@ static const char * const trace_usage[] = {
520static const struct option options[] = { 531static const struct option options[] = {
521 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, 532 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
522 "dump raw trace in ASCII"), 533 "dump raw trace in ASCII"),
523 OPT_BOOLEAN('v', "verbose", &verbose, 534 OPT_INCR('v', "verbose", &verbose,
524 "be more verbose (show symbol address, etc)"), 535 "be more verbose (show symbol address, etc)"),
525 OPT_BOOLEAN('L', "Latency", &latency_format, 536 OPT_BOOLEAN('L', "Latency", &latency_format,
526 "show latency attributes (irqs/preemption disabled, etc)"), 537 "show latency attributes (irqs/preemption disabled, etc)"),
@@ -531,6 +542,10 @@ static const struct option options[] = {
531 parse_scriptname), 542 parse_scriptname),
532 OPT_STRING('g', "gen-script", &generate_script_lang, "lang", 543 OPT_STRING('g', "gen-script", &generate_script_lang, "lang",
533 "generate perf-trace.xx script in specified language"), 544 "generate perf-trace.xx script in specified language"),
545 OPT_STRING('i', "input", &input_name, "file",
546 "input file name"),
547 OPT_BOOLEAN('d', "debug-ordering", &debug_ordering,
548 "check that samples time ordering is monotonic"),
534 549
535 OPT_END() 550 OPT_END()
536}; 551};
@@ -561,6 +576,65 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used)
561 suffix = REPORT_SUFFIX; 576 suffix = REPORT_SUFFIX;
562 } 577 }
563 578
579 if (!suffix && argc >= 2 && strncmp(argv[1], "-", strlen("-")) != 0) {
580 char *record_script_path, *report_script_path;
581 int live_pipe[2];
582 pid_t pid;
583
584 record_script_path = get_script_path(argv[1], RECORD_SUFFIX);
585 if (!record_script_path) {
586 fprintf(stderr, "record script not found\n");
587 return -1;
588 }
589
590 report_script_path = get_script_path(argv[1], REPORT_SUFFIX);
591 if (!report_script_path) {
592 fprintf(stderr, "report script not found\n");
593 return -1;
594 }
595
596 if (pipe(live_pipe) < 0) {
597 perror("failed to create pipe");
598 exit(-1);
599 }
600
601 pid = fork();
602 if (pid < 0) {
603 perror("failed to fork");
604 exit(-1);
605 }
606
607 if (!pid) {
608 dup2(live_pipe[1], 1);
609 close(live_pipe[0]);
610
611 __argv = malloc(5 * sizeof(const char *));
612 __argv[0] = "/bin/sh";
613 __argv[1] = record_script_path;
614 __argv[2] = "-o";
615 __argv[3] = "-";
616 __argv[4] = NULL;
617
618 execvp("/bin/sh", (char **)__argv);
619 exit(-1);
620 }
621
622 dup2(live_pipe[0], 0);
623 close(live_pipe[1]);
624
625 __argv = malloc((argc + 3) * sizeof(const char *));
626 __argv[0] = "/bin/sh";
627 __argv[1] = report_script_path;
628 for (i = 2; i < argc; i++)
629 __argv[i] = argv[i];
630 __argv[i++] = "-i";
631 __argv[i++] = "-";
632 __argv[i++] = NULL;
633
634 execvp("/bin/sh", (char **)__argv);
635 exit(-1);
636 }
637
564 if (suffix) { 638 if (suffix) {
565 script_path = get_script_path(argv[2], suffix); 639 script_path = get_script_path(argv[2], suffix);
566 if (!script_path) { 640 if (!script_path) {
@@ -586,12 +660,17 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used)
586 660
587 if (symbol__init() < 0) 661 if (symbol__init() < 0)
588 return -1; 662 return -1;
589 setup_pager(); 663 if (!script_name)
664 setup_pager();
590 665
591 session = perf_session__new(input_name, O_RDONLY, 0); 666 session = perf_session__new(input_name, O_RDONLY, 0, false);
592 if (session == NULL) 667 if (session == NULL)
593 return -ENOMEM; 668 return -ENOMEM;
594 669
670 if (strcmp(input_name, "-") &&
671 !perf_session__has_traces(session, "record -R"))
672 return -EINVAL;
673
595 if (generate_script_lang) { 674 if (generate_script_lang) {
596 struct stat perf_stat; 675 struct stat perf_stat;
597 676
@@ -618,7 +697,6 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used)
618 return -1; 697 return -1;
619 } 698 }
620 699
621 perf_header__read(&session->header, input);
622 err = scripting_ops->generate_script("perf-trace"); 700 err = scripting_ops->generate_script("perf-trace");
623 goto out; 701 goto out;
624 } 702 }
@@ -627,6 +705,7 @@ int cmd_trace(int argc, const char **argv, const char *prefix __used)
627 err = scripting_ops->start_script(script_name, argc, argv); 705 err = scripting_ops->start_script(script_name, argc, argv);
628 if (err) 706 if (err)
629 goto out; 707 goto out;
708 pr_debug("perf trace started with script %s\n\n", script_name);
630 } 709 }
631 710
632 err = __cmd_trace(session); 711 err = __cmd_trace(session);
diff --git a/tools/perf/builtin.h b/tools/perf/builtin.h
index 18035b1f16c7..921245b28583 100644
--- a/tools/perf/builtin.h
+++ b/tools/perf/builtin.h
@@ -16,6 +16,7 @@ extern int check_pager_config(const char *cmd);
16 16
17extern int cmd_annotate(int argc, const char **argv, const char *prefix); 17extern int cmd_annotate(int argc, const char **argv, const char *prefix);
18extern int cmd_bench(int argc, const char **argv, const char *prefix); 18extern int cmd_bench(int argc, const char **argv, const char *prefix);
19extern int cmd_buildid_cache(int argc, const char **argv, const char *prefix);
19extern int cmd_buildid_list(int argc, const char **argv, const char *prefix); 20extern int cmd_buildid_list(int argc, const char **argv, const char *prefix);
20extern int cmd_diff(int argc, const char **argv, const char *prefix); 21extern int cmd_diff(int argc, const char **argv, const char *prefix);
21extern int cmd_help(int argc, const char **argv, const char *prefix); 22extern int cmd_help(int argc, const char **argv, const char *prefix);
@@ -30,5 +31,9 @@ extern int cmd_trace(int argc, const char **argv, const char *prefix);
30extern int cmd_version(int argc, const char **argv, const char *prefix); 31extern int cmd_version(int argc, const char **argv, const char *prefix);
31extern int cmd_probe(int argc, const char **argv, const char *prefix); 32extern int cmd_probe(int argc, const char **argv, const char *prefix);
32extern int cmd_kmem(int argc, const char **argv, const char *prefix); 33extern int cmd_kmem(int argc, const char **argv, const char *prefix);
34extern int cmd_lock(int argc, const char **argv, const char *prefix);
35extern int cmd_kvm(int argc, const char **argv, const char *prefix);
36extern int cmd_test(int argc, const char **argv, const char *prefix);
37extern int cmd_inject(int argc, const char **argv, const char *prefix);
33 38
34#endif 39#endif
diff --git a/tools/perf/command-list.txt b/tools/perf/command-list.txt
index 71dc7c3fe7b2..949d77fc0b97 100644
--- a/tools/perf/command-list.txt
+++ b/tools/perf/command-list.txt
@@ -3,9 +3,12 @@
3# command name category [deprecated] [common] 3# command name category [deprecated] [common]
4# 4#
5perf-annotate mainporcelain common 5perf-annotate mainporcelain common
6perf-archive mainporcelain common
6perf-bench mainporcelain common 7perf-bench mainporcelain common
8perf-buildid-cache mainporcelain common
7perf-buildid-list mainporcelain common 9perf-buildid-list mainporcelain common
8perf-diff mainporcelain common 10perf-diff mainporcelain common
11perf-inject mainporcelain common
9perf-list mainporcelain common 12perf-list mainporcelain common
10perf-sched mainporcelain common 13perf-sched mainporcelain common
11perf-record mainporcelain common 14perf-record mainporcelain common
@@ -16,3 +19,6 @@ perf-top mainporcelain common
16perf-trace mainporcelain common 19perf-trace mainporcelain common
17perf-probe mainporcelain common 20perf-probe mainporcelain common
18perf-kmem mainporcelain common 21perf-kmem mainporcelain common
22perf-lock mainporcelain common
23perf-kvm mainporcelain common
24perf-test mainporcelain common
diff --git a/tools/perf/design.txt b/tools/perf/design.txt
index 8d0de5130db3..bd0bb1b1279b 100644
--- a/tools/perf/design.txt
+++ b/tools/perf/design.txt
@@ -101,10 +101,10 @@ enum hw_event_ids {
101 */ 101 */
102 PERF_COUNT_HW_CPU_CYCLES = 0, 102 PERF_COUNT_HW_CPU_CYCLES = 0,
103 PERF_COUNT_HW_INSTRUCTIONS = 1, 103 PERF_COUNT_HW_INSTRUCTIONS = 1,
104 PERF_COUNT_HW_CACHE_REFERENCES = 2, 104 PERF_COUNT_HW_CACHE_REFERENCES = 2,
105 PERF_COUNT_HW_CACHE_MISSES = 3, 105 PERF_COUNT_HW_CACHE_MISSES = 3,
106 PERF_COUNT_HW_BRANCH_INSTRUCTIONS = 4, 106 PERF_COUNT_HW_BRANCH_INSTRUCTIONS = 4,
107 PERF_COUNT_HW_BRANCH_MISSES = 5, 107 PERF_COUNT_HW_BRANCH_MISSES = 5,
108 PERF_COUNT_HW_BUS_CYCLES = 6, 108 PERF_COUNT_HW_BUS_CYCLES = 6,
109}; 109};
110 110
@@ -131,8 +131,8 @@ software events, selected by 'event_id':
131 */ 131 */
132enum sw_event_ids { 132enum sw_event_ids {
133 PERF_COUNT_SW_CPU_CLOCK = 0, 133 PERF_COUNT_SW_CPU_CLOCK = 0,
134 PERF_COUNT_SW_TASK_CLOCK = 1, 134 PERF_COUNT_SW_TASK_CLOCK = 1,
135 PERF_COUNT_SW_PAGE_FAULTS = 2, 135 PERF_COUNT_SW_PAGE_FAULTS = 2,
136 PERF_COUNT_SW_CONTEXT_SWITCHES = 3, 136 PERF_COUNT_SW_CONTEXT_SWITCHES = 3,
137 PERF_COUNT_SW_CPU_MIGRATIONS = 4, 137 PERF_COUNT_SW_CPU_MIGRATIONS = 4,
138 PERF_COUNT_SW_PAGE_FAULTS_MIN = 5, 138 PERF_COUNT_SW_PAGE_FAULTS_MIN = 5,
diff --git a/tools/perf/perf-archive.sh b/tools/perf/perf-archive.sh
new file mode 100644
index 000000000000..2e7a4f417e20
--- /dev/null
+++ b/tools/perf/perf-archive.sh
@@ -0,0 +1,36 @@
1#!/bin/bash
2# perf archive
3# Arnaldo Carvalho de Melo <acme@redhat.com>
4
5PERF_DATA=perf.data
6if [ $# -ne 0 ] ; then
7 PERF_DATA=$1
8fi
9
10DEBUGDIR=~/.debug/
11BUILDIDS=$(mktemp /tmp/perf-archive-buildids.XXXXXX)
12NOBUILDID=0000000000000000000000000000000000000000
13
14perf buildid-list -i $PERF_DATA --with-hits | grep -v "^$NOBUILDID " > $BUILDIDS
15if [ ! -s $BUILDIDS ] ; then
16 echo "perf archive: no build-ids found"
17 rm -f $BUILDIDS
18 exit 1
19fi
20
21MANIFEST=$(mktemp /tmp/perf-archive-manifest.XXXXXX)
22
23cut -d ' ' -f 1 $BUILDIDS | \
24while read build_id ; do
25 linkname=$DEBUGDIR.build-id/${build_id:0:2}/${build_id:2}
26 filename=$(readlink -f $linkname)
27 echo ${linkname#$DEBUGDIR} >> $MANIFEST
28 echo ${filename#$DEBUGDIR} >> $MANIFEST
29done
30
31tar cfj $PERF_DATA.tar.bz2 -C $DEBUGDIR -T $MANIFEST
32rm -f $MANIFEST $BUILDIDS
33echo -e "Now please run:\n"
34echo -e "$ tar xvf $PERF_DATA.tar.bz2 -C ~/.debug\n"
35echo "wherever you need to run 'perf report' on."
36exit 0
diff --git a/tools/perf/perf.c b/tools/perf/perf.c
index 873e55fab375..6e4871191138 100644
--- a/tools/perf/perf.c
+++ b/tools/perf/perf.c
@@ -13,7 +13,6 @@
13#include "util/quote.h" 13#include "util/quote.h"
14#include "util/run-command.h" 14#include "util/run-command.h"
15#include "util/parse-events.h" 15#include "util/parse-events.h"
16#include "util/string.h"
17#include "util/debugfs.h" 16#include "util/debugfs.h"
18 17
19const char perf_usage_string[] = 18const char perf_usage_string[] =
@@ -22,7 +21,9 @@ const char perf_usage_string[] =
22const char perf_more_info_string[] = 21const char perf_more_info_string[] =
23 "See 'perf help COMMAND' for more information on a specific command."; 22 "See 'perf help COMMAND' for more information on a specific command.";
24 23
24int use_browser = -1;
25static int use_pager = -1; 25static int use_pager = -1;
26
26struct pager_config { 27struct pager_config {
27 const char *cmd; 28 const char *cmd;
28 int val; 29 int val;
@@ -48,7 +49,26 @@ int check_pager_config(const char *cmd)
48 return c.val; 49 return c.val;
49} 50}
50 51
51static void commit_pager_choice(void) { 52static int tui_command_config(const char *var, const char *value, void *data)
53{
54 struct pager_config *c = data;
55 if (!prefixcmp(var, "tui.") && !strcmp(var + 4, c->cmd))
56 c->val = perf_config_bool(var, value);
57 return 0;
58}
59
60/* returns 0 for "no tui", 1 for "use tui", and -1 for "not specified" */
61static int check_tui_config(const char *cmd)
62{
63 struct pager_config c;
64 c.cmd = cmd;
65 c.val = -1;
66 perf_config(tui_command_config, &c);
67 return c.val;
68}
69
70static void commit_pager_choice(void)
71{
52 switch (use_pager) { 72 switch (use_pager) {
53 case 0: 73 case 0:
54 setenv("PERF_PAGER", "cat", 1); 74 setenv("PERF_PAGER", "cat", 1);
@@ -70,7 +90,7 @@ static void set_debugfs_path(void)
70 "tracing/events"); 90 "tracing/events");
71} 91}
72 92
73static int handle_options(const char*** argv, int* argc, int* envchanged) 93static int handle_options(const char ***argv, int *argc, int *envchanged)
74{ 94{
75 int handled = 0; 95 int handled = 0;
76 96
@@ -109,7 +129,7 @@ static int handle_options(const char*** argv, int* argc, int* envchanged)
109 *envchanged = 1; 129 *envchanged = 1;
110 } else if (!strcmp(cmd, "--perf-dir")) { 130 } else if (!strcmp(cmd, "--perf-dir")) {
111 if (*argc < 2) { 131 if (*argc < 2) {
112 fprintf(stderr, "No directory given for --perf-dir.\n" ); 132 fprintf(stderr, "No directory given for --perf-dir.\n");
113 usage(perf_usage_string); 133 usage(perf_usage_string);
114 } 134 }
115 setenv(PERF_DIR_ENVIRONMENT, (*argv)[1], 1); 135 setenv(PERF_DIR_ENVIRONMENT, (*argv)[1], 1);
@@ -124,7 +144,7 @@ static int handle_options(const char*** argv, int* argc, int* envchanged)
124 *envchanged = 1; 144 *envchanged = 1;
125 } else if (!strcmp(cmd, "--work-tree")) { 145 } else if (!strcmp(cmd, "--work-tree")) {
126 if (*argc < 2) { 146 if (*argc < 2) {
127 fprintf(stderr, "No directory given for --work-tree.\n" ); 147 fprintf(stderr, "No directory given for --work-tree.\n");
128 usage(perf_usage_string); 148 usage(perf_usage_string);
129 } 149 }
130 setenv(PERF_WORK_TREE_ENVIRONMENT, (*argv)[1], 1); 150 setenv(PERF_WORK_TREE_ENVIRONMENT, (*argv)[1], 1);
@@ -168,7 +188,7 @@ static int handle_alias(int *argcp, const char ***argv)
168{ 188{
169 int envchanged = 0, ret = 0, saved_errno = errno; 189 int envchanged = 0, ret = 0, saved_errno = errno;
170 int count, option_count; 190 int count, option_count;
171 const char** new_argv; 191 const char **new_argv;
172 const char *alias_command; 192 const char *alias_command;
173 char *alias_string; 193 char *alias_string;
174 194
@@ -210,11 +230,11 @@ static int handle_alias(int *argcp, const char ***argv)
210 if (!strcmp(alias_command, new_argv[0])) 230 if (!strcmp(alias_command, new_argv[0]))
211 die("recursive alias: %s", alias_command); 231 die("recursive alias: %s", alias_command);
212 232
213 new_argv = realloc(new_argv, sizeof(char*) * 233 new_argv = realloc(new_argv, sizeof(char *) *
214 (count + *argcp + 1)); 234 (count + *argcp + 1));
215 /* insert after command name */ 235 /* insert after command name */
216 memcpy(new_argv + count, *argv + 1, sizeof(char*) * *argcp); 236 memcpy(new_argv + count, *argv + 1, sizeof(char *) * *argcp);
217 new_argv[count+*argcp] = NULL; 237 new_argv[count + *argcp] = NULL;
218 238
219 *argv = new_argv; 239 *argv = new_argv;
220 *argcp += count - 1; 240 *argcp += count - 1;
@@ -253,6 +273,9 @@ static int run_builtin(struct cmd_struct *p, int argc, const char **argv)
253 if (p->option & RUN_SETUP) 273 if (p->option & RUN_SETUP)
254 prefix = NULL; /* setup_perf_directory(); */ 274 prefix = NULL; /* setup_perf_directory(); */
255 275
276 if (use_browser == -1)
277 use_browser = check_tui_config(p->cmd);
278
256 if (use_pager == -1 && p->option & RUN_SETUP) 279 if (use_pager == -1 && p->option & RUN_SETUP)
257 use_pager = check_pager_config(p->cmd); 280 use_pager = check_pager_config(p->cmd);
258 if (use_pager == -1 && p->option & USE_PAGER) 281 if (use_pager == -1 && p->option & USE_PAGER)
@@ -261,6 +284,8 @@ static int run_builtin(struct cmd_struct *p, int argc, const char **argv)
261 set_debugfs_path(); 284 set_debugfs_path();
262 285
263 status = p->fn(argc, argv, prefix); 286 status = p->fn(argc, argv, prefix);
287 exit_browser(status);
288
264 if (status) 289 if (status)
265 return status & 0xff; 290 return status & 0xff;
266 291
@@ -285,6 +310,7 @@ static void handle_internal_command(int argc, const char **argv)
285{ 310{
286 const char *cmd = argv[0]; 311 const char *cmd = argv[0];
287 static struct cmd_struct commands[] = { 312 static struct cmd_struct commands[] = {
313 { "buildid-cache", cmd_buildid_cache, 0 },
288 { "buildid-list", cmd_buildid_list, 0 }, 314 { "buildid-list", cmd_buildid_list, 0 },
289 { "diff", cmd_diff, 0 }, 315 { "diff", cmd_diff, 0 },
290 { "help", cmd_help, 0 }, 316 { "help", cmd_help, 0 },
@@ -301,6 +327,10 @@ static void handle_internal_command(int argc, const char **argv)
301 { "sched", cmd_sched, 0 }, 327 { "sched", cmd_sched, 0 },
302 { "probe", cmd_probe, 0 }, 328 { "probe", cmd_probe, 0 },
303 { "kmem", cmd_kmem, 0 }, 329 { "kmem", cmd_kmem, 0 },
330 { "lock", cmd_lock, 0 },
331 { "kvm", cmd_kvm, 0 },
332 { "test", cmd_test, 0 },
333 { "inject", cmd_inject, 0 },
304 }; 334 };
305 unsigned int i; 335 unsigned int i;
306 static const char ext[] = STRIP_EXTENSION; 336 static const char ext[] = STRIP_EXTENSION;
@@ -388,7 +418,7 @@ static int run_argv(int *argcp, const char ***argv)
388/* mini /proc/mounts parser: searching for "^blah /mount/point debugfs" */ 418/* mini /proc/mounts parser: searching for "^blah /mount/point debugfs" */
389static void get_debugfs_mntpt(void) 419static void get_debugfs_mntpt(void)
390{ 420{
391 const char *path = debugfs_find_mountpoint(); 421 const char *path = debugfs_mount(NULL);
392 422
393 if (path) 423 if (path)
394 strncpy(debugfs_mntpt, path, sizeof(debugfs_mntpt)); 424 strncpy(debugfs_mntpt, path, sizeof(debugfs_mntpt));
@@ -442,15 +472,15 @@ int main(int argc, const char **argv)
442 472
443 /* 473 /*
444 * We use PATH to find perf commands, but we prepend some higher 474 * We use PATH to find perf commands, but we prepend some higher
445 * precidence paths: the "--exec-path" option, the PERF_EXEC_PATH 475 * precedence paths: the "--exec-path" option, the PERF_EXEC_PATH
446 * environment, and the $(perfexecdir) from the Makefile at build 476 * environment, and the $(perfexecdir) from the Makefile at build
447 * time. 477 * time.
448 */ 478 */
449 setup_path(); 479 setup_path();
450 480
451 while (1) { 481 while (1) {
452 static int done_help = 0; 482 static int done_help;
453 static int was_alias = 0; 483 static int was_alias;
454 484
455 was_alias = run_argv(&argc, &argv); 485 was_alias = run_argv(&argc, &argv);
456 if (errno != ENOENT) 486 if (errno != ENOENT)
diff --git a/tools/perf/perf.h b/tools/perf/perf.h
index 75f941bfba9e..ef7aa0a0c526 100644
--- a/tools/perf/perf.h
+++ b/tools/perf/perf.h
@@ -1,6 +1,10 @@
1#ifndef _PERF_PERF_H 1#ifndef _PERF_PERF_H
2#define _PERF_PERF_H 2#define _PERF_PERF_H
3 3
4struct winsize;
5
6void get_term_dimensions(struct winsize *ws);
7
4#if defined(__i386__) 8#if defined(__i386__)
5#include "../../arch/x86/include/asm/unistd.h" 9#include "../../arch/x86/include/asm/unistd.h"
6#define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory") 10#define rmb() asm volatile("lock; addl $0,0(%%esp)" ::: "memory")
@@ -65,9 +69,7 @@
65 * Use the __kuser_memory_barrier helper in the CPU helper page. See 69 * Use the __kuser_memory_barrier helper in the CPU helper page. See
66 * arch/arm/kernel/entry-armv.S in the kernel source for details. 70 * arch/arm/kernel/entry-armv.S in the kernel source for details.
67 */ 71 */
68#define rmb() asm volatile("mov r0, #0xffff0fff; mov lr, pc;" \ 72#define rmb() ((void(*)(void))0xffff0fa0)()
69 "sub pc, r0, #95" ::: "r0", "lr", "cc", \
70 "memory")
71#define cpu_relax() asm volatile("":::"memory") 73#define cpu_relax() asm volatile("":::"memory")
72#endif 74#endif
73 75
@@ -78,6 +80,7 @@
78 80
79#include "../../include/linux/perf_event.h" 81#include "../../include/linux/perf_event.h"
80#include "util/types.h" 82#include "util/types.h"
83#include <stdbool.h>
81 84
82/* 85/*
83 * prctl(PR_TASK_PERF_EVENTS_DISABLE) will (cheaply) disable all 86 * prctl(PR_TASK_PERF_EVENTS_DISABLE) will (cheaply) disable all
@@ -104,8 +107,6 @@ static inline unsigned long long rdclock(void)
104#define __user 107#define __user
105#define asmlinkage 108#define asmlinkage
106 109
107#define __used __attribute__((__unused__))
108
109#define unlikely(x) __builtin_expect(!!(x), 0) 110#define unlikely(x) __builtin_expect(!!(x), 0)
110#define min(x, y) ({ \ 111#define min(x, y) ({ \
111 typeof(x) _min1 = (x); \ 112 typeof(x) _min1 = (x); \
@@ -131,4 +132,6 @@ struct ip_callchain {
131 u64 ips[0]; 132 u64 ips[0];
132}; 133};
133 134
135extern bool perf_host, perf_guest;
136
134#endif 137#endif
diff --git a/tools/perf/scripts/perl/Perf-Trace-Util/Context.c b/tools/perf/scripts/perl/Perf-Trace-Util/Context.c
index af78d9a52a7d..01a64ad693f2 100644
--- a/tools/perf/scripts/perl/Perf-Trace-Util/Context.c
+++ b/tools/perf/scripts/perl/Perf-Trace-Util/Context.c
@@ -31,13 +31,14 @@
31#include "EXTERN.h" 31#include "EXTERN.h"
32#include "perl.h" 32#include "perl.h"
33#include "XSUB.h" 33#include "XSUB.h"
34#include "../../../util/trace-event-perl.h" 34#include "../../../perf.h"
35#include "../../../util/trace-event.h"
35 36
36#ifndef PERL_UNUSED_VAR 37#ifndef PERL_UNUSED_VAR
37# define PERL_UNUSED_VAR(var) if (0) var = var 38# define PERL_UNUSED_VAR(var) if (0) var = var
38#endif 39#endif
39 40
40#line 41 "Context.c" 41#line 42 "Context.c"
41 42
42XS(XS_Perf__Trace__Context_common_pc); /* prototype to pass -Wmissing-prototypes */ 43XS(XS_Perf__Trace__Context_common_pc); /* prototype to pass -Wmissing-prototypes */
43XS(XS_Perf__Trace__Context_common_pc) 44XS(XS_Perf__Trace__Context_common_pc)
diff --git a/tools/perf/scripts/perl/Perf-Trace-Util/Context.xs b/tools/perf/scripts/perl/Perf-Trace-Util/Context.xs
index fb78006c165e..549cf0467d30 100644
--- a/tools/perf/scripts/perl/Perf-Trace-Util/Context.xs
+++ b/tools/perf/scripts/perl/Perf-Trace-Util/Context.xs
@@ -22,7 +22,8 @@
22#include "EXTERN.h" 22#include "EXTERN.h"
23#include "perl.h" 23#include "perl.h"
24#include "XSUB.h" 24#include "XSUB.h"
25#include "../../../util/trace-event-perl.h" 25#include "../../../perf.h"
26#include "../../../util/trace-event.h"
26 27
27MODULE = Perf::Trace::Context PACKAGE = Perf::Trace::Context 28MODULE = Perf::Trace::Context PACKAGE = Perf::Trace::Context
28PROTOTYPES: ENABLE 29PROTOTYPES: ENABLE
diff --git a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm
index 052f132ced24..d94b40c8ac85 100644
--- a/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm
+++ b/tools/perf/scripts/perl/Perf-Trace-Util/lib/Perf/Trace/Util.pm
@@ -15,6 +15,7 @@ our @EXPORT_OK = ( @{ $EXPORT_TAGS{'all'} } );
15 15
16our @EXPORT = qw( 16our @EXPORT = qw(
17avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs 17avg nsecs nsecs_secs nsecs_nsecs nsecs_usecs print_nsecs
18clear_term
18); 19);
19 20
20our $VERSION = '0.01'; 21our $VERSION = '0.01';
@@ -44,7 +45,7 @@ sub nsecs_secs {
44sub nsecs_nsecs { 45sub nsecs_nsecs {
45 my ($nsecs) = @_; 46 my ($nsecs) = @_;
46 47
47 return $nsecs - nsecs_secs($nsecs); 48 return $nsecs % $NSECS_PER_SEC;
48} 49}
49 50
50sub nsecs_str { 51sub nsecs_str {
@@ -55,6 +56,11 @@ sub nsecs_str {
55 return $str; 56 return $str;
56} 57}
57 58
59sub clear_term
60{
61 print "\x1b[H\x1b[2J";
62}
63
581; 641;
59__END__ 65__END__
60=head1 NAME 66=head1 NAME
diff --git a/tools/perf/scripts/perl/bin/check-perf-trace-record b/tools/perf/scripts/perl/bin/check-perf-trace-record
index c7ec5de2f535..423ad6aed056 100644
--- a/tools/perf/scripts/perl/bin/check-perf-trace-record
+++ b/tools/perf/scripts/perl/bin/check-perf-trace-record
@@ -1,7 +1,2 @@
1#!/bin/bash 1#!/bin/bash
2perf record -c 1 -f -a -M -R -e kmem:kmalloc -e irq:softirq_entry 2perf record -a -e kmem:kmalloc -e irq:softirq_entry -e kmem:kfree
3
4
5
6
7
diff --git a/tools/perf/scripts/perl/bin/check-perf-trace-report b/tools/perf/scripts/perl/bin/check-perf-trace-report
deleted file mode 100644
index 7fc4a033dd49..000000000000
--- a/tools/perf/scripts/perl/bin/check-perf-trace-report
+++ /dev/null
@@ -1,6 +0,0 @@
1#!/bin/bash
2# description: useless but exhaustive test script
3perf trace -s ~/libexec/perf-core/scripts/perl/check-perf-trace.pl
4
5
6
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-record b/tools/perf/scripts/perl/bin/failed-syscalls-record
new file mode 100644
index 000000000000..eb5846bcb565
--- /dev/null
+++ b/tools/perf/scripts/perl/bin/failed-syscalls-record
@@ -0,0 +1,2 @@
1#!/bin/bash
2perf record -a -e raw_syscalls:sys_exit $@
diff --git a/tools/perf/scripts/perl/bin/failed-syscalls-report b/tools/perf/scripts/perl/bin/failed-syscalls-report
new file mode 100644
index 000000000000..e3a5e55d54ff
--- /dev/null
+++ b/tools/perf/scripts/perl/bin/failed-syscalls-report
@@ -0,0 +1,10 @@
1#!/bin/bash
2# description: system-wide failed syscalls
3# args: [comm]
4if [ $# -gt 0 ] ; then
5 if ! expr match "$1" "-" > /dev/null ; then
6 comm=$1
7 shift
8 fi
9fi
10perf trace $@ -s ~/libexec/perf-core/scripts/perl/failed-syscalls.pl $comm
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-record b/tools/perf/scripts/perl/bin/rw-by-file-record
index b25056ebf963..5bfaae5a6cba 100644
--- a/tools/perf/scripts/perl/bin/rw-by-file-record
+++ b/tools/perf/scripts/perl/bin/rw-by-file-record
@@ -1,2 +1,3 @@
1#!/bin/bash 1#!/bin/bash
2perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_enter_write 2perf record -a -e syscalls:sys_enter_read -e syscalls:sys_enter_write $@
3
diff --git a/tools/perf/scripts/perl/bin/rw-by-file-report b/tools/perf/scripts/perl/bin/rw-by-file-report
index eddb9ccce6a5..d83070b7eeb5 100644
--- a/tools/perf/scripts/perl/bin/rw-by-file-report
+++ b/tools/perf/scripts/perl/bin/rw-by-file-report
@@ -1,7 +1,13 @@
1#!/bin/bash 1#!/bin/bash
2# description: r/w activity for a program, by file 2# description: r/w activity for a program, by file
3# args: <comm> 3# args: <comm>
4perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $1 4if [ $# -lt 1 ] ; then
5 echo "usage: rw-by-file <comm>"
6 exit
7fi
8comm=$1
9shift
10perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-file.pl $comm
5 11
6 12
7 13
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-record b/tools/perf/scripts/perl/bin/rw-by-pid-record
index 8903979c5b6c..6e0b2f7755ac 100644
--- a/tools/perf/scripts/perl/bin/rw-by-pid-record
+++ b/tools/perf/scripts/perl/bin/rw-by-pid-record
@@ -1,2 +1,2 @@
1#!/bin/bash 1#!/bin/bash
2perf record -c 1 -f -a -M -R -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write 2perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@
diff --git a/tools/perf/scripts/perl/bin/rw-by-pid-report b/tools/perf/scripts/perl/bin/rw-by-pid-report
index 7f44c25cc857..7ef46983f62f 100644
--- a/tools/perf/scripts/perl/bin/rw-by-pid-report
+++ b/tools/perf/scripts/perl/bin/rw-by-pid-report
@@ -1,6 +1,6 @@
1#!/bin/bash 1#!/bin/bash
2# description: system-wide r/w activity 2# description: system-wide r/w activity
3perf trace -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl 3perf trace $@ -s ~/libexec/perf-core/scripts/perl/rw-by-pid.pl
4 4
5 5
6 6
diff --git a/tools/perf/scripts/perl/bin/rwtop-record b/tools/perf/scripts/perl/bin/rwtop-record
new file mode 100644
index 000000000000..6e0b2f7755ac
--- /dev/null
+++ b/tools/perf/scripts/perl/bin/rwtop-record
@@ -0,0 +1,2 @@
1#!/bin/bash
2perf record -a -e syscalls:sys_enter_read -e syscalls:sys_exit_read -e syscalls:sys_enter_write -e syscalls:sys_exit_write $@
diff --git a/tools/perf/scripts/perl/bin/rwtop-report b/tools/perf/scripts/perl/bin/rwtop-report
new file mode 100644
index 000000000000..93e698cd3f38
--- /dev/null
+++ b/tools/perf/scripts/perl/bin/rwtop-report
@@ -0,0 +1,23 @@
1#!/bin/bash
2# description: system-wide r/w top
3# args: [interval]
4n_args=0
5for i in "$@"
6do
7 if expr match "$i" "-" > /dev/null ; then
8 break
9 fi
10 n_args=$(( $n_args + 1 ))
11done
12if [ "$n_args" -gt 1 ] ; then
13 echo "usage: rwtop-report [interval]"
14 exit
15fi
16if [ "$n_args" -gt 0 ] ; then
17 interval=$1
18 shift
19fi
20perf trace $@ -s ~/libexec/perf-core/scripts/perl/rwtop.pl $interval
21
22
23
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-record b/tools/perf/scripts/perl/bin/wakeup-latency-record
index 6abedda911a4..9f2acaaae9f0 100644
--- a/tools/perf/scripts/perl/bin/wakeup-latency-record
+++ b/tools/perf/scripts/perl/bin/wakeup-latency-record
@@ -1,5 +1,5 @@
1#!/bin/bash 1#!/bin/bash
2perf record -c 1 -f -a -M -R -e sched:sched_switch -e sched:sched_wakeup 2perf record -a -e sched:sched_switch -e sched:sched_wakeup $@
3 3
4 4
5 5
diff --git a/tools/perf/scripts/perl/bin/wakeup-latency-report b/tools/perf/scripts/perl/bin/wakeup-latency-report
index fce3adcb3249..a0d898f9ca1d 100644
--- a/tools/perf/scripts/perl/bin/wakeup-latency-report
+++ b/tools/perf/scripts/perl/bin/wakeup-latency-report
@@ -1,6 +1,6 @@
1#!/bin/bash 1#!/bin/bash
2# description: system-wide min/max/avg wakeup latency 2# description: system-wide min/max/avg wakeup latency
3perf trace -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl 3perf trace $@ -s ~/libexec/perf-core/scripts/perl/wakeup-latency.pl
4 4
5 5
6 6
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-record b/tools/perf/scripts/perl/bin/workqueue-stats-record
index fce6637b19ba..85301f2471ff 100644
--- a/tools/perf/scripts/perl/bin/workqueue-stats-record
+++ b/tools/perf/scripts/perl/bin/workqueue-stats-record
@@ -1,2 +1,2 @@
1#!/bin/bash 1#!/bin/bash
2perf record -c 1 -f -a -M -R -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion 2perf record -a -e workqueue:workqueue_creation -e workqueue:workqueue_destruction -e workqueue:workqueue_execution -e workqueue:workqueue_insertion $@
diff --git a/tools/perf/scripts/perl/bin/workqueue-stats-report b/tools/perf/scripts/perl/bin/workqueue-stats-report
index 71cfbd182fb9..35081132ef97 100644
--- a/tools/perf/scripts/perl/bin/workqueue-stats-report
+++ b/tools/perf/scripts/perl/bin/workqueue-stats-report
@@ -1,6 +1,6 @@
1#!/bin/bash 1#!/bin/bash
2# description: workqueue stats (ins/exe/create/destroy) 2# description: workqueue stats (ins/exe/create/destroy)
3perf trace -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl 3perf trace $@ -s ~/libexec/perf-core/scripts/perl/workqueue-stats.pl
4 4
5 5
6 6
diff --git a/tools/perf/scripts/perl/failed-syscalls.pl b/tools/perf/scripts/perl/failed-syscalls.pl
new file mode 100644
index 000000000000..94bc25a347eb
--- /dev/null
+++ b/tools/perf/scripts/perl/failed-syscalls.pl
@@ -0,0 +1,42 @@
1# failed system call counts
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# Displays system-wide failed system call totals
6# If a [comm] arg is specified, only syscalls called by [comm] are displayed.
7
8use lib "$ENV{'PERF_EXEC_PATH'}/scripts/perl/Perf-Trace-Util/lib";
9use lib "./Perf-Trace-Util/lib";
10use Perf::Trace::Core;
11use Perf::Trace::Context;
12use Perf::Trace::Util;
13
14my $for_comm = shift;
15
16my %failed_syscalls;
17
18sub raw_syscalls::sys_exit
19{
20 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
21 $common_pid, $common_comm,
22 $id, $ret) = @_;
23
24 if ($ret < 0) {
25 $failed_syscalls{$common_comm}++;
26 }
27}
28
29sub trace_end
30{
31 printf("\nfailed syscalls by comm:\n\n");
32
33 printf("%-20s %10s\n", "comm", "# errors");
34 printf("%-20s %6s %10s\n", "--------------------", "----------");
35
36 foreach my $comm (sort {$failed_syscalls{$b} <=> $failed_syscalls{$a}}
37 keys %failed_syscalls) {
38 next if ($for_comm && $comm ne $for_comm);
39
40 printf("%-20s %10s\n", $comm, $failed_syscalls{$comm});
41 }
42}
diff --git a/tools/perf/scripts/perl/rw-by-pid.pl b/tools/perf/scripts/perl/rw-by-pid.pl
index da601fae1a00..9db23c9daf55 100644
--- a/tools/perf/scripts/perl/rw-by-pid.pl
+++ b/tools/perf/scripts/perl/rw-by-pid.pl
@@ -79,12 +79,12 @@ sub trace_end
79 printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------", 79 printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------",
80 "-----------", "----------", "----------"); 80 "-----------", "----------", "----------");
81 81
82 foreach my $pid (sort {$reads{$b}{bytes_read} <=> 82 foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=>
83 $reads{$a}{bytes_read}} keys %reads) { 83 ($reads{$a}{bytes_read} || 0) } keys %reads) {
84 my $comm = $reads{$pid}{comm}; 84 my $comm = $reads{$pid}{comm} || "";
85 my $total_reads = $reads{$pid}{total_reads}; 85 my $total_reads = $reads{$pid}{total_reads} || 0;
86 my $bytes_requested = $reads{$pid}{bytes_requested}; 86 my $bytes_requested = $reads{$pid}{bytes_requested} || 0;
87 my $bytes_read = $reads{$pid}{bytes_read}; 87 my $bytes_read = $reads{$pid}{bytes_read} || 0;
88 88
89 printf("%6s %-20s %10s %10s %10s\n", $pid, $comm, 89 printf("%6s %-20s %10s %10s %10s\n", $pid, $comm,
90 $total_reads, $bytes_requested, $bytes_read); 90 $total_reads, $bytes_requested, $bytes_read);
@@ -96,16 +96,23 @@ sub trace_end
96 printf("%6s %20s %6s %10s\n", "------", "--------------------", 96 printf("%6s %20s %6s %10s\n", "------", "--------------------",
97 "------", "----------"); 97 "------", "----------");
98 98
99 foreach my $pid (keys %reads) { 99 my @errcounts = ();
100 my $comm = $reads{$pid}{comm};
101 foreach my $err (sort {$reads{$b}{comm} cmp $reads{$a}{comm}}
102 keys %{$reads{$pid}{errors}}) {
103 my $errors = $reads{$pid}{errors}{$err};
104 100
105 printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); 101 foreach my $pid (keys %reads) {
102 foreach my $error (keys %{$reads{$pid}{errors}}) {
103 my $comm = $reads{$pid}{comm} || "";
104 my $errcount = $reads{$pid}{errors}{$error} || 0;
105 push @errcounts, [$pid, $comm, $error, $errcount];
106 } 106 }
107 } 107 }
108 108
109 @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts;
110
111 for my $i (0 .. $#errcounts) {
112 printf("%6d %-20s %6d %10s\n", $errcounts[$i][0],
113 $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]);
114 }
115
109 printf("\nwrite counts by pid:\n\n"); 116 printf("\nwrite counts by pid:\n\n");
110 117
111 printf("%6s %20s %10s %10s\n", "pid", "comm", 118 printf("%6s %20s %10s %10s\n", "pid", "comm",
@@ -113,11 +120,11 @@ sub trace_end
113 printf("%6s %-20s %10s %10s\n", "------", "--------------------", 120 printf("%6s %-20s %10s %10s\n", "------", "--------------------",
114 "-----------", "----------"); 121 "-----------", "----------");
115 122
116 foreach my $pid (sort {$writes{$b}{bytes_written} <=> 123 foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=>
117 $writes{$a}{bytes_written}} keys %writes) { 124 ($writes{$a}{bytes_written} || 0)} keys %writes) {
118 my $comm = $writes{$pid}{comm}; 125 my $comm = $writes{$pid}{comm} || "";
119 my $total_writes = $writes{$pid}{total_writes}; 126 my $total_writes = $writes{$pid}{total_writes} || 0;
120 my $bytes_written = $writes{$pid}{bytes_written}; 127 my $bytes_written = $writes{$pid}{bytes_written} || 0;
121 128
122 printf("%6s %-20s %10s %10s\n", $pid, $comm, 129 printf("%6s %-20s %10s %10s\n", $pid, $comm,
123 $total_writes, $bytes_written); 130 $total_writes, $bytes_written);
@@ -129,16 +136,23 @@ sub trace_end
129 printf("%6s %20s %6s %10s\n", "------", "--------------------", 136 printf("%6s %20s %6s %10s\n", "------", "--------------------",
130 "------", "----------"); 137 "------", "----------");
131 138
132 foreach my $pid (keys %writes) { 139 @errcounts = ();
133 my $comm = $writes{$pid}{comm};
134 foreach my $err (sort {$writes{$b}{comm} cmp $writes{$a}{comm}}
135 keys %{$writes{$pid}{errors}}) {
136 my $errors = $writes{$pid}{errors}{$err};
137 140
138 printf("%6d %-20s %6d %10s\n", $pid, $comm, $err, $errors); 141 foreach my $pid (keys %writes) {
142 foreach my $error (keys %{$writes{$pid}{errors}}) {
143 my $comm = $writes{$pid}{comm} || "";
144 my $errcount = $writes{$pid}{errors}{$error} || 0;
145 push @errcounts, [$pid, $comm, $error, $errcount];
139 } 146 }
140 } 147 }
141 148
149 @errcounts = sort { $b->[3] <=> $a->[3] } @errcounts;
150
151 for my $i (0 .. $#errcounts) {
152 printf("%6d %-20s %6d %10s\n", $errcounts[$i][0],
153 $errcounts[$i][1], $errcounts[$i][2], $errcounts[$i][3]);
154 }
155
142 print_unhandled(); 156 print_unhandled();
143} 157}
144 158
diff --git a/tools/perf/scripts/perl/rwtop.pl b/tools/perf/scripts/perl/rwtop.pl
new file mode 100644
index 000000000000..4bb3ecd33472
--- /dev/null
+++ b/tools/perf/scripts/perl/rwtop.pl
@@ -0,0 +1,199 @@
1#!/usr/bin/perl -w
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4
5# read/write top
6#
7# Periodically displays system-wide r/w call activity, broken down by
8# pid. If an [interval] arg is specified, the display will be
9# refreshed every [interval] seconds. The default interval is 3
10# seconds.
11
12use 5.010000;
13use strict;
14use warnings;
15
16use lib "$ENV{'PERF_EXEC_PATH'}/scripts/perl/Perf-Trace-Util/lib";
17use lib "./Perf-Trace-Util/lib";
18use Perf::Trace::Core;
19use Perf::Trace::Util;
20
21my $default_interval = 3;
22my $nlines = 20;
23my $print_thread;
24my $print_pending = 0;
25
26my %reads;
27my %writes;
28
29my $interval = shift;
30if (!$interval) {
31 $interval = $default_interval;
32}
33
34sub syscalls::sys_exit_read
35{
36 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
37 $common_pid, $common_comm,
38 $nr, $ret) = @_;
39
40 print_check();
41
42 if ($ret > 0) {
43 $reads{$common_pid}{bytes_read} += $ret;
44 } else {
45 if (!defined ($reads{$common_pid}{bytes_read})) {
46 $reads{$common_pid}{bytes_read} = 0;
47 }
48 $reads{$common_pid}{errors}{$ret}++;
49 }
50}
51
52sub syscalls::sys_enter_read
53{
54 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
55 $common_pid, $common_comm,
56 $nr, $fd, $buf, $count) = @_;
57
58 print_check();
59
60 $reads{$common_pid}{bytes_requested} += $count;
61 $reads{$common_pid}{total_reads}++;
62 $reads{$common_pid}{comm} = $common_comm;
63}
64
65sub syscalls::sys_exit_write
66{
67 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
68 $common_pid, $common_comm,
69 $nr, $ret) = @_;
70
71 print_check();
72
73 if ($ret <= 0) {
74 $writes{$common_pid}{errors}{$ret}++;
75 }
76}
77
78sub syscalls::sys_enter_write
79{
80 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
81 $common_pid, $common_comm,
82 $nr, $fd, $buf, $count) = @_;
83
84 print_check();
85
86 $writes{$common_pid}{bytes_written} += $count;
87 $writes{$common_pid}{total_writes}++;
88 $writes{$common_pid}{comm} = $common_comm;
89}
90
91sub trace_begin
92{
93 $SIG{ALRM} = \&set_print_pending;
94 alarm 1;
95}
96
97sub trace_end
98{
99 print_unhandled();
100 print_totals();
101}
102
103sub print_check()
104{
105 if ($print_pending == 1) {
106 $print_pending = 0;
107 print_totals();
108 }
109}
110
111sub set_print_pending()
112{
113 $print_pending = 1;
114 alarm $interval;
115}
116
117sub print_totals
118{
119 my $count;
120
121 $count = 0;
122
123 clear_term();
124
125 printf("\nread counts by pid:\n\n");
126
127 printf("%6s %20s %10s %10s %10s\n", "pid", "comm",
128 "# reads", "bytes_req", "bytes_read");
129 printf("%6s %-20s %10s %10s %10s\n", "------", "--------------------",
130 "----------", "----------", "----------");
131
132 foreach my $pid (sort { ($reads{$b}{bytes_read} || 0) <=>
133 ($reads{$a}{bytes_read} || 0) } keys %reads) {
134 my $comm = $reads{$pid}{comm} || "";
135 my $total_reads = $reads{$pid}{total_reads} || 0;
136 my $bytes_requested = $reads{$pid}{bytes_requested} || 0;
137 my $bytes_read = $reads{$pid}{bytes_read} || 0;
138
139 printf("%6s %-20s %10s %10s %10s\n", $pid, $comm,
140 $total_reads, $bytes_requested, $bytes_read);
141
142 if (++$count == $nlines) {
143 last;
144 }
145 }
146
147 $count = 0;
148
149 printf("\nwrite counts by pid:\n\n");
150
151 printf("%6s %20s %10s %13s\n", "pid", "comm",
152 "# writes", "bytes_written");
153 printf("%6s %-20s %10s %13s\n", "------", "--------------------",
154 "----------", "-------------");
155
156 foreach my $pid (sort { ($writes{$b}{bytes_written} || 0) <=>
157 ($writes{$a}{bytes_written} || 0)} keys %writes) {
158 my $comm = $writes{$pid}{comm} || "";
159 my $total_writes = $writes{$pid}{total_writes} || 0;
160 my $bytes_written = $writes{$pid}{bytes_written} || 0;
161
162 printf("%6s %-20s %10s %13s\n", $pid, $comm,
163 $total_writes, $bytes_written);
164
165 if (++$count == $nlines) {
166 last;
167 }
168 }
169
170 %reads = ();
171 %writes = ();
172}
173
174my %unhandled;
175
176sub print_unhandled
177{
178 if ((scalar keys %unhandled) == 0) {
179 return;
180 }
181
182 print "\nunhandled events:\n\n";
183
184 printf("%-40s %10s\n", "event", "count");
185 printf("%-40s %10s\n", "----------------------------------------",
186 "-----------");
187
188 foreach my $event_name (keys %unhandled) {
189 printf("%-40s %10d\n", $event_name, $unhandled{$event_name});
190 }
191}
192
193sub trace_unhandled
194{
195 my ($event_name, $context, $common_cpu, $common_secs, $common_nsecs,
196 $common_pid, $common_comm) = @_;
197
198 $unhandled{$event_name}++;
199}
diff --git a/tools/perf/scripts/perl/wakeup-latency.pl b/tools/perf/scripts/perl/wakeup-latency.pl
index ed58ef284e23..d9143dcec6c6 100644
--- a/tools/perf/scripts/perl/wakeup-latency.pl
+++ b/tools/perf/scripts/perl/wakeup-latency.pl
@@ -22,8 +22,8 @@ my %last_wakeup;
22 22
23my $max_wakeup_latency; 23my $max_wakeup_latency;
24my $min_wakeup_latency; 24my $min_wakeup_latency;
25my $total_wakeup_latency; 25my $total_wakeup_latency = 0;
26my $total_wakeups; 26my $total_wakeups = 0;
27 27
28sub sched::sched_switch 28sub sched::sched_switch
29{ 29{
@@ -67,8 +67,12 @@ sub trace_end
67{ 67{
68 printf("wakeup_latency stats:\n\n"); 68 printf("wakeup_latency stats:\n\n");
69 print "total_wakeups: $total_wakeups\n"; 69 print "total_wakeups: $total_wakeups\n";
70 printf("avg_wakeup_latency (ns): %u\n", 70 if ($total_wakeups) {
71 avg($total_wakeup_latency, $total_wakeups)); 71 printf("avg_wakeup_latency (ns): %u\n",
72 avg($total_wakeup_latency, $total_wakeups));
73 } else {
74 printf("avg_wakeup_latency (ns): N/A\n");
75 }
72 printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency); 76 printf("min_wakeup_latency (ns): %u\n", $min_wakeup_latency);
73 printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency); 77 printf("max_wakeup_latency (ns): %u\n", $max_wakeup_latency);
74 78
diff --git a/tools/perf/scripts/perl/workqueue-stats.pl b/tools/perf/scripts/perl/workqueue-stats.pl
index 511302c8a494..b84b12699b70 100644
--- a/tools/perf/scripts/perl/workqueue-stats.pl
+++ b/tools/perf/scripts/perl/workqueue-stats.pl
@@ -71,9 +71,9 @@ sub trace_end
71 printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----"); 71 printf("%3s %6s %6s\t%-20s\n", "---", "---", "----", "----");
72 foreach my $pidhash (@cpus) { 72 foreach my $pidhash (@cpus) {
73 while ((my $pid, my $wqhash) = each %$pidhash) { 73 while ((my $pid, my $wqhash) = each %$pidhash) {
74 my $ins = $$wqhash{'inserted'}; 74 my $ins = $$wqhash{'inserted'} || 0;
75 my $exe = $$wqhash{'executed'}; 75 my $exe = $$wqhash{'executed'} || 0;
76 my $comm = $$wqhash{'comm'}; 76 my $comm = $$wqhash{'comm'} || "";
77 if ($ins || $exe) { 77 if ($ins || $exe) {
78 printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm); 78 printf("%3u %6u %6u\t%-20s\n", $cpu, $ins, $exe, $comm);
79 } 79 }
@@ -87,9 +87,9 @@ sub trace_end
87 printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----"); 87 printf("%3s %6s %6s\t%-20s\n", "---", "-------", "---------", "----");
88 foreach my $pidhash (@cpus) { 88 foreach my $pidhash (@cpus) {
89 while ((my $pid, my $wqhash) = each %$pidhash) { 89 while ((my $pid, my $wqhash) = each %$pidhash) {
90 my $created = $$wqhash{'created'}; 90 my $created = $$wqhash{'created'} || 0;
91 my $destroyed = $$wqhash{'destroyed'}; 91 my $destroyed = $$wqhash{'destroyed'} || 0;
92 my $comm = $$wqhash{'comm'}; 92 my $comm = $$wqhash{'comm'} || "";
93 if ($created || $destroyed) { 93 if ($created || $destroyed) {
94 printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed, 94 printf("%3u %6u %6u\t%-20s\n", $cpu, $created, $destroyed,
95 $comm); 95 $comm);
diff --git a/tools/perf/scripts/python/Perf-Trace-Util/Context.c b/tools/perf/scripts/python/Perf-Trace-Util/Context.c
new file mode 100644
index 000000000000..957085dd5d8d
--- /dev/null
+++ b/tools/perf/scripts/python/Perf-Trace-Util/Context.c
@@ -0,0 +1,88 @@
1/*
2 * Context.c. Python interfaces for perf trace.
3 *
4 * Copyright (C) 2010 Tom Zanussi <tzanussi@gmail.com>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 *
20 */
21
22#include <Python.h>
23#include "../../../perf.h"
24#include "../../../util/trace-event.h"
25
26PyMODINIT_FUNC initperf_trace_context(void);
27
28static PyObject *perf_trace_context_common_pc(PyObject *self, PyObject *args)
29{
30 static struct scripting_context *scripting_context;
31 PyObject *context;
32 int retval;
33
34 if (!PyArg_ParseTuple(args, "O", &context))
35 return NULL;
36
37 scripting_context = PyCObject_AsVoidPtr(context);
38 retval = common_pc(scripting_context);
39
40 return Py_BuildValue("i", retval);
41}
42
43static PyObject *perf_trace_context_common_flags(PyObject *self,
44 PyObject *args)
45{
46 static struct scripting_context *scripting_context;
47 PyObject *context;
48 int retval;
49
50 if (!PyArg_ParseTuple(args, "O", &context))
51 return NULL;
52
53 scripting_context = PyCObject_AsVoidPtr(context);
54 retval = common_flags(scripting_context);
55
56 return Py_BuildValue("i", retval);
57}
58
59static PyObject *perf_trace_context_common_lock_depth(PyObject *self,
60 PyObject *args)
61{
62 static struct scripting_context *scripting_context;
63 PyObject *context;
64 int retval;
65
66 if (!PyArg_ParseTuple(args, "O", &context))
67 return NULL;
68
69 scripting_context = PyCObject_AsVoidPtr(context);
70 retval = common_lock_depth(scripting_context);
71
72 return Py_BuildValue("i", retval);
73}
74
75static PyMethodDef ContextMethods[] = {
76 { "common_pc", perf_trace_context_common_pc, METH_VARARGS,
77 "Get the common preempt count event field value."},
78 { "common_flags", perf_trace_context_common_flags, METH_VARARGS,
79 "Get the common flags event field value."},
80 { "common_lock_depth", perf_trace_context_common_lock_depth,
81 METH_VARARGS, "Get the common lock depth event field value."},
82 { NULL, NULL, 0, NULL}
83};
84
85PyMODINIT_FUNC initperf_trace_context(void)
86{
87 (void) Py_InitModule("perf_trace_context", ContextMethods);
88}
diff --git a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Core.py b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Core.py
new file mode 100644
index 000000000000..1dc464ee2ca8
--- /dev/null
+++ b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Core.py
@@ -0,0 +1,91 @@
1# Core.py - Python extension for perf trace, core functions
2#
3# Copyright (C) 2010 by Tom Zanussi <tzanussi@gmail.com>
4#
5# This software may be distributed under the terms of the GNU General
6# Public License ("GPL") version 2 as published by the Free Software
7# Foundation.
8
9from collections import defaultdict
10
def autodict():
	"""Return a defaultdict whose missing values are themselves autodicts."""
	return defaultdict(autodict)

# Lookup tables indexed by event name, then field name.  They are filled
# in by the define_* functions below.
flag_fields = autodict()
symbolic_fields = autodict()

def define_flag_field(event_name, field_name, delim):
	"""Store the delimiter string of a flag field."""
	field = flag_fields[event_name][field_name]
	field['delim'] = delim

def define_flag_value(event_name, field_name, value, field_str):
	"""Associate one value of a flag field with its display string."""
	values = flag_fields[event_name][field_name]['values']
	values[value] = field_str

def define_symbolic_field(event_name, field_name):
	"""Accept a symbolic field definition; nothing needs to be stored."""
	return None

def define_symbolic_value(event_name, field_name, value, field_str):
	"""Associate one value of a symbolic field with its display string."""
	values = symbolic_fields[event_name][field_name]['values']
	values[value] = field_str
29
def flag_str(event_name, field_name, value):
	"""Return the display strings of the flags set in value.

	Looks up the values registered in flag_fields for the given event and
	field, in ascending key order.  A zero value maps to the string
	registered for key 0 (if any).  Otherwise the string of every
	registered non-zero key fully contained in value is appended,
	separated by " <delim> " when a delimiter was defined for the field.
	Returns "" when nothing is registered or nothing matches.
	"""
	string = ""

	field = flag_fields[event_name][field_name]
	if field:
		print_delim = 0
		# sorted() rather than keys().sort(): on Python 3 keys() is a
		# view object without a sort() method.
		for idx in sorted(field['values'].keys()):
			if not value and not idx:
				string += field['values'][idx]
				break
			if idx and (value & idx) == idx:
				if print_delim and field['delim']:
					string += " " + field['delim'] + " "
				string += field['values'][idx]
				print_delim = 1
				# drop the bits just reported
				value &= ~idx

	return string
49
def symbol_str(event_name, field_name, value):
	"""Return the display string registered for value, or "".

	Looks up the values registered in symbolic_fields for the given event
	and field, in ascending key order, and returns the string of the first
	key that equals value (a false value also matches a false key).
	"""
	string = ""

	field = symbolic_fields[event_name][field_name]
	if field:
		# sorted() rather than keys().sort(): on Python 3 keys() is a
		# view object without a sort() method.
		for idx in sorted(field['values'].keys()):
			if not value and not idx:
				string = field['values'][idx]
				break
			if (value == idx):
				string = field['values'][idx]
				break

	return string
65
# Display names of the individual trace flag bits (0 means no flag set).
trace_flags = { 0x00: "NONE", \
		0x01: "IRQS_OFF", \
		0x02: "IRQS_NOSUPPORT", \
		0x04: "NEED_RESCHED", \
		0x08: "HARDIRQ", \
		0x10: "SOFTIRQ" }

def trace_flag_str(value):
	"""Return the names of the trace flags set in value, joined by " | ".

	A zero value yields "NONE"; bits without an entry in trace_flags are
	ignored, so a value made only of unknown bits yields "".
	"""
	string = ""
	print_delim = 0

	# Walk the keys in ascending order: the zero key is then always seen
	# first and the names come out in a deterministic order.
	for idx in sorted(trace_flags.keys()):
		if not value and not idx:
			string += "NONE"
			break

		if idx and (value & idx) == idx:
			if print_delim:
				string += " | "
			string += trace_flags[idx]
			print_delim = 1
			# drop the bit just reported
			value &= ~idx

	return string
diff --git a/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py
new file mode 100644
index 000000000000..9689bc0acd9f
--- /dev/null
+++ b/tools/perf/scripts/python/Perf-Trace-Util/lib/Perf/Trace/Util.py
@@ -0,0 +1,28 @@
1# Util.py - Python extension for perf trace, miscellaneous utility code
2#
3# Copyright (C) 2010 by Tom Zanussi <tzanussi@gmail.com>
4#
5# This software may be distributed under the terms of the GNU General
6# Public License ("GPL") version 2 as published by the Free Software
7# Foundation.
8
NSECS_PER_SEC = 1000000000

def avg(total, n):
	"""Return total divided by n."""
	return total / n

def nsecs(secs, nsecs):
	"""Combine a seconds count and a nanoseconds count into nanoseconds."""
	return secs * NSECS_PER_SEC + nsecs

def nsecs_secs(nsecs):
	"""Return the whole-seconds part of a nanosecond count."""
	# Floor division keeps the result integral on Python 3 as well; for
	# integer input on Python 2 it is identical to "/".
	return nsecs // NSECS_PER_SEC

def nsecs_nsecs(nsecs):
	"""Return the sub-second remainder of a nanosecond count."""
	return nsecs % NSECS_PER_SEC

def nsecs_str(nsecs):
	"""Format a nanosecond count as "secs.nnnnnnnnn" and return the string."""
	# The original statement ended in a stray comma, which made the result
	# a one-element tuple instead of a string (and shadowed builtin str).
	formatted = "%5u.%09u" % (nsecs_secs(nsecs), nsecs_nsecs(nsecs))
	return formatted

def clear_term():
	"""Write the escape sequences ESC[H and ESC[2J to standard output."""
	print("\x1b[H\x1b[2J")
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record
new file mode 100644
index 000000000000..eb5846bcb565
--- /dev/null
+++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-record
@@ -0,0 +1,2 @@
#!/bin/bash
# Record raw_syscalls:sys_exit events system-wide.  Any arguments are passed
# on to perf record; "$@" is quoted so that arguments containing whitespace
# reach perf unchanged.
perf record -a -e raw_syscalls:sys_exit "$@"
diff --git a/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report
new file mode 100644
index 000000000000..30293545fcc2
--- /dev/null
+++ b/tools/perf/scripts/python/bin/failed-syscalls-by-pid-report
@@ -0,0 +1,10 @@
#!/bin/bash
# description: system-wide failed syscalls, by pid
# args: [comm]

# A first argument that does not start with "-" is taken as the comm filter;
# everything else is passed on to perf trace.
if [ $# -gt 0 ] ; then
    if ! expr match "$1" "-" > /dev/null ; then
	comm=$1
	shift
    fi
fi
# Quoted so that arguments containing whitespace survive; ${comm:+...} adds
# the comm argument only when one was given.
perf trace "$@" -s ~/libexec/perf-core/scripts/python/failed-syscalls-by-pid.py ${comm:+"$comm"}
diff --git a/tools/perf/scripts/python/bin/sctop-record b/tools/perf/scripts/python/bin/sctop-record
new file mode 100644
index 000000000000..1fc5998b721d
--- /dev/null
+++ b/tools/perf/scripts/python/bin/sctop-record
@@ -0,0 +1,2 @@
#!/bin/bash
# Record raw_syscalls:sys_enter events system-wide.  Any arguments are passed
# on to perf record; "$@" is quoted so that arguments containing whitespace
# reach perf unchanged.
perf record -a -e raw_syscalls:sys_enter "$@"
diff --git a/tools/perf/scripts/python/bin/sctop-report b/tools/perf/scripts/python/bin/sctop-report
new file mode 100644
index 000000000000..b01c842ae7b4
--- /dev/null
+++ b/tools/perf/scripts/python/bin/sctop-report
@@ -0,0 +1,24 @@
#!/bin/bash
# description: syscall top
# args: [comm] [interval]

# Count the leading arguments that do not start with "-"; the first one that
# does, and everything after it, is passed on to perf trace.
n_args=0
for i in "$@"
do
    if expr match "$i" "-" > /dev/null ; then
	break
    fi
    n_args=$(( $n_args + 1 ))
done
if [ "$n_args" -gt 2 ] ; then
    echo "usage: sctop-report [comm] [interval]"
    # a usage error is a failure, so do not exit with status 0
    exit 1
fi
if [ "$n_args" -gt 1 ] ; then
    comm=$1
    interval=$2
    shift 2
elif [ "$n_args" -gt 0 ] ; then
    # a single argument is handed over in the interval slot
    interval=$1
    shift
fi
# Quoted so that arguments containing whitespace survive; the ${var:+...}
# forms add comm / interval only when they were given.
perf trace "$@" -s ~/libexec/perf-core/scripts/python/sctop.py ${comm:+"$comm"} ${interval:+"$interval"}
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-record b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record
new file mode 100644
index 000000000000..1fc5998b721d
--- /dev/null
+++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-record
@@ -0,0 +1,2 @@
#!/bin/bash
# Record raw_syscalls:sys_enter events system-wide.  Any arguments are passed
# on to perf record; "$@" is quoted so that arguments containing whitespace
# reach perf unchanged.
perf record -a -e raw_syscalls:sys_enter "$@"
diff --git a/tools/perf/scripts/python/bin/syscall-counts-by-pid-report b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report
new file mode 100644
index 000000000000..9e9d8ddd72ce
--- /dev/null
+++ b/tools/perf/scripts/python/bin/syscall-counts-by-pid-report
@@ -0,0 +1,10 @@
#!/bin/bash
# description: system-wide syscall counts, by pid
# args: [comm]

# A first argument that does not start with "-" is taken as the comm filter;
# everything else is passed on to perf trace.
if [ $# -gt 0 ] ; then
    if ! expr match "$1" "-" > /dev/null ; then
	comm=$1
	shift
    fi
fi
# Quoted so that arguments containing whitespace survive; ${comm:+...} adds
# the comm argument only when one was given.
perf trace "$@" -s ~/libexec/perf-core/scripts/python/syscall-counts-by-pid.py ${comm:+"$comm"}
diff --git a/tools/perf/scripts/python/bin/syscall-counts-record b/tools/perf/scripts/python/bin/syscall-counts-record
new file mode 100644
index 000000000000..1fc5998b721d
--- /dev/null
+++ b/tools/perf/scripts/python/bin/syscall-counts-record
@@ -0,0 +1,2 @@
#!/bin/bash
# Record raw_syscalls:sys_enter events system-wide.  Any arguments are passed
# on to perf record; "$@" is quoted so that arguments containing whitespace
# reach perf unchanged.
perf record -a -e raw_syscalls:sys_enter "$@"
diff --git a/tools/perf/scripts/python/bin/syscall-counts-report b/tools/perf/scripts/python/bin/syscall-counts-report
new file mode 100644
index 000000000000..dc076b618796
--- /dev/null
+++ b/tools/perf/scripts/python/bin/syscall-counts-report
@@ -0,0 +1,10 @@
#!/bin/bash
# description: system-wide syscall counts
# args: [comm]

# A first argument that does not start with "-" is taken as the comm filter;
# everything else is passed on to perf trace.
if [ $# -gt 0 ] ; then
    if ! expr match "$1" "-" > /dev/null ; then
	comm=$1
	shift
    fi
fi
# Quoted so that arguments containing whitespace survive; ${comm:+...} adds
# the comm argument only when one was given.
perf trace "$@" -s ~/libexec/perf-core/scripts/python/syscall-counts.py ${comm:+"$comm"}
diff --git a/tools/perf/scripts/python/check-perf-trace.py b/tools/perf/scripts/python/check-perf-trace.py
new file mode 100644
index 000000000000..d9f7893e315c
--- /dev/null
+++ b/tools/perf/scripts/python/check-perf-trace.py
@@ -0,0 +1,82 @@
1# perf trace event handlers, generated by perf trace -g python
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# This script tests basic functionality such as flag and symbol
6# strings, common_xxx() calls back into perf, begin, end, unhandled
7# events, etc. Basically, if this script runs successfully and
8# displays expected results, Python scripting support should be ok.
9
10import os
11import sys
12
13sys.path.append(os.environ['PERF_EXEC_PATH'] + \
14 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
15
16from Core import *
17from perf_trace_context import *
18
19unhandled = autodict()
20
21def trace_begin():
22 print "trace_begin"
23 pass
24
def trace_end():
	"""Print the table of events that had no dedicated handler."""
	print_unhandled()
27
28def irq__softirq_entry(event_name, context, common_cpu,
29 common_secs, common_nsecs, common_pid, common_comm,
30 vec):
31 print_header(event_name, common_cpu, common_secs, common_nsecs,
32 common_pid, common_comm)
33
34 print_uncommon(context)
35
36 print "vec=%s\n" % \
37 (symbol_str("irq__softirq_entry", "vec", vec)),
38
39def kmem__kmalloc(event_name, context, common_cpu,
40 common_secs, common_nsecs, common_pid, common_comm,
41 call_site, ptr, bytes_req, bytes_alloc,
42 gfp_flags):
43 print_header(event_name, common_cpu, common_secs, common_nsecs,
44 common_pid, common_comm)
45
46 print_uncommon(context)
47
48 print "call_site=%u, ptr=%u, bytes_req=%u, " \
49 "bytes_alloc=%u, gfp_flags=%s\n" % \
50 (call_site, ptr, bytes_req, bytes_alloc,
51
52 flag_str("kmem__kmalloc", "gfp_flags", gfp_flags)),
53
def trace_unhandled(event_name, context, event_fields_dict):
	"""Count one occurrence of an event that has no dedicated handler."""
	try:
		count = unhandled[event_name] + 1
	except TypeError:
		# first occurrence: the autodict returned a nested dict, not a number
		count = 1
	unhandled[event_name] = count
59
60def print_header(event_name, cpu, secs, nsecs, pid, comm):
61 print "%-20s %5u %05u.%09u %8u %-20s " % \
62 (event_name, cpu, secs, nsecs, pid, comm),
63
64# print trace fields not included in handler args
65def print_uncommon(context):
66 print "common_preempt_count=%d, common_flags=%s, common_lock_depth=%d, " \
67 % (common_pc(context), trace_flag_str(common_flags(context)), \
68 common_lock_depth(context))
69
70def print_unhandled():
71 keys = unhandled.keys()
72 if not keys:
73 return
74
75 print "\nunhandled events:\n\n",
76
77 print "%-40s %10s\n" % ("event", "count"),
78 print "%-40s %10s\n" % ("----------------------------------------", \
79 "-----------"),
80
81 for event_name in keys:
82 print "%-40s %10d\n" % (event_name, unhandled[event_name])
diff --git a/tools/perf/scripts/python/failed-syscalls-by-pid.py b/tools/perf/scripts/python/failed-syscalls-by-pid.py
new file mode 100644
index 000000000000..0ca02278fe69
--- /dev/null
+++ b/tools/perf/scripts/python/failed-syscalls-by-pid.py
@@ -0,0 +1,68 @@
1# failed system call counts, by pid
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# Displays system-wide failed system call totals, broken down by pid.
6# If a [comm] arg is specified, only syscalls called by [comm] are displayed.
7
8import os
9import sys
10
11sys.path.append(os.environ['PERF_EXEC_PATH'] + \
12 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
13
14from perf_trace_context import *
15from Core import *
16
# Usage text; it names this script (it used to name syscall-counts-by-pid.py).
usage = "perf trace -s failed-syscalls-by-pid.py [comm]\n"

# When set, only events whose comm equals this string are counted.
for_comm = None

if len(sys.argv) > 2:
	sys.exit(usage)

if len(sys.argv) > 1:
	for_comm = sys.argv[1]

# syscalls[comm][pid][syscall id][return value] -> count
syscalls = autodict()
28
def trace_begin():
	"""Nothing to set up before the first event."""
31
def trace_end():
	"""Print the collected error totals."""
	print_error_totals()
34
def raw_syscalls__sys_exit(event_name, context, common_cpu,
	common_secs, common_nsecs, common_pid, common_comm,
	id, ret):
	"""Count a syscall exit with a negative return value, per comm/pid/id/ret."""
	if for_comm is not None and common_comm != for_comm:
		return

	# only negative return values are counted
	if not ret < 0:
		return

	per_syscall = syscalls[common_comm][common_pid][id]
	try:
		per_syscall[ret] += 1
	except TypeError:
		# first occurrence: the autodict returned a nested dict, not a number
		per_syscall[ret] = 1
47
48def print_error_totals():
49 if for_comm is not None:
50 print "\nsyscall errors for %s:\n\n" % (for_comm),
51 else:
52 print "\nsyscall errors:\n\n",
53
54 print "%-30s %10s\n" % ("comm [pid]", "count"),
55 print "%-30s %10s\n" % ("------------------------------", \
56 "----------"),
57
58 comm_keys = syscalls.keys()
59 for comm in comm_keys:
60 pid_keys = syscalls[comm].keys()
61 for pid in pid_keys:
62 print "\n%s [%d]\n" % (comm, pid),
63 id_keys = syscalls[comm][pid].keys()
64 for id in id_keys:
65 print " syscall: %-16d\n" % (id),
66 ret_keys = syscalls[comm][pid][id].keys()
67 for ret, val in sorted(syscalls[comm][pid][id].iteritems(), key = lambda(k, v): (v, k), reverse = True):
68 print " err = %-20d %10d\n" % (ret, val),
diff --git a/tools/perf/scripts/python/sctop.py b/tools/perf/scripts/python/sctop.py
new file mode 100644
index 000000000000..6cafad40c296
--- /dev/null
+++ b/tools/perf/scripts/python/sctop.py
@@ -0,0 +1,78 @@
1# system call top
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# Periodically displays system-wide system call totals, broken down by
6# syscall. If a [comm] arg is specified, only syscalls called by
7# [comm] are displayed. If an [interval] arg is specified, the display
8# will be refreshed every [interval] seconds. The default interval is
9# 3 seconds.
10
11import thread
12import time
13import os
14import sys
15
16sys.path.append(os.environ['PERF_EXEC_PATH'] + \
17 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
18
19from perf_trace_context import *
20from Core import *
21from Util import *
22
# Usage text; it names this script (it used to name syscall-counts.py).
usage = "perf trace -s sctop.py [comm] [interval]\n"

# When set, only events whose comm equals this string are counted.
for_comm = None
default_interval = 3
interval = default_interval

if len(sys.argv) > 3:
	sys.exit(usage)

if len(sys.argv) > 2:
	for_comm = sys.argv[1]
	try:
		interval = int(sys.argv[2])
	except ValueError:
		# a non-numeric interval used to end in an unhandled ValueError
		sys.exit(usage)
elif len(sys.argv) > 1:
	# a single argument is the interval if it parses as an integer,
	# otherwise it is the comm filter
	try:
		interval = int(sys.argv[1])
	except ValueError:
		for_comm = sys.argv[1]
		interval = default_interval

# syscalls[syscall id] -> count
syscalls = autodict()
43
def trace_begin():
	"""Start the thread that runs print_syscall_totals with the interval."""
	thread.start_new_thread(print_syscall_totals, (interval,))
47
def raw_syscalls__sys_enter(event_name, context, common_cpu,
	common_secs, common_nsecs, common_pid, common_comm,
	id, args):
	"""Count one syscall entry under its syscall id."""
	if for_comm is not None and common_comm != for_comm:
		return

	try:
		count = syscalls[id] + 1
	except TypeError:
		# first occurrence: the autodict returned a nested dict, not a number
		count = 1
	syscalls[id] = count
58
59def print_syscall_totals(interval):
60 while 1:
61 clear_term()
62 if for_comm is not None:
63 print "\nsyscall events for %s:\n\n" % (for_comm),
64 else:
65 print "\nsyscall events:\n\n",
66
67 print "%-40s %10s\n" % ("event", "count"),
68 print "%-40s %10s\n" % ("----------------------------------------", \
69 "----------"),
70
71 for id, val in sorted(syscalls.iteritems(), key = lambda(k, v): (v, k), \
72 reverse = True):
73 try:
74 print "%-40d %10d\n" % (id, val),
75 except TypeError:
76 pass
77 syscalls.clear()
78 time.sleep(interval)
diff --git a/tools/perf/scripts/python/syscall-counts-by-pid.py b/tools/perf/scripts/python/syscall-counts-by-pid.py
new file mode 100644
index 000000000000..af722d6a4b3f
--- /dev/null
+++ b/tools/perf/scripts/python/syscall-counts-by-pid.py
@@ -0,0 +1,64 @@
1# system call counts, by pid
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# Displays system-wide system call totals, broken down by comm/pid and syscall.
6# If a [comm] arg is specified, only syscalls called by [comm] are displayed.
7
8import os
9import sys
10
11sys.path.append(os.environ['PERF_EXEC_PATH'] + \
12 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
13
14from perf_trace_context import *
15from Core import *
16
usage = "perf trace -s syscall-counts-by-pid.py [comm]\n"

if len(sys.argv) > 2:
	sys.exit(usage)

# Optional single argument: count only events whose comm equals it.
for_comm = sys.argv[1] if len(sys.argv) > 1 else None

# syscalls[comm][pid][syscall id] -> count
syscalls = autodict()
28
def trace_begin():
	"""Nothing to set up before the first event."""
31
def trace_end():
	"""Print the collected syscall totals."""
	print_syscall_totals()
34
def raw_syscalls__sys_enter(event_name, context, common_cpu,
	common_secs, common_nsecs, common_pid, common_comm,
	id, args):
	"""Count one syscall entry under its comm, pid and syscall id."""
	if for_comm is not None and common_comm != for_comm:
		return

	per_pid = syscalls[common_comm][common_pid]
	try:
		per_pid[id] += 1
	except TypeError:
		# first occurrence: the autodict returned a nested dict, not a number
		per_pid[id] = 1
45
46def print_syscall_totals():
47 if for_comm is not None:
48 print "\nsyscall events for %s:\n\n" % (for_comm),
49 else:
50 print "\nsyscall events by comm/pid:\n\n",
51
52 print "%-40s %10s\n" % ("comm [pid]/syscalls", "count"),
53 print "%-40s %10s\n" % ("----------------------------------------", \
54 "----------"),
55
56 comm_keys = syscalls.keys()
57 for comm in comm_keys:
58 pid_keys = syscalls[comm].keys()
59 for pid in pid_keys:
60 print "\n%s [%d]\n" % (comm, pid),
61 id_keys = syscalls[comm][pid].keys()
62 for id, val in sorted(syscalls[comm][pid].iteritems(), \
63 key = lambda(k, v): (v, k), reverse = True):
64 print " %-38d %10d\n" % (id, val),
diff --git a/tools/perf/scripts/python/syscall-counts.py b/tools/perf/scripts/python/syscall-counts.py
new file mode 100644
index 000000000000..f977e85ff049
--- /dev/null
+++ b/tools/perf/scripts/python/syscall-counts.py
@@ -0,0 +1,58 @@
1# system call counts
2# (c) 2010, Tom Zanussi <tzanussi@gmail.com>
3# Licensed under the terms of the GNU GPL License version 2
4#
5# Displays system-wide system call totals, broken down by syscall.
6# If a [comm] arg is specified, only syscalls called by [comm] are displayed.
7
8import os
9import sys
10
11sys.path.append(os.environ['PERF_EXEC_PATH'] + \
12 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
13
14from perf_trace_context import *
15from Core import *
16
usage = "perf trace -s syscall-counts.py [comm]\n"

if len(sys.argv) > 2:
	sys.exit(usage)

# Optional single argument: count only events whose comm equals it.
for_comm = sys.argv[1] if len(sys.argv) > 1 else None

# syscalls[syscall id] -> count
syscalls = autodict()
28
def trace_begin():
	"""Nothing to set up before the first event."""
31
def trace_end():
	"""Print the collected syscall totals."""
	print_syscall_totals()
34
def raw_syscalls__sys_enter(event_name, context, common_cpu,
	common_secs, common_nsecs, common_pid, common_comm,
	id, args):
	"""Count one syscall entry under its syscall id."""
	if for_comm is not None and common_comm != for_comm:
		return

	try:
		count = syscalls[id] + 1
	except TypeError:
		# first occurrence: the autodict returned a nested dict, not a number
		count = 1
	syscalls[id] = count
45
46def print_syscall_totals():
47 if for_comm is not None:
48 print "\nsyscall events for %s:\n\n" % (for_comm),
49 else:
50 print "\nsyscall events:\n\n",
51
52 print "%-40s %10s\n" % ("event", "count"),
53 print "%-40s %10s\n" % ("----------------------------------------", \
54 "-----------"),
55
56 for id, val in sorted(syscalls.iteritems(), key = lambda(k, v): (v, k), \
57 reverse = True):
58 print "%-40d %10d\n" % (id, val),
diff --git a/tools/perf/util/PERF-VERSION-GEN b/tools/perf/util/PERF-VERSION-GEN
index 54552a00a117..97d76562a1a0 100755
--- a/tools/perf/util/PERF-VERSION-GEN
+++ b/tools/perf/util/PERF-VERSION-GEN
@@ -1,17 +1,17 @@
1#!/bin/sh 1#!/bin/sh
2 2
3GVF=PERF-VERSION-FILE 3if [ $# -eq 1 ] ; then
4DEF_VER=v0.0.2.PERF 4 OUTPUT=$1
5fi
6
7GVF=${OUTPUT}PERF-VERSION-FILE
5 8
6LF=' 9LF='
7' 10'
8 11
9# First see if there is a version file (included in release tarballs), 12# First check if there is a .git to get the version from git describe
10# then try git-describe, then default. 13# otherwise try to get the version from the kernel makefile
11if test -f version 14if test -d ../../.git -o -f ../../.git &&
12then
13 VN=$(cat version) || VN="$DEF_VER"
14elif test -d .git -o -f .git &&
15 VN=$(git describe --abbrev=4 HEAD 2>/dev/null) && 15 VN=$(git describe --abbrev=4 HEAD 2>/dev/null) &&
16 case "$VN" in 16 case "$VN" in
17 *$LF*) (exit 1) ;; 17 *$LF*) (exit 1) ;;
@@ -23,7 +23,12 @@ elif test -d .git -o -f .git &&
23then 23then
24 VN=$(echo "$VN" | sed -e 's/-/./g'); 24 VN=$(echo "$VN" | sed -e 's/-/./g');
25else 25else
26 VN="$DEF_VER" 26 eval `grep '^VERSION\s*=' ../../Makefile|tr -d ' '`
27 eval `grep '^PATCHLEVEL\s*=' ../../Makefile|tr -d ' '`
28 eval `grep '^SUBLEVEL\s*=' ../../Makefile|tr -d ' '`
29 eval `grep '^EXTRAVERSION\s*=' ../../Makefile|tr -d ' '`
30
31 VN="${VERSION}.${PATCHLEVEL}.${SUBLEVEL}${EXTRAVERSION}"
27fi 32fi
28 33
29VN=$(expr "$VN" : v*'\(.*\)') 34VN=$(expr "$VN" : v*'\(.*\)')
diff --git a/tools/perf/util/abspath.c b/tools/perf/util/abspath.c
index a791dd467261..0e76affe9c36 100644
--- a/tools/perf/util/abspath.c
+++ b/tools/perf/util/abspath.c
@@ -1,86 +1,5 @@
1#include "cache.h" 1#include "cache.h"
2 2
3/*
4 * Do not use this for inspecting *tracked* content. When path is a
5 * symlink to a directory, we do not want to say it is a directory when
6 * dealing with tracked content in the working tree.
7 */
8static int is_directory(const char *path)
9{
10 struct stat st;
11 return (!stat(path, &st) && S_ISDIR(st.st_mode));
12}
13
14/* We allow "recursive" symbolic links. Only within reason, though. */
15#define MAXDEPTH 5
16
17const char *make_absolute_path(const char *path)
18{
19 static char bufs[2][PATH_MAX + 1], *buf = bufs[0], *next_buf = bufs[1];
20 char cwd[1024] = "";
21 int buf_index = 1, len;
22
23 int depth = MAXDEPTH;
24 char *last_elem = NULL;
25 struct stat st;
26
27 if (strlcpy(buf, path, PATH_MAX) >= PATH_MAX)
28 die ("Too long path: %.*s", 60, path);
29
30 while (depth--) {
31 if (!is_directory(buf)) {
32 char *last_slash = strrchr(buf, '/');
33 if (last_slash) {
34 *last_slash = '\0';
35 last_elem = xstrdup(last_slash + 1);
36 } else {
37 last_elem = xstrdup(buf);
38 *buf = '\0';
39 }
40 }
41
42 if (*buf) {
43 if (!*cwd && !getcwd(cwd, sizeof(cwd)))
44 die ("Could not get current working directory");
45
46 if (chdir(buf))
47 die ("Could not switch to '%s'", buf);
48 }
49 if (!getcwd(buf, PATH_MAX))
50 die ("Could not get current working directory");
51
52 if (last_elem) {
53 len = strlen(buf);
54
55 if (len + strlen(last_elem) + 2 > PATH_MAX)
56 die ("Too long path name: '%s/%s'",
57 buf, last_elem);
58 buf[len] = '/';
59 strcpy(buf + len + 1, last_elem);
60 free(last_elem);
61 last_elem = NULL;
62 }
63
64 if (!lstat(buf, &st) && S_ISLNK(st.st_mode)) {
65 len = readlink(buf, next_buf, PATH_MAX);
66 if (len < 0)
67 die ("Invalid symlink: %s", buf);
68 if (PATH_MAX <= len)
69 die("symbolic link too long: %s", buf);
70 next_buf[len] = '\0';
71 buf = next_buf;
72 buf_index = 1 - buf_index;
73 next_buf = bufs[buf_index];
74 } else
75 break;
76 }
77
78 if (*cwd && chdir(cwd))
79 die ("Could not change back to '%s'", cwd);
80
81 return buf;
82}
83
84static const char *get_pwd_cwd(void) 3static const char *get_pwd_cwd(void)
85{ 4{
86 static char cwd[PATH_MAX + 1]; 5 static char cwd[PATH_MAX + 1];
diff --git a/tools/perf/util/bitmap.c b/tools/perf/util/bitmap.c
new file mode 100644
index 000000000000..5e230acae1e9
--- /dev/null
+++ b/tools/perf/util/bitmap.c
@@ -0,0 +1,21 @@
1/*
2 * From lib/bitmap.c
3 * Helper functions for bitmap.h.
4 *
5 * This source code is licensed under the GNU General Public License,
6 * Version 2. See the file COPYING for more details.
7 */
8#include <linux/bitmap.h>
9
10int __bitmap_weight(const unsigned long *bitmap, int bits)
11{
12 int k, w = 0, lim = bits/BITS_PER_LONG;
13
14 for (k = 0; k < lim; k++)
15 w += hweight_long(bitmap[k]);
16
17 if (bits % BITS_PER_LONG)
18 w += hweight_long(bitmap[k] & BITMAP_LAST_WORD_MASK(bits));
19
20 return w;
21}
diff --git a/tools/perf/util/build-id.c b/tools/perf/util/build-id.c
new file mode 100644
index 000000000000..70c5cf87d020
--- /dev/null
+++ b/tools/perf/util/build-id.c
@@ -0,0 +1,61 @@
1/*
2 * build-id.c
3 *
4 * build-id support
5 *
6 * Copyright (C) 2009, 2010 Red Hat Inc.
7 * Copyright (C) 2009, 2010 Arnaldo Carvalho de Melo <acme@redhat.com>
8 */
9#include "util.h"
10#include <stdio.h>
11#include "build-id.h"
12#include "event.h"
13#include "symbol.h"
14#include <linux/kernel.h>
15
16static int build_id__mark_dso_hit(event_t *event, struct perf_session *session)
17{
18 struct addr_location al;
19 u8 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
20 struct thread *thread = perf_session__findnew(session, event->ip.pid);
21
22 if (thread == NULL) {
23 pr_err("problem processing %d event, skipping it.\n",
24 event->header.type);
25 return -1;
26 }
27
28 thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION,
29 event->ip.pid, event->ip.ip, &al);
30
31 if (al.map != NULL)
32 al.map->dso->hit = 1;
33
34 return 0;
35}
36
37struct perf_event_ops build_id__mark_dso_hit_ops = {
38 .sample = build_id__mark_dso_hit,
39 .mmap = event__process_mmap,
40 .fork = event__process_task,
41};
42
43char *dso__build_id_filename(struct dso *self, char *bf, size_t size)
44{
45 char build_id_hex[BUILD_ID_SIZE * 2 + 1];
46 const char *home;
47
48 if (!self->has_build_id)
49 return NULL;
50
51 build_id__sprintf(self->build_id, sizeof(self->build_id), build_id_hex);
52 home = getenv("HOME");
53 if (bf == NULL) {
54 if (asprintf(&bf, "%s/%s/.build-id/%.2s/%s", home,
55 DEBUG_CACHE_DIR, build_id_hex, build_id_hex + 2) < 0)
56 return NULL;
57 } else
58 snprintf(bf, size, "%s/%s/.build-id/%.2s/%s", home,
59 DEBUG_CACHE_DIR, build_id_hex, build_id_hex + 2);
60 return bf;
61}
diff --git a/tools/perf/util/build-id.h b/tools/perf/util/build-id.h
new file mode 100644
index 000000000000..5dafb00eaa06
--- /dev/null
+++ b/tools/perf/util/build-id.h
@@ -0,0 +1,10 @@
1#ifndef PERF_BUILD_ID_H_
2#define PERF_BUILD_ID_H_ 1
3
4#include "session.h"
5
6extern struct perf_event_ops build_id__mark_dso_hit_ops;
7
8char *dso__build_id_filename(struct dso *self, char *bf, size_t size);
9
10#endif
diff --git a/tools/perf/util/cache.h b/tools/perf/util/cache.h
index 918eb376abe3..65fe664fddf6 100644
--- a/tools/perf/util/cache.h
+++ b/tools/perf/util/cache.h
@@ -1,6 +1,7 @@
1#ifndef __PERF_CACHE_H 1#ifndef __PERF_CACHE_H
2#define __PERF_CACHE_H 2#define __PERF_CACHE_H
3 3
4#include <stdbool.h>
4#include "util.h" 5#include "util.h"
5#include "strbuf.h" 6#include "strbuf.h"
6#include "../perf.h" 7#include "../perf.h"
@@ -12,56 +13,16 @@
12 13
13#define PERF_DIR_ENVIRONMENT "PERF_DIR" 14#define PERF_DIR_ENVIRONMENT "PERF_DIR"
14#define PERF_WORK_TREE_ENVIRONMENT "PERF_WORK_TREE" 15#define PERF_WORK_TREE_ENVIRONMENT "PERF_WORK_TREE"
15#define DEFAULT_PERF_DIR_ENVIRONMENT ".perf"
16#define DB_ENVIRONMENT "PERF_OBJECT_DIRECTORY"
17#define INDEX_ENVIRONMENT "PERF_INDEX_FILE"
18#define GRAFT_ENVIRONMENT "PERF_GRAFT_FILE"
19#define TEMPLATE_DIR_ENVIRONMENT "PERF_TEMPLATE_DIR"
20#define CONFIG_ENVIRONMENT "PERF_CONFIG"
21#define EXEC_PATH_ENVIRONMENT "PERF_EXEC_PATH" 16#define EXEC_PATH_ENVIRONMENT "PERF_EXEC_PATH"
22#define CEILING_DIRECTORIES_ENVIRONMENT "PERF_CEILING_DIRECTORIES" 17#define DEFAULT_PERF_DIR_ENVIRONMENT ".perf"
23#define PERFATTRIBUTES_FILE ".perfattributes"
24#define INFOATTRIBUTES_FILE "info/attributes"
25#define ATTRIBUTE_MACRO_PREFIX "[attr]"
26#define PERF_DEBUGFS_ENVIRONMENT "PERF_DEBUGFS_DIR" 18#define PERF_DEBUGFS_ENVIRONMENT "PERF_DEBUGFS_DIR"
27 19
28typedef int (*config_fn_t)(const char *, const char *, void *); 20typedef int (*config_fn_t)(const char *, const char *, void *);
29extern int perf_default_config(const char *, const char *, void *); 21extern int perf_default_config(const char *, const char *, void *);
30extern int perf_config_from_file(config_fn_t fn, const char *, void *);
31extern int perf_config(config_fn_t fn, void *); 22extern int perf_config(config_fn_t fn, void *);
32extern int perf_parse_ulong(const char *, unsigned long *);
33extern int perf_config_int(const char *, const char *); 23extern int perf_config_int(const char *, const char *);
34extern unsigned long perf_config_ulong(const char *, const char *);
35extern int perf_config_bool_or_int(const char *, const char *, int *);
36extern int perf_config_bool(const char *, const char *); 24extern int perf_config_bool(const char *, const char *);
37extern int perf_config_string(const char **, const char *, const char *);
38extern int perf_config_set(const char *, const char *);
39extern int perf_config_set_multivar(const char *, const char *, const char *, int);
40extern int perf_config_rename_section(const char *, const char *);
41extern const char *perf_etc_perfconfig(void);
42extern int check_repository_format_version(const char *var, const char *value, void *cb);
43extern int perf_config_system(void);
44extern int perf_config_global(void);
45extern int config_error_nonbool(const char *); 25extern int config_error_nonbool(const char *);
46extern const char *config_exclusive_filename;
47
48#define MAX_PERFNAME (1000)
49extern char perf_default_email[MAX_PERFNAME];
50extern char perf_default_name[MAX_PERFNAME];
51extern int user_ident_explicitly_given;
52
53extern const char *perf_log_output_encoding;
54extern const char *perf_mailmap_file;
55
56/* IO helper functions */
57extern void maybe_flush_or_die(FILE *, const char *);
58extern int copy_fd(int ifd, int ofd);
59extern int copy_file(const char *dst, const char *src, int mode);
60extern ssize_t write_in_full(int fd, const void *buf, size_t count);
61extern void write_or_die(int fd, const void *buf, size_t count);
62extern int write_or_whine(int fd, const void *buf, size_t count, const char *msg);
63extern int write_or_whine_pipe(int fd, const void *buf, size_t count, const char *msg);
64extern void fsync_or_die(int fd, const char *);
65 26
66/* pager.c */ 27/* pager.c */
67extern void setup_pager(void); 28extern void setup_pager(void);
@@ -69,8 +30,18 @@ extern const char *pager_program;
69extern int pager_in_use(void); 30extern int pager_in_use(void);
70extern int pager_use_color; 31extern int pager_use_color;
71 32
72extern const char *editor_program; 33extern int use_browser;
73extern const char *excludes_file; 34
/*
 * When NO_NEWT_SUPPORT is defined, setup_browser() simply calls
 * setup_pager() and exit_browser() does nothing. Otherwise both functions
 * are only declared here; their definitions are not visible in this header.
 */
35#ifdef NO_NEWT_SUPPORT
36static inline void setup_browser(void)
37{
38 setup_pager();
39}
40static inline void exit_browser(bool wait_for_ok __used) {}
41#else
42void setup_browser(void);
43void exit_browser(bool wait_for_ok);
44#endif
74 45
75char *alias_lookup(const char *alias); 46char *alias_lookup(const char *alias);
76int split_cmdline(char *cmdline, const char ***argv); 47int split_cmdline(char *cmdline, const char ***argv);
@@ -101,22 +72,12 @@ static inline int is_absolute_path(const char *path)
101 return path[0] == '/'; 72 return path[0] == '/';
102} 73}
103 74
104const char *make_absolute_path(const char *path);
105const char *make_nonrelative_path(const char *path); 75const char *make_nonrelative_path(const char *path);
106const char *make_relative_path(const char *abs, const char *base);
107int normalize_path_copy(char *dst, const char *src);
108int longest_ancestor_length(const char *path, const char *prefix_list);
109char *strip_path_suffix(const char *path, const char *suffix); 76char *strip_path_suffix(const char *path, const char *suffix);
110 77
111extern char *mkpath(const char *fmt, ...) __attribute__((format (printf, 1, 2))); 78extern char *mkpath(const char *fmt, ...) __attribute__((format (printf, 1, 2)));
112extern char *perf_path(const char *fmt, ...) __attribute__((format (printf, 1, 2))); 79extern char *perf_path(const char *fmt, ...) __attribute__((format (printf, 1, 2)));
113/* perf_mkstemp() - create tmp file honoring TMPDIR variable */
114extern int perf_mkstemp(char *path, size_t len, const char *template);
115 80
116extern char *mksnpath(char *buf, size_t n, const char *fmt, ...)
117 __attribute__((format (printf, 3, 4)));
118extern char *perf_snpath(char *buf, size_t n, const char *fmt, ...)
119 __attribute__((format (printf, 3, 4)));
120extern char *perf_pathdup(const char *fmt, ...) 81extern char *perf_pathdup(const char *fmt, ...)
121 __attribute__((format (printf, 1, 2))); 82 __attribute__((format (printf, 1, 2)));
122 83
diff --git a/tools/perf/util/callchain.c b/tools/perf/util/callchain.c
index b3b71258272a..52c777e451ed 100644
--- a/tools/perf/util/callchain.c
+++ b/tools/perf/util/callchain.c
@@ -1,5 +1,5 @@
1/* 1/*
2 * Copyright (C) 2009, Frederic Weisbecker <fweisbec@gmail.com> 2 * Copyright (C) 2009-2010, Frederic Weisbecker <fweisbec@gmail.com>
3 * 3 *
4 * Handle the callchains from the stream in an ad-hoc radix tree and then 4 * Handle the callchains from the stream in an ad-hoc radix tree and then
5 * sort them in an rbtree. 5 * sort them in an rbtree.
@@ -15,8 +15,16 @@
15#include <errno.h> 15#include <errno.h>
16#include <math.h> 16#include <math.h>
17 17
18#include "util.h"
18#include "callchain.h" 19#include "callchain.h"
19 20
21bool ip_callchain__valid(struct ip_callchain *chain, event_t *event)
22{
23 unsigned int chain_size = event->header.size;
24 chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event;
25 return chain->nr * sizeof(u64) <= chain_size;
26}
27
20#define chain_for_each_child(child, parent) \ 28#define chain_for_each_child(child, parent) \
21 list_for_each_entry(child, &parent->children, brothers) 29 list_for_each_entry(child, &parent->children, brothers)
22 30
@@ -160,7 +168,7 @@ create_child(struct callchain_node *parent, bool inherit_children)
160{ 168{
161 struct callchain_node *new; 169 struct callchain_node *new;
162 170
163 new = malloc(sizeof(*new)); 171 new = zalloc(sizeof(*new));
164 if (!new) { 172 if (!new) {
165 perror("not enough memory to create child for code path tree"); 173 perror("not enough memory to create child for code path tree");
166 return NULL; 174 return NULL;
@@ -183,25 +191,36 @@ create_child(struct callchain_node *parent, bool inherit_children)
183 return new; 191 return new;
184} 192}
185 193
194
/*
 * One callchain entry: the raw instruction pointer together with the
 * map/symbol pair that filter_context() copies from the caller-supplied
 * syms array for that entry.
 */
195struct resolved_ip {
196 u64 ip;
197 struct map_symbol ms;
198};
199
/*
 * Callchain as produced by filter_context(): nr is the number of entries
 * stored in ips[], which is trailing storage allocated together with the
 * struct (see append_chain()).
 */
200struct resolved_chain {
201 u64 nr;
202 struct resolved_ip ips[0];
203};
204
205
186/* 206/*
187 * Fill the node with callchain values 207 * Fill the node with callchain values
188 */ 208 */
189static void 209static void
190fill_node(struct callchain_node *node, struct ip_callchain *chain, 210fill_node(struct callchain_node *node, struct resolved_chain *chain, int start)
191 int start, struct symbol **syms)
192{ 211{
193 unsigned int i; 212 unsigned int i;
194 213
195 for (i = start; i < chain->nr; i++) { 214 for (i = start; i < chain->nr; i++) {
196 struct callchain_list *call; 215 struct callchain_list *call;
197 216
198 call = malloc(sizeof(*call)); 217 call = zalloc(sizeof(*call));
199 if (!call) { 218 if (!call) {
200 perror("not enough memory for the code path tree"); 219 perror("not enough memory for the code path tree");
201 return; 220 return;
202 } 221 }
203 call->ip = chain->ips[i]; 222 call->ip = chain->ips[i].ip;
204 call->sym = syms[i]; 223 call->ms = chain->ips[i].ms;
205 list_add_tail(&call->list, &node->val); 224 list_add_tail(&call->list, &node->val);
206 } 225 }
207 node->val_nr = chain->nr - start; 226 node->val_nr = chain->nr - start;
@@ -210,16 +229,16 @@ fill_node(struct callchain_node *node, struct ip_callchain *chain,
210} 229}
211 230
212static void 231static void
213add_child(struct callchain_node *parent, struct ip_callchain *chain, 232add_child(struct callchain_node *parent, struct resolved_chain *chain,
214 int start, struct symbol **syms) 233 int start, u64 period)
215{ 234{
216 struct callchain_node *new; 235 struct callchain_node *new;
217 236
218 new = create_child(parent, false); 237 new = create_child(parent, false);
219 fill_node(new, chain, start, syms); 238 fill_node(new, chain, start);
220 239
221 new->children_hit = 0; 240 new->children_hit = 0;
222 new->hit = 1; 241 new->hit = period;
223} 242}
224 243
225/* 244/*
@@ -228,9 +247,9 @@ add_child(struct callchain_node *parent, struct ip_callchain *chain,
228 * Then create another child to host the given callchain of new branch 247 * Then create another child to host the given callchain of new branch
229 */ 248 */
230static void 249static void
231split_add_child(struct callchain_node *parent, struct ip_callchain *chain, 250split_add_child(struct callchain_node *parent, struct resolved_chain *chain,
232 struct callchain_list *to_split, int idx_parents, int idx_local, 251 struct callchain_list *to_split, int idx_parents, int idx_local,
233 struct symbol **syms) 252 u64 period)
234{ 253{
235 struct callchain_node *new; 254 struct callchain_node *new;
236 struct list_head *old_tail; 255 struct list_head *old_tail;
@@ -257,40 +276,41 @@ split_add_child(struct callchain_node *parent, struct ip_callchain *chain,
257 /* create a new child for the new branch if any */ 276 /* create a new child for the new branch if any */
258 if (idx_total < chain->nr) { 277 if (idx_total < chain->nr) {
259 parent->hit = 0; 278 parent->hit = 0;
260 add_child(parent, chain, idx_total, syms); 279 add_child(parent, chain, idx_total, period);
261 parent->children_hit++; 280 parent->children_hit += period;
262 } else { 281 } else {
263 parent->hit = 1; 282 parent->hit = period;
264 } 283 }
265} 284}
266 285
267static int 286static int
268__append_chain(struct callchain_node *root, struct ip_callchain *chain, 287__append_chain(struct callchain_node *root, struct resolved_chain *chain,
269 unsigned int start, struct symbol **syms); 288 unsigned int start, u64 period);
270 289
271static void 290static void
272__append_chain_children(struct callchain_node *root, struct ip_callchain *chain, 291__append_chain_children(struct callchain_node *root,
273 struct symbol **syms, unsigned int start) 292 struct resolved_chain *chain,
293 unsigned int start, u64 period)
274{ 294{
275 struct callchain_node *rnode; 295 struct callchain_node *rnode;
276 296
277 /* lookup in childrens */ 297 /* lookup in childrens */
278 chain_for_each_child(rnode, root) { 298 chain_for_each_child(rnode, root) {
279 unsigned int ret = __append_chain(rnode, chain, start, syms); 299 unsigned int ret = __append_chain(rnode, chain, start, period);
280 300
281 if (!ret) 301 if (!ret)
282 goto inc_children_hit; 302 goto inc_children_hit;
283 } 303 }
284 /* nothing in children, add to the current node */ 304 /* nothing in children, add to the current node */
285 add_child(root, chain, start, syms); 305 add_child(root, chain, start, period);
286 306
287inc_children_hit: 307inc_children_hit:
288 root->children_hit++; 308 root->children_hit += period;
289} 309}
290 310
291static int 311static int
292__append_chain(struct callchain_node *root, struct ip_callchain *chain, 312__append_chain(struct callchain_node *root, struct resolved_chain *chain,
293 unsigned int start, struct symbol **syms) 313 unsigned int start, u64 period)
294{ 314{
295 struct callchain_list *cnode; 315 struct callchain_list *cnode;
296 unsigned int i = start; 316 unsigned int i = start;
@@ -302,13 +322,19 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain,
302 * anywhere inside a function. 322 * anywhere inside a function.
303 */ 323 */
304 list_for_each_entry(cnode, &root->val, list) { 324 list_for_each_entry(cnode, &root->val, list) {
325 struct symbol *sym;
326
305 if (i == chain->nr) 327 if (i == chain->nr)
306 break; 328 break;
307 if (cnode->sym && syms[i]) { 329
308 if (cnode->sym->start != syms[i]->start) 330 sym = chain->ips[i].ms.sym;
331
332 if (cnode->ms.sym && sym) {
333 if (cnode->ms.sym->start != sym->start)
309 break; 334 break;
310 } else if (cnode->ip != chain->ips[i]) 335 } else if (cnode->ip != chain->ips[i].ip)
311 break; 336 break;
337
312 if (!found) 338 if (!found)
313 found = true; 339 found = true;
314 i++; 340 i++;
@@ -320,26 +346,61 @@ __append_chain(struct callchain_node *root, struct ip_callchain *chain,
320 346
321 /* we match only a part of the node. Split it and add the new chain */ 347 /* we match only a part of the node. Split it and add the new chain */
322 if (i - start < root->val_nr) { 348 if (i - start < root->val_nr) {
323 split_add_child(root, chain, cnode, start, i - start, syms); 349 split_add_child(root, chain, cnode, start, i - start, period);
324 return 0; 350 return 0;
325 } 351 }
326 352
327 /* we match 100% of the path, increment the hit */ 353 /* we match 100% of the path, increment the hit */
328 if (i - start == root->val_nr && i == chain->nr) { 354 if (i - start == root->val_nr && i == chain->nr) {
329 root->hit++; 355 root->hit += period;
330 return 0; 356 return 0;
331 } 357 }
332 358
333 /* We match the node and still have a part remaining */ 359 /* We match the node and still have a part remaining */
334 __append_chain_children(root, chain, syms, i); 360 __append_chain_children(root, chain, i, period);
335 361
336 return 0; 362 return 0;
337} 363}
338 364
339void append_chain(struct callchain_node *root, struct ip_callchain *chain, 365static void filter_context(struct ip_callchain *old, struct resolved_chain *new,
340 struct symbol **syms) 366 struct map_symbol *syms)
341{ 367{
368 int i, j = 0;
369
370 for (i = 0; i < (int)old->nr; i++) {
371 if (old->ips[i] >= PERF_CONTEXT_MAX)
372 continue;
373
374 new->ips[j].ip = old->ips[i];
375 new->ips[j].ms = syms[i];
376 j++;
377 }
378
379 new->nr = j;
380}
381
382
383int append_chain(struct callchain_node *root, struct ip_callchain *chain,
384 struct map_symbol *syms, u64 period)
385{
386 struct resolved_chain *filtered;
387
342 if (!chain->nr) 388 if (!chain->nr)
343 return; 389 return 0;
344 __append_chain_children(root, chain, syms, 0); 390
391 filtered = zalloc(sizeof(*filtered) +
392 chain->nr * sizeof(struct resolved_ip));
393 if (!filtered)
394 return -ENOMEM;
395
396 filter_context(chain, filtered, syms);
397
398 if (!filtered->nr)
399 goto end;
400
401 __append_chain_children(root, filtered, 0, period);
402end:
403 free(filtered);
404
405 return 0;
345} 406}
diff --git a/tools/perf/util/callchain.h b/tools/perf/util/callchain.h
index ad4626de4c2b..f2e9ee164bd8 100644
--- a/tools/perf/util/callchain.h
+++ b/tools/perf/util/callchain.h
@@ -4,7 +4,7 @@
4#include "../perf.h" 4#include "../perf.h"
5#include <linux/list.h> 5#include <linux/list.h>
6#include <linux/rbtree.h> 6#include <linux/rbtree.h>
7#include "util.h" 7#include "event.h"
8#include "symbol.h" 8#include "symbol.h"
9 9
10enum chain_mode { 10enum chain_mode {
@@ -33,13 +33,14 @@ typedef void (*sort_chain_func_t)(struct rb_root *, struct callchain_node *,
33 33
34struct callchain_param { 34struct callchain_param {
35 enum chain_mode mode; 35 enum chain_mode mode;
36 u32 print_limit;
36 double min_percent; 37 double min_percent;
37 sort_chain_func_t sort; 38 sort_chain_func_t sort;
38}; 39};
39 40
40struct callchain_list { 41struct callchain_list {
41 u64 ip; 42 u64 ip;
42 struct symbol *sym; 43 struct map_symbol ms;
43 struct list_head list; 44 struct list_head list;
44}; 45};
45 46
@@ -48,6 +49,9 @@ static inline void callchain_init(struct callchain_node *node)
48 INIT_LIST_HEAD(&node->brothers); 49 INIT_LIST_HEAD(&node->brothers);
49 INIT_LIST_HEAD(&node->children); 50 INIT_LIST_HEAD(&node->children);
50 INIT_LIST_HEAD(&node->val); 51 INIT_LIST_HEAD(&node->val);
52
53 node->parent = NULL;
54 node->hit = 0;
51} 55}
52 56
53static inline u64 cumul_hits(struct callchain_node *node) 57static inline u64 cumul_hits(struct callchain_node *node)
@@ -56,6 +60,8 @@ static inline u64 cumul_hits(struct callchain_node *node)
56} 60}
57 61
58int register_callchain_param(struct callchain_param *param); 62int register_callchain_param(struct callchain_param *param);
59void append_chain(struct callchain_node *root, struct ip_callchain *chain, 63int append_chain(struct callchain_node *root, struct ip_callchain *chain,
60 struct symbol **syms); 64 struct map_symbol *syms, u64 period);
65
66bool ip_callchain__valid(struct ip_callchain *chain, event_t *event);
61#endif /* __PERF_CALLCHAIN_H */ 67#endif /* __PERF_CALLCHAIN_H */
diff --git a/tools/perf/util/color.c b/tools/perf/util/color.c
index e88bca55a599..e191eb9a667f 100644
--- a/tools/perf/util/color.c
+++ b/tools/perf/util/color.c
@@ -166,6 +166,31 @@ int perf_color_default_config(const char *var, const char *value, void *cb)
166 return perf_default_config(var, value, cb); 166 return perf_default_config(var, value, cb);
167} 167}
168 168
169static int __color_vsnprintf(char *bf, size_t size, const char *color,
170 const char *fmt, va_list args, const char *trail)
171{
172 int r = 0;
173
174 /*
175 * Auto-detect:
176 */
177 if (perf_use_color_default < 0) {
178 if (isatty(1) || pager_in_use())
179 perf_use_color_default = 1;
180 else
181 perf_use_color_default = 0;
182 }
183
184 if (perf_use_color_default && *color)
185 r += snprintf(bf, size, "%s", color);
186 r += vsnprintf(bf + r, size - r, fmt, args);
187 if (perf_use_color_default && *color)
188 r += snprintf(bf + r, size - r, "%s", PERF_COLOR_RESET);
189 if (trail)
190 r += snprintf(bf + r, size - r, "%s", trail);
191 return r;
192}
193
169static int __color_vfprintf(FILE *fp, const char *color, const char *fmt, 194static int __color_vfprintf(FILE *fp, const char *color, const char *fmt,
170 va_list args, const char *trail) 195 va_list args, const char *trail)
171{ 196{
@@ -191,11 +216,28 @@ static int __color_vfprintf(FILE *fp, const char *color, const char *fmt,
191 return r; 216 return r;
192} 217}
193 218
/*
 * va_list flavour of color_snprintf(): formats into bf (at most size bytes)
 * using the given color and no trailing string. Returns whatever
 * __color_vsnprintf() returns.
 */
int color_vsnprintf(char *bf, size_t size, const char *color,
		    const char *fmt, va_list args)
{
	const char *no_trail = NULL;

	return __color_vsnprintf(bf, size, color, fmt, args, no_trail);
}
224
194int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args) 225int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args)
195{ 226{
196 return __color_vfprintf(fp, color, fmt, args, NULL); 227 return __color_vfprintf(fp, color, fmt, args, NULL);
197} 228}
198 229
/*
 * Variadic front end for color_vsnprintf(): collects the arguments that
 * follow fmt and forwards them, returning color_vsnprintf()'s result.
 */
int color_snprintf(char *bf, size_t size, const char *color,
		   const char *fmt, ...)
{
	va_list ap;
	int len;

	va_start(ap, fmt);
	len = color_vsnprintf(bf, size, color, fmt, ap);
	va_end(ap);

	return len;
}
199 241
200int color_fprintf(FILE *fp, const char *color, const char *fmt, ...) 242int color_fprintf(FILE *fp, const char *color, const char *fmt, ...)
201{ 243{
@@ -274,3 +316,9 @@ int percent_color_fprintf(FILE *fp, const char *fmt, double percent)
274 316
275 return r; 317 return r;
276} 318}
319
/*
 * Format a percentage into bf using the color that get_percent_color()
 * selects for it. fmt is expected to consume a single double argument.
 */
int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent)
{
	return color_snprintf(bf, size, get_percent_color(percent), fmt, percent);
}
diff --git a/tools/perf/util/color.h b/tools/perf/util/color.h
index 24e8809210bb..dea082b79602 100644
--- a/tools/perf/util/color.h
+++ b/tools/perf/util/color.h
@@ -32,10 +32,14 @@ int perf_color_default_config(const char *var, const char *value, void *cb);
32int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty); 32int perf_config_colorbool(const char *var, const char *value, int stdout_is_tty);
33void color_parse(const char *value, const char *var, char *dst); 33void color_parse(const char *value, const char *var, char *dst);
34void color_parse_mem(const char *value, int len, const char *var, char *dst); 34void color_parse_mem(const char *value, int len, const char *var, char *dst);
35int color_vsnprintf(char *bf, size_t size, const char *color,
36 const char *fmt, va_list args);
35int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args); 37int color_vfprintf(FILE *fp, const char *color, const char *fmt, va_list args);
36int color_fprintf(FILE *fp, const char *color, const char *fmt, ...); 38int color_fprintf(FILE *fp, const char *color, const char *fmt, ...);
39int color_snprintf(char *bf, size_t size, const char *color, const char *fmt, ...);
37int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...); 40int color_fprintf_ln(FILE *fp, const char *color, const char *fmt, ...);
38int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf); 41int color_fwrite_lines(FILE *fp, const char *color, size_t count, const char *buf);
42int percent_color_snprintf(char *bf, size_t size, const char *fmt, double percent);
39int percent_color_fprintf(FILE *fp, const char *fmt, double percent); 43int percent_color_fprintf(FILE *fp, const char *fmt, double percent);
40const char *get_percent_color(double percent); 44const char *get_percent_color(double percent);
41 45
diff --git a/tools/perf/util/config.c b/tools/perf/util/config.c
index 8784649109ce..dabe892d0e53 100644
--- a/tools/perf/util/config.c
+++ b/tools/perf/util/config.c
@@ -16,7 +16,7 @@ static const char *config_file_name;
16static int config_linenr; 16static int config_linenr;
17static int config_file_eof; 17static int config_file_eof;
18 18
19const char *config_exclusive_filename = NULL; 19static const char *config_exclusive_filename;
20 20
21static int get_next_char(void) 21static int get_next_char(void)
22{ 22{
@@ -291,19 +291,6 @@ static int perf_parse_long(const char *value, long *ret)
291 return 0; 291 return 0;
292} 292}
293 293
/*
 * Parse an unsigned long from a config value string.
 *
 * The number is read with strtoul() in base 0 and whatever follows it is
 * handed to parse_unit_factor(). Returns 1 and stores the result in *ret on
 * success; returns 0 (leaving *ret untouched) when value is NULL or empty,
 * or when parse_unit_factor() rejects the suffix.
 */
int perf_parse_ulong(const char *value, unsigned long *ret)
{
	char *end;
	unsigned long val;

	if (!value || !*value)
		return 0;

	val = strtoul(value, &end, 0);
	if (!parse_unit_factor(end, &val))
		return 0;

	*ret = val;
	return 1;
}
306
307static void die_bad_config(const char *name) 294static void die_bad_config(const char *name)
308{ 295{
309 if (config_file_name) 296 if (config_file_name)
@@ -319,15 +306,7 @@ int perf_config_int(const char *name, const char *value)
319 return ret; 306 return ret;
320} 307}
321 308
322unsigned long perf_config_ulong(const char *name, const char *value) 309static int perf_config_bool_or_int(const char *name, const char *value, int *is_bool)
323{
324 unsigned long ret;
325 if (!perf_parse_ulong(value, &ret))
326 die_bad_config(name);
327 return ret;
328}
329
330int perf_config_bool_or_int(const char *name, const char *value, int *is_bool)
331{ 310{
332 *is_bool = 1; 311 *is_bool = 1;
333 if (!value) 312 if (!value)
@@ -348,14 +327,6 @@ int perf_config_bool(const char *name, const char *value)
348 return !!perf_config_bool_or_int(name, value, &discard); 327 return !!perf_config_bool_or_int(name, value, &discard);
349} 328}
350 329
/*
 * Store a copy of a config value in *dest.
 *
 * A missing value is reported through config_error_nonbool() and its result
 * is returned; otherwise *dest receives a strdup() of value and 0 is
 * returned.
 */
int perf_config_string(const char **dest, const char *var, const char *value)
{
	if (value) {
		*dest = strdup(value);
		return 0;
	}

	return config_error_nonbool(var);
}
358
359static int perf_default_core_config(const char *var __used, const char *value __used) 330static int perf_default_core_config(const char *var __used, const char *value __used)
360{ 331{
361 /* Add other config variables here and to Documentation/config.txt. */ 332 /* Add other config variables here and to Documentation/config.txt. */
@@ -371,7 +342,7 @@ int perf_default_config(const char *var, const char *value, void *dummy __used)
371 return 0; 342 return 0;
372} 343}
373 344
374int perf_config_from_file(config_fn_t fn, const char *filename, void *data) 345static int perf_config_from_file(config_fn_t fn, const char *filename, void *data)
375{ 346{
376 int ret; 347 int ret;
377 FILE *f = fopen(filename, "r"); 348 FILE *f = fopen(filename, "r");
@@ -389,7 +360,7 @@ int perf_config_from_file(config_fn_t fn, const char *filename, void *data)
389 return ret; 360 return ret;
390} 361}
391 362
392const char *perf_etc_perfconfig(void) 363static const char *perf_etc_perfconfig(void)
393{ 364{
394 static const char *system_wide; 365 static const char *system_wide;
395 if (!system_wide) 366 if (!system_wide)
@@ -403,12 +374,12 @@ static int perf_env_bool(const char *k, int def)
403 return v ? perf_config_bool(k, v) : def; 374 return v ? perf_config_bool(k, v) : def;
404} 375}
405 376
406int perf_config_system(void) 377static int perf_config_system(void)
407{ 378{
408 return !perf_env_bool("PERF_CONFIG_NOSYSTEM", 0); 379 return !perf_env_bool("PERF_CONFIG_NOSYSTEM", 0);
409} 380}
410 381
411int perf_config_global(void) 382static int perf_config_global(void)
412{ 383{
413 return !perf_env_bool("PERF_CONFIG_NOGLOBAL", 0); 384 return !perf_env_bool("PERF_CONFIG_NOGLOBAL", 0);
414} 385}
@@ -450,426 +421,6 @@ int perf_config(config_fn_t fn, void *data)
450} 421}
451 422
452/* 423/*
453 * Find all the stuff for perf_config_set() below.
454 */
455
#define MAX_MATCHES 512

/*
 * State shared by the config rewriting helpers: the key being searched for
 * (and the length of its section part), the optional value filter, and the
 * file offsets recorded while scanning.
 */
static struct {
	int baselen;
	char *key;
	int do_not_match;
	regex_t *value_regex;
	int multi_replace;
	size_t offset[MAX_MATCHES];
	enum { START, SECTION_SEEN, SECTION_END_SEEN, KEY_SEEN } state;
	int seen;
} store;

/*
 * Tell whether a key/value pair is the one recorded in store.
 *
 * The key must equal store.key. Without a value regex that is sufficient;
 * with one, the regex result is XOR-ed with store.do_not_match, so a set
 * do_not_match flag inverts the value test. Returns 1 on match, 0 otherwise.
 */
static int matches(const char* key, const char* value)
{
	int regex_hit;

	if (strcmp(key, store.key) != 0)
		return 0;
	if (store.value_regex == NULL)
		return 1;

	regex_hit = !regexec(store.value_regex, value, 0, NULL, 0);
	return (store.do_not_match ^ regex_hit) != 0;
}
476
/*
 * Config callback that drives the store.state machine while a config file is
 * scanned: it records in store.offset[] the ftell() position of config_file
 * for entries of interest and counts matching key/value pairs in store.seen.
 *
 * Returns 1 when more than MAX_MATCHES matches are found, 0 otherwise. The
 * cb argument is unused.
 */
477static int store_aux(const char* key, const char* value, void *cb __used)
478{
479 int section_len;
480 const char *ep;
481
482 switch (store.state) {
483 case KEY_SEEN:
484 if (matches(key, value)) {
/* A second match is only a warning unless multi_replace is set. */
485 if (store.seen == 1 && store.multi_replace == 0) {
486 warning("%s has multiple values", key);
487 } else if (store.seen >= MAX_MATCHES) {
488 error("too many matches for %s", key);
489 return 1;
490 }
491
492 store.offset[store.seen] = ftell(config_file);
493 store.seen++;
494 }
495 break;
496 case SECTION_SEEN:
497 /*
498 * What we are looking for is in store.key (both
499 * section and var), and its section part is baselen
500 * long. We found key (again, both section and var).
501 * We would want to know if this key is in the same
502 * section as what we are looking for. We already
503 * know we are in the same section as what should
504 * hold store.key.
505 */
/*
 * NOTE(review): the strrchr() result is used without a NULL check;
 * presumably every key passed to this callback contains a '.' -- confirm
 * against the parser.
 */
506 ep = strrchr(key, '.');
507 section_len = ep - key;
508
509 if ((section_len != store.baselen) ||
510 memcmp(key, store.key, section_len+1)) {
511 store.state = SECTION_END_SEEN;
512 break;
513 }
514
515 /*
516 * Do not increment matches: this is no match, but we
517 * just made sure we are in the desired section.
518 */
519 store.offset[store.seen] = ftell(config_file);
520 /* fallthru */
521 case SECTION_END_SEEN:
522 case START:
523 if (matches(key, value)) {
524 store.offset[store.seen] = ftell(config_file);
525 store.state = KEY_SEEN;
526 store.seen++;
527 } else {
/* Same section as store.key but a different variable: remember where. */
528 if (strrchr(key, '.') - key == store.baselen &&
529 !strncmp(key, store.key, store.baselen)) {
530 store.state = SECTION_SEEN;
531 store.offset[store.seen] = ftell(config_file);
532 }
533 }
/* No break here: control falls into default, which only breaks. */
534 default:
535 break;
536 }
537 return 0;
538}
539
540static int store_write_section(int fd, const char* key)
541{
542 const char *dot;
543 int i, success;
544 struct strbuf sb = STRBUF_INIT;
545
546 dot = memchr(key, '.', store.baselen);
547 if (dot) {
548 strbuf_addf(&sb, "[%.*s \"", (int)(dot - key), key);
549 for (i = dot - key + 1; i < store.baselen; i++) {
550 if (key[i] == '"' || key[i] == '\\')
551 strbuf_addch(&sb, '\\');
552 strbuf_addch(&sb, key[i]);
553 }
554 strbuf_addstr(&sb, "\"]\n");
555 } else {
556 strbuf_addf(&sb, "[%.*s]\n", store.baselen, key);
557 }
558
559 success = (write_in_full(fd, sb.buf, sb.len) == (ssize_t)sb.len);
560 strbuf_release(&sb);
561
562 return success;
563}
564
565static int store_write_pair(int fd, const char* key, const char* value)
566{
567 int i, success;
568 int length = strlen(key + store.baselen + 1);
569 const char *quote = "";
570 struct strbuf sb = STRBUF_INIT;
571
572 /*
573 * Check to see if the value needs to be surrounded with a dq pair.
574 * Note that problematic characters are always backslash-quoted; this
575 * check is about not losing leading or trailing SP and strings that
576 * follow beginning-of-comment characters (i.e. ';' and '#') by the
577 * configuration parser.
578 */
579 if (value[0] == ' ')
580 quote = "\"";
581 for (i = 0; value[i]; i++)
582 if (value[i] == ';' || value[i] == '#')
583 quote = "\"";
584 if (i && value[i - 1] == ' ')
585 quote = "\"";
586
587 strbuf_addf(&sb, "\t%.*s = %s",
588 length, key + store.baselen + 1, quote);
589
590 for (i = 0; value[i]; i++)
591 switch (value[i]) {
592 case '\n':
593 strbuf_addstr(&sb, "\\n");
594 break;
595 case '\t':
596 strbuf_addstr(&sb, "\\t");
597 break;
598 case '"':
599 case '\\':
600 strbuf_addch(&sb, '\\');
601 default:
602 strbuf_addch(&sb, value[i]);
603 break;
604 }
605 strbuf_addf(&sb, "%s\n", quote);
606
607 success = (write_in_full(fd, sb.buf, sb.len) == (ssize_t)sb.len);
608 strbuf_release(&sb);
609
610 return success;
611}
612
/*
 * Scan backwards through contents, starting at offset_ - 2, for the start of
 * the line that precedes offset_.
 *
 * The scan stops at a '\n' or at offset 0. While scanning it remembers the
 * position of the '=' and ']' characters closest to the start of the line
 * (each later hit overwrites the earlier one); both start out as size,
 * meaning "not seen".
 *
 * Returns the offset just after ']' (and sets *found_bracket to 1) when a
 * ']' was seen before any '=', otherwise the offset following the position
 * where the scan stopped. *found_bracket is never cleared here.
 */
613static ssize_t find_beginning_of_line(const char* contents, size_t size,
614 size_t offset_, int* found_bracket)
615{
616 size_t equal_offset = size, bracket_offset = size;
617 ssize_t offset;
618
619contline:
620 for (offset = offset_-2; offset > 0
621 && contents[offset] != '\n'; offset--)
622 switch (contents[offset]) {
623 case '=': equal_offset = offset; break;
624 case ']': bracket_offset = offset; break;
625 default: break;
626 }
/*
 * A backslash right before the newline is a line continuation: keep
 * scanning the previous physical line, retaining the positions found so far.
 */
627 if (offset > 0 && contents[offset-1] == '\\') {
628 offset_ = offset;
629 goto contline;
630 }
631 if (bracket_offset < equal_offset) {
632 *found_bracket = 1;
633 offset = bracket_offset+1;
634 } else
/*
 * NOTE(review): when the scan ran down to offset 0 this yields 1 and
 * contents[0] is never inspected -- confirm that is intended.
 */
635 offset++;
636
637 return offset;
638}
639
/*
 * Convenience wrapper around perf_config_set_multivar(): set key to value
 * with no value regex and multi_replace disabled. Returns that function's
 * result.
 */
int perf_config_set(const char* key, const char* value)
{
	const char *no_value_regex = NULL;
	int multi_replace = 0;

	return perf_config_set_multivar(key, value, no_value_regex, multi_replace);
}
644
645/*
646 * If value==NULL, unset in (remove from) config,
647 * if value_regex!=NULL, disregard key/value pairs where value does not match.
648 * if multi_replace==0, nothing, or only one matching key/value is replaced,
649 * else all matching key/values (regardless how many) are removed,
650 * before the new pair is written.
651 *
652 * Returns 0 on success.
653 *
654 * This function does this:
655 *
656 * - it locks the config file by creating ".perf/config.lock"
657 *
658 * - it then parses the config using store_aux() as validator to find
659 * the position on the key/value pair to replace. If it is to be unset,
660 * it must be found exactly once.
661 *
662 * - the config file is mmap()ed and the part before the match (if any) is
663 * written to the lock file, then the changed part and the rest.
664 *
665 * - the config file is removed and the lock file rename()d to it.
666 *
667 */
668int perf_config_set_multivar(const char* key, const char* value,
669 const char* value_regex, int multi_replace)
670{
671 int i, dot;
672 int fd = -1, in_fd;
673 int ret = 0;
674 char* config_filename;
675 const char* last_dot = strrchr(key, '.');
676
677 if (config_exclusive_filename)
678 config_filename = strdup(config_exclusive_filename);
679 else
680 config_filename = perf_pathdup("config");
681
682 /*
683 * Since "key" actually contains the section name and the real
684 * key name separated by a dot, we have to know where the dot is.
685 */
686
687 if (last_dot == NULL) {
688 error("key does not contain a section: %s", key);
689 ret = 2;
690 goto out_free;
691 }
692 store.baselen = last_dot - key;
693
694 store.multi_replace = multi_replace;
695
696 /*
697 * Validate the key and while at it, lower case it for matching.
698 */
699 store.key = malloc(strlen(key) + 1);
700 dot = 0;
701 for (i = 0; key[i]; i++) {
702 unsigned char c = key[i];
703 if (c == '.')
704 dot = 1;
705 /* Leave the extended basename untouched.. */
706 if (!dot || i > store.baselen) {
707 if (!iskeychar(c) || (i == store.baselen+1 && !isalpha(c))) {
708 error("invalid key: %s", key);
709 free(store.key);
710 ret = 1;
711 goto out_free;
712 }
713 c = tolower(c);
714 } else if (c == '\n') {
715 error("invalid key (newline): %s", key);
716 free(store.key);
717 ret = 1;
718 goto out_free;
719 }
720 store.key[i] = c;
721 }
722 store.key[i] = 0;
723
724 /*
725 * If .perf/config does not exist yet, write a minimal version.
726 */
727 in_fd = open(config_filename, O_RDONLY);
728 if ( in_fd < 0 ) {
729 free(store.key);
730
731 if ( ENOENT != errno ) {
732 error("opening %s: %s", config_filename,
733 strerror(errno));
734 ret = 3; /* same as "invalid config file" */
735 goto out_free;
736 }
737 /* if nothing to unset, error out */
738 if (value == NULL) {
739 ret = 5;
740 goto out_free;
741 }
742
743 store.key = (char*)key;
744 if (!store_write_section(fd, key) ||
745 !store_write_pair(fd, key, value))
746 goto write_err_out;
747 } else {
748 struct stat st;
749 char *contents;
750 ssize_t contents_sz, copy_begin, copy_end;
751 int new_line = 0;
752
753 if (value_regex == NULL)
754 store.value_regex = NULL;
755 else {
756 if (value_regex[0] == '!') {
757 store.do_not_match = 1;
758 value_regex++;
759 } else
760 store.do_not_match = 0;
761
762 store.value_regex = (regex_t*)malloc(sizeof(regex_t));
763 if (regcomp(store.value_regex, value_regex,
764 REG_EXTENDED)) {
765 error("invalid pattern: %s", value_regex);
766 free(store.value_regex);
767 ret = 6;
768 goto out_free;
769 }
770 }
771
772 store.offset[0] = 0;
773 store.state = START;
774 store.seen = 0;
775
776 /*
777 * After this, store.offset will contain the *end* offset
778 * of the last match, or remain at 0 if no match was found.
779 * As a side effect, we make sure to transform only a valid
780 * existing config file.
781 */
782 if (perf_config_from_file(store_aux, config_filename, NULL)) {
783 error("invalid config file %s", config_filename);
784 free(store.key);
785 if (store.value_regex != NULL) {
786 regfree(store.value_regex);
787 free(store.value_regex);
788 }
789 ret = 3;
790 goto out_free;
791 }
792
793 free(store.key);
794 if (store.value_regex != NULL) {
795 regfree(store.value_regex);
796 free(store.value_regex);
797 }
798
799 /* if nothing to unset, or too many matches, error out */
800 if ((store.seen == 0 && value == NULL) ||
801 (store.seen > 1 && multi_replace == 0)) {
802 ret = 5;
803 goto out_free;
804 }
805
806 fstat(in_fd, &st);
807 contents_sz = xsize_t(st.st_size);
808 contents = mmap(NULL, contents_sz, PROT_READ,
809 MAP_PRIVATE, in_fd, 0);
810 close(in_fd);
811
812 if (store.seen == 0)
813 store.seen = 1;
814
815 for (i = 0, copy_begin = 0; i < store.seen; i++) {
816 if (store.offset[i] == 0) {
817 store.offset[i] = copy_end = contents_sz;
818 } else if (store.state != KEY_SEEN) {
819 copy_end = store.offset[i];
820 } else
821 copy_end = find_beginning_of_line(
822 contents, contents_sz,
823 store.offset[i]-2, &new_line);
824
825 if (copy_end > 0 && contents[copy_end-1] != '\n')
826 new_line = 1;
827
828 /* write the first part of the config */
829 if (copy_end > copy_begin) {
830 if (write_in_full(fd, contents + copy_begin,
831 copy_end - copy_begin) <
832 copy_end - copy_begin)
833 goto write_err_out;
834 if (new_line &&
835 write_in_full(fd, "\n", 1) != 1)
836 goto write_err_out;
837 }
838 copy_begin = store.offset[i];
839 }
840
841 /* write the pair (value == NULL means unset) */
842 if (value != NULL) {
843 if (store.state == START) {
844 if (!store_write_section(fd, key))
845 goto write_err_out;
846 }
847 if (!store_write_pair(fd, key, value))
848 goto write_err_out;
849 }
850
851 /* write the rest of the config */
852 if (copy_begin < contents_sz)
853 if (write_in_full(fd, contents + copy_begin,
854 contents_sz - copy_begin) <
855 contents_sz - copy_begin)
856 goto write_err_out;
857
858 munmap(contents, contents_sz);
859 }
860
861 ret = 0;
862
863out_free:
864 free(config_filename);
865 return ret;
866
867write_err_out:
868 goto out_free;
869
870}
871
872/*
873 * Call this to report error for your variable that should not 424 * Call this to report error for your variable that should not
874 * get a boolean value (i.e. "[my] var" means "true"). 425 * get a boolean value (i.e. "[my] var" means "true").
875 */ 426 */
diff --git a/tools/perf/util/cpumap.c b/tools/perf/util/cpumap.c
new file mode 100644
index 000000000000..4e01490e51e5
--- /dev/null
+++ b/tools/perf/util/cpumap.c
@@ -0,0 +1,59 @@
1#include "util.h"
2#include "../perf.h"
3#include "cpumap.h"
4#include <assert.h>
5#include <stdio.h>
6
7int cpumap[MAX_NR_CPUS];
8
9static int default_cpu_map(void)
10{
11 int nr_cpus, i;
12
13 nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
14 assert(nr_cpus <= MAX_NR_CPUS);
15 assert((int)nr_cpus >= 0);
16
17 for (i = 0; i < nr_cpus; ++i)
18 cpumap[i] = i;
19
20 return nr_cpus;
21}
22
23int read_cpu_map(void)
24{
25 FILE *onlnf;
26 int nr_cpus = 0;
27 int n, cpu, prev;
28 char sep;
29
30 onlnf = fopen("/sys/devices/system/cpu/online", "r");
31 if (!onlnf)
32 return default_cpu_map();
33
34 sep = 0;
35 prev = -1;
36 for (;;) {
37 n = fscanf(onlnf, "%u%c", &cpu, &sep);
38 if (n <= 0)
39 break;
40 if (prev >= 0) {
41 assert(nr_cpus + cpu - prev - 1 < MAX_NR_CPUS);
42 while (++prev < cpu)
43 cpumap[nr_cpus++] = prev;
44 }
45 assert (nr_cpus < MAX_NR_CPUS);
46 cpumap[nr_cpus++] = cpu;
47 if (n == 2 && sep == '-')
48 prev = cpu;
49 else
50 prev = -1;
51 if (n == 1 || sep == '\n')
52 break;
53 }
54 fclose(onlnf);
55 if (nr_cpus > 0)
56 return nr_cpus;
57
58 return default_cpu_map();
59}
diff --git a/tools/perf/util/cpumap.h b/tools/perf/util/cpumap.h
new file mode 100644
index 000000000000..86c78bb33098
--- /dev/null
+++ b/tools/perf/util/cpumap.h
@@ -0,0 +1,7 @@
1#ifndef __PERF_CPUMAP_H
2#define __PERF_CPUMAP_H
3
4extern int read_cpu_map(void);
5extern int cpumap[];
6
7#endif /* __PERF_CPUMAP_H */
diff --git a/tools/perf/util/data_map.c b/tools/perf/util/data_map.c
deleted file mode 100644
index b557b836de3d..000000000000
--- a/tools/perf/util/data_map.c
+++ /dev/null
@@ -1,252 +0,0 @@
1#include "symbol.h"
2#include "util.h"
3#include "debug.h"
4#include "thread.h"
5#include "session.h"
6
7static int process_event_stub(event_t *event __used,
8 struct perf_session *session __used)
9{
10 dump_printf(": unhandled!\n");
11 return 0;
12}
13
14static void perf_event_ops__fill_defaults(struct perf_event_ops *handler)
15{
16 if (!handler->process_sample_event)
17 handler->process_sample_event = process_event_stub;
18 if (!handler->process_mmap_event)
19 handler->process_mmap_event = process_event_stub;
20 if (!handler->process_comm_event)
21 handler->process_comm_event = process_event_stub;
22 if (!handler->process_fork_event)
23 handler->process_fork_event = process_event_stub;
24 if (!handler->process_exit_event)
25 handler->process_exit_event = process_event_stub;
26 if (!handler->process_lost_event)
27 handler->process_lost_event = process_event_stub;
28 if (!handler->process_read_event)
29 handler->process_read_event = process_event_stub;
30 if (!handler->process_throttle_event)
31 handler->process_throttle_event = process_event_stub;
32 if (!handler->process_unthrottle_event)
33 handler->process_unthrottle_event = process_event_stub;
34}
35
36static const char *event__name[] = {
37 [0] = "TOTAL",
38 [PERF_RECORD_MMAP] = "MMAP",
39 [PERF_RECORD_LOST] = "LOST",
40 [PERF_RECORD_COMM] = "COMM",
41 [PERF_RECORD_EXIT] = "EXIT",
42 [PERF_RECORD_THROTTLE] = "THROTTLE",
43 [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE",
44 [PERF_RECORD_FORK] = "FORK",
45 [PERF_RECORD_READ] = "READ",
46 [PERF_RECORD_SAMPLE] = "SAMPLE",
47};
48
49unsigned long event__total[PERF_RECORD_MAX];
50
51void event__print_totals(void)
52{
53 int i;
54 for (i = 0; i < PERF_RECORD_MAX; ++i)
55 pr_info("%10s events: %10ld\n",
56 event__name[i], event__total[i]);
57}
58
59static int process_event(event_t *event, struct perf_session *session,
60 struct perf_event_ops *ops,
61 unsigned long offset, unsigned long head)
62{
63 trace_event(event);
64
65 if (event->header.type < PERF_RECORD_MAX) {
66 dump_printf("%p [%p]: PERF_RECORD_%s",
67 (void *)(offset + head),
68 (void *)(long)(event->header.size),
69 event__name[event->header.type]);
70 ++event__total[0];
71 ++event__total[event->header.type];
72 }
73
74 switch (event->header.type) {
75 case PERF_RECORD_SAMPLE:
76 return ops->process_sample_event(event, session);
77 case PERF_RECORD_MMAP:
78 return ops->process_mmap_event(event, session);
79 case PERF_RECORD_COMM:
80 return ops->process_comm_event(event, session);
81 case PERF_RECORD_FORK:
82 return ops->process_fork_event(event, session);
83 case PERF_RECORD_EXIT:
84 return ops->process_exit_event(event, session);
85 case PERF_RECORD_LOST:
86 return ops->process_lost_event(event, session);
87 case PERF_RECORD_READ:
88 return ops->process_read_event(event, session);
89 case PERF_RECORD_THROTTLE:
90 return ops->process_throttle_event(event, session);
91 case PERF_RECORD_UNTHROTTLE:
92 return ops->process_unthrottle_event(event, session);
93 default:
94 ops->total_unknown++;
95 return -1;
96 }
97}
98
99int perf_header__read_build_ids(int input, u64 offset, u64 size)
100{
101 struct build_id_event bev;
102 char filename[PATH_MAX];
103 u64 limit = offset + size;
104 int err = -1;
105
106 while (offset < limit) {
107 struct dso *dso;
108 ssize_t len;
109
110 if (read(input, &bev, sizeof(bev)) != sizeof(bev))
111 goto out;
112
113 len = bev.header.size - sizeof(bev);
114 if (read(input, filename, len) != len)
115 goto out;
116
117 dso = dsos__findnew(filename);
118 if (dso != NULL)
119 dso__set_build_id(dso, &bev.build_id);
120
121 offset += bev.header.size;
122 }
123 err = 0;
124out:
125 return err;
126}
127
/*
 * Look up (or create) the thread with pid 0 in the session and name it
 * "swapper".  Returns the thread, or NULL after logging an error when
 * either step fails.
 */
static struct thread *perf_session__register_idle_thread(struct perf_session *self)
{
	struct thread *idle = perf_session__findnew(self, 0);

	if (idle && !thread__set_comm(idle, "swapper"))
		return idle;

	pr_err("problem inserting idle task.\n");
	return NULL;
}
139
140int perf_session__process_events(struct perf_session *self,
141 struct perf_event_ops *ops)
142{
143 int err;
144 unsigned long head, shift;
145 unsigned long offset = 0;
146 size_t page_size;
147 event_t *event;
148 uint32_t size;
149 char *buf;
150
151 if (perf_session__register_idle_thread(self) == NULL)
152 return -ENOMEM;
153
154 perf_event_ops__fill_defaults(ops);
155
156 page_size = getpagesize();
157
158 head = self->header.data_offset;
159 self->sample_type = perf_header__sample_type(&self->header);
160
161 err = -EINVAL;
162 if (ops->sample_type_check && ops->sample_type_check(self) < 0)
163 goto out_err;
164
165 if (!ops->full_paths) {
166 char bf[PATH_MAX];
167
168 if (getcwd(bf, sizeof(bf)) == NULL) {
169 err = -errno;
170out_getcwd_err:
171 pr_err("failed to get the current directory\n");
172 goto out_err;
173 }
174 self->cwd = strdup(bf);
175 if (self->cwd == NULL) {
176 err = -ENOMEM;
177 goto out_getcwd_err;
178 }
179 self->cwdlen = strlen(self->cwd);
180 }
181
182 shift = page_size * (head / page_size);
183 offset += shift;
184 head -= shift;
185
186remap:
187 buf = mmap(NULL, page_size * self->mmap_window, PROT_READ,
188 MAP_SHARED, self->fd, offset);
189 if (buf == MAP_FAILED) {
190 pr_err("failed to mmap file\n");
191 err = -errno;
192 goto out_err;
193 }
194
195more:
196 event = (event_t *)(buf + head);
197
198 size = event->header.size;
199 if (!size)
200 size = 8;
201
202 if (head + event->header.size >= page_size * self->mmap_window) {
203 int munmap_ret;
204
205 shift = page_size * (head / page_size);
206
207 munmap_ret = munmap(buf, page_size * self->mmap_window);
208 assert(munmap_ret == 0);
209
210 offset += shift;
211 head -= shift;
212 goto remap;
213 }
214
215 size = event->header.size;
216
217 dump_printf("\n%p [%p]: event: %d\n",
218 (void *)(offset + head),
219 (void *)(long)event->header.size,
220 event->header.type);
221
222 if (!size || process_event(event, self, ops, offset, head) < 0) {
223
224 dump_printf("%p [%p]: skipping unknown header type: %d\n",
225 (void *)(offset + head),
226 (void *)(long)(event->header.size),
227 event->header.type);
228
229 /*
230 * assume we lost track of the stream, check alignment, and
231 * increment a single u64 in the hope to catch on again 'soon'.
232 */
233
234 if (unlikely(head & 7))
235 head &= ~7ULL;
236
237 size = 8;
238 }
239
240 head += size;
241
242 if (offset + head >= self->header.data_offset + self->header.data_size)
243 goto done;
244
245 if (offset + head < self->size)
246 goto more;
247
248done:
249 err = 0;
250out_err:
251 return err;
252}
diff --git a/tools/perf/util/debug.c b/tools/perf/util/debug.c
index 28d520d5a1fb..6cddff2bc970 100644
--- a/tools/perf/util/debug.c
+++ b/tools/perf/util/debug.c
@@ -6,12 +6,14 @@
6#include <stdarg.h> 6#include <stdarg.h>
7#include <stdio.h> 7#include <stdio.h>
8 8
9#include "cache.h"
9#include "color.h" 10#include "color.h"
10#include "event.h" 11#include "event.h"
11#include "debug.h" 12#include "debug.h"
13#include "util.h"
12 14
13int verbose = 0; 15int verbose = 0;
14int dump_trace = 0; 16bool dump_trace = false;
15 17
16int eprintf(int level, const char *fmt, ...) 18int eprintf(int level, const char *fmt, ...)
17{ 19{
@@ -20,7 +22,10 @@ int eprintf(int level, const char *fmt, ...)
20 22
21 if (verbose >= level) { 23 if (verbose >= level) {
22 va_start(args, fmt); 24 va_start(args, fmt);
23 ret = vfprintf(stderr, fmt, args); 25 if (use_browser > 0)
26 ret = browser__show_help(fmt, args);
27 else
28 ret = vfprintf(stderr, fmt, args);
24 va_end(args); 29 va_end(args);
25 } 30 }
26 31
diff --git a/tools/perf/util/debug.h b/tools/perf/util/debug.h
index c6c24c522dea..047ac3324ebe 100644
--- a/tools/perf/util/debug.h
+++ b/tools/perf/util/debug.h
@@ -2,14 +2,38 @@
2#ifndef __PERF_DEBUG_H 2#ifndef __PERF_DEBUG_H
3#define __PERF_DEBUG_H 3#define __PERF_DEBUG_H
4 4
5#include <stdbool.h>
5#include "event.h" 6#include "event.h"
6 7
7extern int verbose; 8extern int verbose;
8extern int dump_trace; 9extern bool dump_trace;
9 10
10int eprintf(int level,
11 const char *fmt, ...) __attribute__((format(printf, 2, 3)));
12int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2))); 11int dump_printf(const char *fmt, ...) __attribute__((format(printf, 1, 2)));
13void trace_event(event_t *event); 12void trace_event(event_t *event);
14 13
14struct ui_progress;
15
16#ifdef NO_NEWT_SUPPORT
17static inline int browser__show_help(const char *format __used, va_list ap __used)
18{
19 return 0;
20}
21
22static inline struct ui_progress *ui_progress__new(const char *title __used,
23 u64 total __used)
24{
25 return (struct ui_progress *)1;
26}
27
28static inline void ui_progress__update(struct ui_progress *self __used,
29 u64 curr __used) {}
30
31static inline void ui_progress__delete(struct ui_progress *self __used) {}
32#else
33int browser__show_help(const char *format, va_list ap);
34struct ui_progress *ui_progress__new(const char *title, u64 total);
35void ui_progress__update(struct ui_progress *self, u64 curr);
36void ui_progress__delete(struct ui_progress *self);
37#endif
38
15#endif /* __PERF_DEBUG_H */ 39#endif /* __PERF_DEBUG_H */
diff --git a/tools/perf/util/debugfs.c b/tools/perf/util/debugfs.c
index 06b73ee02c49..a88fefc0cc0a 100644
--- a/tools/perf/util/debugfs.c
+++ b/tools/perf/util/debugfs.c
@@ -106,16 +106,14 @@ int debugfs_valid_entry(const char *path)
106 return 0; 106 return 0;
107} 107}
108 108
109/* mount the debugfs somewhere */ 109/* mount the debugfs somewhere if it's not mounted */
110 110
111int debugfs_mount(const char *mountpoint) 111char *debugfs_mount(const char *mountpoint)
112{ 112{
113 char mountcmd[128];
114
115 /* see if it's already mounted */ 113 /* see if it's already mounted */
116 if (debugfs_find_mountpoint()) { 114 if (debugfs_find_mountpoint()) {
117 debugfs_premounted = 1; 115 debugfs_premounted = 1;
118 return 0; 116 return debugfs_mountpoint;
119 } 117 }
120 118
121 /* if not mounted and no argument */ 119 /* if not mounted and no argument */
@@ -127,13 +125,14 @@ int debugfs_mount(const char *mountpoint)
127 mountpoint = "/sys/kernel/debug"; 125 mountpoint = "/sys/kernel/debug";
128 } 126 }
129 127
128 if (mount(NULL, mountpoint, "debugfs", 0, NULL) < 0)
129 return NULL;
130
130 /* save the mountpoint */ 131 /* save the mountpoint */
131 strncpy(debugfs_mountpoint, mountpoint, sizeof(debugfs_mountpoint)); 132 strncpy(debugfs_mountpoint, mountpoint, sizeof(debugfs_mountpoint));
133 debugfs_found = 1;
132 134
133 /* mount it */ 135 return debugfs_mountpoint;
134 snprintf(mountcmd, sizeof(mountcmd),
135 "/bin/mount -t debugfs debugfs %s", mountpoint);
136 return system(mountcmd);
137} 136}
138 137
139/* umount the debugfs */ 138/* umount the debugfs */
diff --git a/tools/perf/util/debugfs.h b/tools/perf/util/debugfs.h
index 3cd14f9ae784..83a02879745f 100644
--- a/tools/perf/util/debugfs.h
+++ b/tools/perf/util/debugfs.h
@@ -15,7 +15,7 @@
15extern const char *debugfs_find_mountpoint(void); 15extern const char *debugfs_find_mountpoint(void);
16extern int debugfs_valid_mountpoint(const char *debugfs); 16extern int debugfs_valid_mountpoint(const char *debugfs);
17extern int debugfs_valid_entry(const char *path); 17extern int debugfs_valid_entry(const char *path);
18extern int debugfs_mount(const char *mountpoint); 18extern char *debugfs_mount(const char *mountpoint);
19extern int debugfs_umount(void); 19extern int debugfs_umount(void);
20extern int debugfs_write(const char *entry, const char *value); 20extern int debugfs_write(const char *entry, const char *value);
21extern int debugfs_read(const char *entry, char *buffer, size_t size); 21extern int debugfs_read(const char *entry, char *buffer, size_t size);
diff --git a/tools/perf/util/event.c b/tools/perf/util/event.c
index 8a9e6baa3099..2fbf6a463c81 100644
--- a/tools/perf/util/event.c
+++ b/tools/perf/util/event.c
@@ -7,9 +7,25 @@
7#include "strlist.h" 7#include "strlist.h"
8#include "thread.h" 8#include "thread.h"
9 9
10const char *event__name[] = {
11 [0] = "TOTAL",
12 [PERF_RECORD_MMAP] = "MMAP",
13 [PERF_RECORD_LOST] = "LOST",
14 [PERF_RECORD_COMM] = "COMM",
15 [PERF_RECORD_EXIT] = "EXIT",
16 [PERF_RECORD_THROTTLE] = "THROTTLE",
17 [PERF_RECORD_UNTHROTTLE] = "UNTHROTTLE",
18 [PERF_RECORD_FORK] = "FORK",
19 [PERF_RECORD_READ] = "READ",
20 [PERF_RECORD_SAMPLE] = "SAMPLE",
21 [PERF_RECORD_HEADER_ATTR] = "ATTR",
22 [PERF_RECORD_HEADER_EVENT_TYPE] = "EVENT_TYPE",
23 [PERF_RECORD_HEADER_TRACING_DATA] = "TRACING_DATA",
24 [PERF_RECORD_HEADER_BUILD_ID] = "BUILD_ID",
25};
26
10static pid_t event__synthesize_comm(pid_t pid, int full, 27static pid_t event__synthesize_comm(pid_t pid, int full,
11 int (*process)(event_t *event, 28 event__handler_t process,
12 struct perf_session *session),
13 struct perf_session *session) 29 struct perf_session *session)
14{ 30{
15 event_t ev; 31 event_t ev;
@@ -91,8 +107,7 @@ out_failure:
91} 107}
92 108
93static int event__synthesize_mmap_events(pid_t pid, pid_t tgid, 109static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
94 int (*process)(event_t *event, 110 event__handler_t process,
95 struct perf_session *session),
96 struct perf_session *session) 111 struct perf_session *session)
97{ 112{
98 char filename[PATH_MAX]; 113 char filename[PATH_MAX];
@@ -112,7 +127,14 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
112 while (1) { 127 while (1) {
113 char bf[BUFSIZ], *pbf = bf; 128 char bf[BUFSIZ], *pbf = bf;
114 event_t ev = { 129 event_t ev = {
115 .header = { .type = PERF_RECORD_MMAP }, 130 .header = {
131 .type = PERF_RECORD_MMAP,
132 /*
133 * Just like the kernel, see __perf_event_mmap
134 * in kernel/perf_event.c
135 */
136 .misc = PERF_RECORD_MISC_USER,
137 },
116 }; 138 };
117 int n; 139 int n;
118 size_t size; 140 size_t size;
@@ -129,6 +151,7 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
129 continue; 151 continue;
130 pbf += n + 3; 152 pbf += n + 3;
131 if (*pbf == 'x') { /* vm_exec */ 153 if (*pbf == 'x') { /* vm_exec */
154 u64 vm_pgoff;
132 char *execname = strchr(bf, '/'); 155 char *execname = strchr(bf, '/');
133 156
134 /* Catch VDSO */ 157 /* Catch VDSO */
@@ -138,6 +161,14 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
138 if (execname == NULL) 161 if (execname == NULL)
139 continue; 162 continue;
140 163
164 pbf += 3;
165 n = hex2u64(pbf, &vm_pgoff);
166 /* pgoff is in bytes, not pages */
167 if (n >= 0)
168 ev.mmap.pgoff = vm_pgoff << getpagesize();
169 else
170 ev.mmap.pgoff = 0;
171
141 size = strlen(execname); 172 size = strlen(execname);
142 execname[size - 1] = '\0'; /* Remove \n */ 173 execname[size - 1] = '\0'; /* Remove \n */
143 memcpy(ev.mmap.filename, execname, size); 174 memcpy(ev.mmap.filename, execname, size);
@@ -156,9 +187,51 @@ static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
156 return 0; 187 return 0;
157} 188}
158 189
159int event__synthesize_thread(pid_t pid, 190int event__synthesize_modules(event__handler_t process,
160 int (*process)(event_t *event, 191 struct perf_session *session,
161 struct perf_session *session), 192 struct machine *machine)
193{
194 struct rb_node *nd;
195 struct map_groups *kmaps = &machine->kmaps;
196 u16 misc;
197
198 /*
199 * kernel uses 0 for user space maps, see kernel/perf_event.c
200 * __perf_event_mmap
201 */
202 if (machine__is_host(machine))
203 misc = PERF_RECORD_MISC_KERNEL;
204 else
205 misc = PERF_RECORD_MISC_GUEST_KERNEL;
206
207 for (nd = rb_first(&kmaps->maps[MAP__FUNCTION]);
208 nd; nd = rb_next(nd)) {
209 event_t ev;
210 size_t size;
211 struct map *pos = rb_entry(nd, struct map, rb_node);
212
213 if (pos->dso->kernel)
214 continue;
215
216 size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64));
217 memset(&ev, 0, sizeof(ev));
218 ev.mmap.header.misc = misc;
219 ev.mmap.header.type = PERF_RECORD_MMAP;
220 ev.mmap.header.size = (sizeof(ev.mmap) -
221 (sizeof(ev.mmap.filename) - size));
222 ev.mmap.start = pos->start;
223 ev.mmap.len = pos->end - pos->start;
224 ev.mmap.pid = machine->pid;
225
226 memcpy(ev.mmap.filename, pos->dso->long_name,
227 pos->dso->long_name_len + 1);
228 process(&ev, session);
229 }
230
231 return 0;
232}
233
234int event__synthesize_thread(pid_t pid, event__handler_t process,
162 struct perf_session *session) 235 struct perf_session *session)
163{ 236{
164 pid_t tgid = event__synthesize_comm(pid, 1, process, session); 237 pid_t tgid = event__synthesize_comm(pid, 1, process, session);
@@ -167,8 +240,7 @@ int event__synthesize_thread(pid_t pid,
167 return event__synthesize_mmap_events(pid, tgid, process, session); 240 return event__synthesize_mmap_events(pid, tgid, process, session);
168} 241}
169 242
170void event__synthesize_threads(int (*process)(event_t *event, 243void event__synthesize_threads(event__handler_t process,
171 struct perf_session *session),
172 struct perf_session *session) 244 struct perf_session *session)
173{ 245{
174 DIR *proc; 246 DIR *proc;
@@ -189,6 +261,85 @@ void event__synthesize_threads(int (*process)(event_t *event,
189 closedir(proc); 261 closedir(proc);
190} 262}
191 263
264struct process_symbol_args {
265 const char *name;
266 u64 start;
267};
268
269static int find_symbol_cb(void *arg, const char *name, char type, u64 start)
270{
271 struct process_symbol_args *args = arg;
272
273 /*
274 * Must be a function or at least an alias, as in PARISC64, where "_text" is
275 * an 'A' to the same address as "_stext".
276 */
277 if (!(symbol_type__is_a(type, MAP__FUNCTION) ||
278 type == 'A') || strcmp(name, args->name))
279 return 0;
280
281 args->start = start;
282 return 1;
283}
284
285int event__synthesize_kernel_mmap(event__handler_t process,
286 struct perf_session *session,
287 struct machine *machine,
288 const char *symbol_name)
289{
290 size_t size;
291 const char *filename, *mmap_name;
292 char path[PATH_MAX];
293 char name_buff[PATH_MAX];
294 struct map *map;
295
296 event_t ev = {
297 .header = {
298 .type = PERF_RECORD_MMAP,
299 },
300 };
301 /*
302 * We should get this from /sys/kernel/sections/.text, but till that is
303 * available use this, and after it is use this as a fallback for older
304 * kernels.
305 */
306 struct process_symbol_args args = { .name = symbol_name, };
307
308 mmap_name = machine__mmap_name(machine, name_buff, sizeof(name_buff));
309 if (machine__is_host(machine)) {
310 /*
311 * kernel uses PERF_RECORD_MISC_USER for user space maps,
312 * see kernel/perf_event.c __perf_event_mmap
313 */
314 ev.header.misc = PERF_RECORD_MISC_KERNEL;
315 filename = "/proc/kallsyms";
316 } else {
317 ev.header.misc = PERF_RECORD_MISC_GUEST_KERNEL;
318 if (machine__is_default_guest(machine))
319 filename = (char *) symbol_conf.default_guest_kallsyms;
320 else {
321 sprintf(path, "%s/proc/kallsyms", machine->root_dir);
322 filename = path;
323 }
324 }
325
326 if (kallsyms__parse(filename, &args, find_symbol_cb) <= 0)
327 return -ENOENT;
328
329 map = machine->vmlinux_maps[MAP__FUNCTION];
330 size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename),
331 "%s%s", mmap_name, symbol_name) + 1;
332 size = ALIGN(size, sizeof(u64));
333 ev.mmap.header.size = (sizeof(ev.mmap) -
334 (sizeof(ev.mmap.filename) - size));
335 ev.mmap.pgoff = args.start;
336 ev.mmap.start = map->start;
337 ev.mmap.len = map->end - ev.mmap.start;
338 ev.mmap.pid = machine->pid;
339
340 return process(&ev, session);
341}
342
192static void thread__comm_adjust(struct thread *self) 343static void thread__comm_adjust(struct thread *self)
193{ 344{
194 char *comm = self->comm; 345 char *comm = self->comm;
@@ -219,9 +370,9 @@ static int thread__set_comm_adjust(struct thread *self, const char *comm)
219 370
220int event__process_comm(event_t *self, struct perf_session *session) 371int event__process_comm(event_t *self, struct perf_session *session)
221{ 372{
222 struct thread *thread = perf_session__findnew(session, self->comm.pid); 373 struct thread *thread = perf_session__findnew(session, self->comm.tid);
223 374
224 dump_printf(": %s:%d\n", self->comm.comm, self->comm.pid); 375 dump_printf(": %s:%d\n", self->comm.comm, self->comm.tid);
225 376
226 if (thread == NULL || thread__set_comm_adjust(thread, self->comm.comm)) { 377 if (thread == NULL || thread__set_comm_adjust(thread, self->comm.comm)) {
227 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n"); 378 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
@@ -234,46 +385,163 @@ int event__process_comm(event_t *self, struct perf_session *session)
234int event__process_lost(event_t *self, struct perf_session *session) 385int event__process_lost(event_t *self, struct perf_session *session)
235{ 386{
236 dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost); 387 dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost);
237 session->events_stats.lost += self->lost.lost; 388 session->hists.stats.total_lost += self->lost.lost;
238 return 0; 389 return 0;
239} 390}
240 391
392static void event_set_kernel_mmap_len(struct map **maps, event_t *self)
393{
394 maps[MAP__FUNCTION]->start = self->mmap.start;
395 maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len;
396 /*
397 * Be a bit paranoid here, some perf.data file came with
398 * a zero sized synthesized MMAP event for the kernel.
399 */
400 if (maps[MAP__FUNCTION]->end == 0)
401 maps[MAP__FUNCTION]->end = ~0UL;
402}
403
404static int event__process_kernel_mmap(event_t *self,
405 struct perf_session *session)
406{
407 struct map *map;
408 char kmmap_prefix[PATH_MAX];
409 struct machine *machine;
410 enum dso_kernel_type kernel_type;
411 bool is_kernel_mmap;
412
413 machine = perf_session__findnew_machine(session, self->mmap.pid);
414 if (!machine) {
415 pr_err("Can't find id %d's machine\n", self->mmap.pid);
416 goto out_problem;
417 }
418
419 machine__mmap_name(machine, kmmap_prefix, sizeof(kmmap_prefix));
420 if (machine__is_host(machine))
421 kernel_type = DSO_TYPE_KERNEL;
422 else
423 kernel_type = DSO_TYPE_GUEST_KERNEL;
424
425 is_kernel_mmap = memcmp(self->mmap.filename,
426 kmmap_prefix,
427 strlen(kmmap_prefix)) == 0;
428 if (self->mmap.filename[0] == '/' ||
429 (!is_kernel_mmap && self->mmap.filename[0] == '[')) {
430
431 char short_module_name[1024];
432 char *name, *dot;
433
434 if (self->mmap.filename[0] == '/') {
435 name = strrchr(self->mmap.filename, '/');
436 if (name == NULL)
437 goto out_problem;
438
439 ++name; /* skip / */
440 dot = strrchr(name, '.');
441 if (dot == NULL)
442 goto out_problem;
443 snprintf(short_module_name, sizeof(short_module_name),
444 "[%.*s]", (int)(dot - name), name);
445 strxfrchar(short_module_name, '-', '_');
446 } else
447 strcpy(short_module_name, self->mmap.filename);
448
449 map = machine__new_module(machine, self->mmap.start,
450 self->mmap.filename);
451 if (map == NULL)
452 goto out_problem;
453
454 name = strdup(short_module_name);
455 if (name == NULL)
456 goto out_problem;
457
458 map->dso->short_name = name;
459 map->end = map->start + self->mmap.len;
460 } else if (is_kernel_mmap) {
461 const char *symbol_name = (self->mmap.filename +
462 strlen(kmmap_prefix));
463 /*
464 * Should be there already, from the build-id table in
465 * the header.
466 */
467 struct dso *kernel = __dsos__findnew(&machine->kernel_dsos,
468 kmmap_prefix);
469 if (kernel == NULL)
470 goto out_problem;
471
472 kernel->kernel = kernel_type;
473 if (__machine__create_kernel_maps(machine, kernel) < 0)
474 goto out_problem;
475
476 event_set_kernel_mmap_len(machine->vmlinux_maps, self);
477 perf_session__set_kallsyms_ref_reloc_sym(machine->vmlinux_maps,
478 symbol_name,
479 self->mmap.pgoff);
480 if (machine__is_default_guest(machine)) {
481 /*
482 * preload dso of guest kernel and modules
483 */
484 dso__load(kernel, machine->vmlinux_maps[MAP__FUNCTION],
485 NULL);
486 }
487 }
488 return 0;
489out_problem:
490 return -1;
491}
492
241int event__process_mmap(event_t *self, struct perf_session *session) 493int event__process_mmap(event_t *self, struct perf_session *session)
242{ 494{
243 struct thread *thread = perf_session__findnew(session, self->mmap.pid); 495 struct machine *machine;
244 struct map *map = map__new(&self->mmap, MAP__FUNCTION, 496 struct thread *thread;
245 session->cwd, session->cwdlen); 497 struct map *map;
498 u8 cpumode = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
499 int ret = 0;
500
501 dump_printf(" %d/%d: [%#Lx(%#Lx) @ %#Lx]: %s\n",
502 self->mmap.pid, self->mmap.tid, self->mmap.start,
503 self->mmap.len, self->mmap.pgoff, self->mmap.filename);
504
505 if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL ||
506 cpumode == PERF_RECORD_MISC_KERNEL) {
507 ret = event__process_kernel_mmap(self, session);
508 if (ret < 0)
509 goto out_problem;
510 return 0;
511 }
246 512
247 dump_printf(" %d/%d: [%p(%p) @ %p]: %s\n", 513 machine = perf_session__find_host_machine(session);
248 self->mmap.pid, self->mmap.tid, 514 if (machine == NULL)
249 (void *)(long)self->mmap.start, 515 goto out_problem;
250 (void *)(long)self->mmap.len, 516 thread = perf_session__findnew(session, self->mmap.pid);
251 (void *)(long)self->mmap.pgoff, 517 map = map__new(&machine->user_dsos, self->mmap.start,
252 self->mmap.filename); 518 self->mmap.len, self->mmap.pgoff,
519 self->mmap.pid, self->mmap.filename,
520 MAP__FUNCTION, session->cwd, session->cwdlen);
253 521
254 if (thread == NULL || map == NULL) 522 if (thread == NULL || map == NULL)
255 dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n"); 523 goto out_problem;
256 else
257 thread__insert_map(thread, map);
258 524
525 thread__insert_map(thread, map);
526 return 0;
527
528out_problem:
529 dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n");
259 return 0; 530 return 0;
260} 531}
261 532
262int event__process_task(event_t *self, struct perf_session *session) 533int event__process_task(event_t *self, struct perf_session *session)
263{ 534{
264 struct thread *thread = perf_session__findnew(session, self->fork.pid); 535 struct thread *thread = perf_session__findnew(session, self->fork.tid);
265 struct thread *parent = perf_session__findnew(session, self->fork.ppid); 536 struct thread *parent = perf_session__findnew(session, self->fork.ptid);
266 537
267 dump_printf("(%d:%d):(%d:%d)\n", self->fork.pid, self->fork.tid, 538 dump_printf("(%d:%d):(%d:%d)\n", self->fork.pid, self->fork.tid,
268 self->fork.ppid, self->fork.ptid); 539 self->fork.ppid, self->fork.ptid);
269 /*
270 * A thread clone will have the same PID for both parent and child.
271 */
272 if (thread == parent)
273 return 0;
274 540
275 if (self->header.type == PERF_RECORD_EXIT) 541 if (self->header.type == PERF_RECORD_EXIT) {
542 perf_session__remove_thread(session, thread);
276 return 0; 543 return 0;
544 }
277 545
278 if (thread == NULL || parent == NULL || 546 if (thread == NULL || parent == NULL ||
279 thread__fork(thread, parent) < 0) { 547 thread__fork(thread, parent) < 0) {
@@ -284,26 +552,58 @@ int event__process_task(event_t *self, struct perf_session *session)
284 return 0; 552 return 0;
285} 553}
286 554
287void thread__find_addr_location(struct thread *self, 555void thread__find_addr_map(struct thread *self,
288 struct perf_session *session, u8 cpumode, 556 struct perf_session *session, u8 cpumode,
289 enum map_type type, u64 addr, 557 enum map_type type, pid_t pid, u64 addr,
290 struct addr_location *al, 558 struct addr_location *al)
291 symbol_filter_t filter)
292{ 559{
293 struct map_groups *mg = &self->mg; 560 struct map_groups *mg = &self->mg;
561 struct machine *machine = NULL;
294 562
295 al->thread = self; 563 al->thread = self;
296 al->addr = addr; 564 al->addr = addr;
565 al->cpumode = cpumode;
566 al->filtered = false;
297 567
298 if (cpumode == PERF_RECORD_MISC_KERNEL) { 568 if (cpumode == PERF_RECORD_MISC_KERNEL && perf_host) {
299 al->level = 'k'; 569 al->level = 'k';
300 mg = &session->kmaps; 570 machine = perf_session__find_host_machine(session);
301 } else if (cpumode == PERF_RECORD_MISC_USER) 571 if (machine == NULL) {
572 al->map = NULL;
573 return;
574 }
575 mg = &machine->kmaps;
576 } else if (cpumode == PERF_RECORD_MISC_USER && perf_host) {
302 al->level = '.'; 577 al->level = '.';
303 else { 578 machine = perf_session__find_host_machine(session);
304 al->level = 'H'; 579 } else if (cpumode == PERF_RECORD_MISC_GUEST_KERNEL && perf_guest) {
580 al->level = 'g';
581 machine = perf_session__find_machine(session, pid);
582 if (machine == NULL) {
583 al->map = NULL;
584 return;
585 }
586 mg = &machine->kmaps;
587 } else {
588 /*
589 * 'u' means guest os user space.
590 * TODO: We don't support guest user space yet. Might support it later.
591 */
592 if (cpumode == PERF_RECORD_MISC_GUEST_USER && perf_guest)
593 al->level = 'u';
594 else
595 al->level = 'H';
305 al->map = NULL; 596 al->map = NULL;
306 al->sym = NULL; 597
598 if ((cpumode == PERF_RECORD_MISC_GUEST_USER ||
599 cpumode == PERF_RECORD_MISC_GUEST_KERNEL) &&
600 !perf_guest)
601 al->filtered = true;
602 if ((cpumode == PERF_RECORD_MISC_USER ||
603 cpumode == PERF_RECORD_MISC_KERNEL) &&
604 !perf_host)
605 al->filtered = true;
606
307 return; 607 return;
308 } 608 }
309try_again: 609try_again:
@@ -318,15 +618,27 @@ try_again:
318 * "[vdso]" dso, but for now lets use the old trick of looking 618 * "[vdso]" dso, but for now lets use the old trick of looking
319 * in the whole kernel symbol list. 619 * in the whole kernel symbol list.
320 */ 620 */
321 if ((long long)al->addr < 0 && mg != &session->kmaps) { 621 if ((long long)al->addr < 0 &&
322 mg = &session->kmaps; 622 cpumode == PERF_RECORD_MISC_KERNEL &&
623 machine && mg != &machine->kmaps) {
624 mg = &machine->kmaps;
323 goto try_again; 625 goto try_again;
324 } 626 }
325 al->sym = NULL; 627 } else
326 } else {
327 al->addr = al->map->map_ip(al->map, al->addr); 628 al->addr = al->map->map_ip(al->map, al->addr);
328 al->sym = map__find_symbol(al->map, session, al->addr, filter); 629}
329 } 630
631void thread__find_addr_location(struct thread *self,
632 struct perf_session *session, u8 cpumode,
633 enum map_type type, pid_t pid, u64 addr,
634 struct addr_location *al,
635 symbol_filter_t filter)
636{
637 thread__find_addr_map(self, session, cpumode, type, pid, addr, al);
638 if (al->map != NULL)
639 al->sym = map__find_symbol(al->map, al->addr, filter);
640 else
641 al->sym = NULL;
330} 642}
331 643
332static void dso__calc_col_width(struct dso *self) 644static void dso__calc_col_width(struct dso *self)
@@ -334,8 +646,10 @@ static void dso__calc_col_width(struct dso *self)
334 if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep && 646 if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep &&
335 (!symbol_conf.dso_list || 647 (!symbol_conf.dso_list ||
336 strlist__has_entry(symbol_conf.dso_list, self->name))) { 648 strlist__has_entry(symbol_conf.dso_list, self->name))) {
337 unsigned int slen = strlen(self->name); 649 u16 slen = self->short_name_len;
338 if (slen > dsos__col_width) 650 if (verbose)
651 slen = self->long_name_len;
652 if (dsos__col_width < slen)
339 dsos__col_width = slen; 653 dsos__col_width = slen;
340 } 654 }
341 655
@@ -356,31 +670,55 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session,
356 goto out_filtered; 670 goto out_filtered;
357 671
358 dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid); 672 dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);
673 /*
674 * Have we already created the kernel maps for the host machine?
675 *
676 * This should have happened earlier, when we processed the kernel MMAP
677 * events, but for older perf.data files there was no such thing, so do
678 * it now.
679 */
680 if (cpumode == PERF_RECORD_MISC_KERNEL &&
681 session->host_machine.vmlinux_maps[MAP__FUNCTION] == NULL)
682 machine__create_kernel_maps(&session->host_machine);
359 683
360 thread__find_addr_location(thread, session, cpumode, MAP__FUNCTION, 684 thread__find_addr_map(thread, session, cpumode, MAP__FUNCTION,
361 self->ip.ip, al, filter); 685 self->ip.pid, self->ip.ip, al);
362 dump_printf(" ...... dso: %s\n", 686 dump_printf(" ...... dso: %s\n",
363 al->map ? al->map->dso->long_name : 687 al->map ? al->map->dso->long_name :
364 al->level == 'H' ? "[hypervisor]" : "<not found>"); 688 al->level == 'H' ? "[hypervisor]" : "<not found>");
365 /* 689 al->sym = NULL;
366 * We have to do this here as we may have a dso with no symbol hit that 690
367 * has a name longer than the ones with symbols sampled. 691 if (al->map) {
368 */ 692 if (symbol_conf.dso_list &&
369 if (al->map && !sort_dso.elide && !al->map->dso->slen_calculated) 693 (!al->map || !al->map->dso ||
370 dso__calc_col_width(al->map->dso); 694 !(strlist__has_entry(symbol_conf.dso_list,
371 695 al->map->dso->short_name) ||
372 if (symbol_conf.dso_list && 696 (al->map->dso->short_name != al->map->dso->long_name &&
373 (!al->map || !al->map->dso || 697 strlist__has_entry(symbol_conf.dso_list,
374 !(strlist__has_entry(symbol_conf.dso_list, al->map->dso->short_name) || 698 al->map->dso->long_name)))))
375 (al->map->dso->short_name != al->map->dso->long_name && 699 goto out_filtered;
376 strlist__has_entry(symbol_conf.dso_list, al->map->dso->long_name))))) 700 /*
377 goto out_filtered; 701 * We have to do this here as we may have a dso with no symbol
702 * hit that has a name longer than the ones with symbols
703 * sampled.
704 */
705 if (!sort_dso.elide && !al->map->dso->slen_calculated)
706 dso__calc_col_width(al->map->dso);
707
708 al->sym = map__find_symbol(al->map, al->addr, filter);
709 } else {
710 const unsigned int unresolved_col_width = BITS_PER_LONG / 4;
711
712 if (dsos__col_width < unresolved_col_width &&
713 !symbol_conf.col_width_list_str && !symbol_conf.field_sep &&
714 !symbol_conf.dso_list)
715 dsos__col_width = unresolved_col_width;
716 }
378 717
379 if (symbol_conf.sym_list && al->sym && 718 if (symbol_conf.sym_list && al->sym &&
380 !strlist__has_entry(symbol_conf.sym_list, al->sym->name)) 719 !strlist__has_entry(symbol_conf.sym_list, al->sym->name))
381 goto out_filtered; 720 goto out_filtered;
382 721
383 al->filtered = false;
384 return 0; 722 return 0;
385 723
386out_filtered: 724out_filtered:
@@ -414,6 +752,7 @@ int event__parse_sample(event_t *event, u64 type, struct sample_data *data)
414 array++; 752 array++;
415 } 753 }
416 754
755 data->id = -1ULL;
417 if (type & PERF_SAMPLE_ID) { 756 if (type & PERF_SAMPLE_ID) {
418 data->id = *array; 757 data->id = *array;
419 array++; 758 array++;
diff --git a/tools/perf/util/event.h b/tools/perf/util/event.h
index 690a96d0467c..8577085db067 100644
--- a/tools/perf/util/event.h
+++ b/tools/perf/util/event.h
@@ -1,10 +1,10 @@
1#ifndef __PERF_RECORD_H 1#ifndef __PERF_RECORD_H
2#define __PERF_RECORD_H 2#define __PERF_RECORD_H
3 3
4#include <limits.h>
5
4#include "../perf.h" 6#include "../perf.h"
5#include "util.h" 7#include "map.h"
6#include <linux/list.h>
7#include <linux/rbtree.h>
8 8
9/* 9/*
10 * PERF_SAMPLE_IP | PERF_SAMPLE_TID | * 10 * PERF_SAMPLE_IP | PERF_SAMPLE_TID | *
@@ -68,21 +68,54 @@ struct sample_data {
68 u64 addr; 68 u64 addr;
69 u64 id; 69 u64 id;
70 u64 stream_id; 70 u64 stream_id;
71 u32 cpu;
72 u64 period; 71 u64 period;
73 struct ip_callchain *callchain; 72 u32 cpu;
74 u32 raw_size; 73 u32 raw_size;
75 void *raw_data; 74 void *raw_data;
75 struct ip_callchain *callchain;
76}; 76};
77 77
78#define BUILD_ID_SIZE 20 78#define BUILD_ID_SIZE 20
79 79
80struct build_id_event { 80struct build_id_event {
81 struct perf_event_header header; 81 struct perf_event_header header;
82 pid_t pid;
82 u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))]; 83 u8 build_id[ALIGN(BUILD_ID_SIZE, sizeof(u64))];
83 char filename[]; 84 char filename[];
84}; 85};
85 86
87enum perf_user_event_type { /* above any possible kernel type */
88 PERF_RECORD_HEADER_ATTR = 64,
89 PERF_RECORD_HEADER_EVENT_TYPE = 65,
90 PERF_RECORD_HEADER_TRACING_DATA = 66,
91 PERF_RECORD_HEADER_BUILD_ID = 67,
92 PERF_RECORD_FINISHED_ROUND = 68,
93 PERF_RECORD_HEADER_MAX
94};
95
96struct attr_event {
97 struct perf_event_header header;
98 struct perf_event_attr attr;
99 u64 id[];
100};
101
102#define MAX_EVENT_NAME 64
103
104struct perf_trace_event_type {
105 u64 event_id;
106 char name[MAX_EVENT_NAME];
107};
108
109struct event_type_event {
110 struct perf_event_header header;
111 struct perf_trace_event_type event_type;
112};
113
114struct tracing_data_event {
115 struct perf_event_header header;
116 u32 size;
117};
118
86typedef union event_union { 119typedef union event_union {
87 struct perf_event_header header; 120 struct perf_event_header header;
88 struct ip_event ip; 121 struct ip_event ip;
@@ -92,83 +125,30 @@ typedef union event_union {
92 struct lost_event lost; 125 struct lost_event lost;
93 struct read_event read; 126 struct read_event read;
94 struct sample_event sample; 127 struct sample_event sample;
128 struct attr_event attr;
129 struct event_type_event event_type;
130 struct tracing_data_event tracing_data;
131 struct build_id_event build_id;
95} event_t; 132} event_t;
96 133
97struct events_stats {
98 u64 total;
99 u64 lost;
100};
101
102void event__print_totals(void); 134void event__print_totals(void);
103 135
104enum map_type {
105 MAP__FUNCTION = 0,
106 MAP__VARIABLE,
107};
108
109#define MAP__NR_TYPES (MAP__VARIABLE + 1)
110
111struct map {
112 union {
113 struct rb_node rb_node;
114 struct list_head node;
115 };
116 u64 start;
117 u64 end;
118 enum map_type type;
119 u64 pgoff;
120 u64 (*map_ip)(struct map *, u64);
121 u64 (*unmap_ip)(struct map *, u64);
122 struct dso *dso;
123};
124
125static inline u64 map__map_ip(struct map *map, u64 ip)
126{
127 return ip - map->start + map->pgoff;
128}
129
130static inline u64 map__unmap_ip(struct map *map, u64 ip)
131{
132 return ip + map->start - map->pgoff;
133}
134
135static inline u64 identity__map_ip(struct map *map __used, u64 ip)
136{
137 return ip;
138}
139
140struct symbol;
141
142typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym);
143
144void map__init(struct map *self, enum map_type type,
145 u64 start, u64 end, u64 pgoff, struct dso *dso);
146struct map *map__new(struct mmap_event *event, enum map_type,
147 char *cwd, int cwdlen);
148void map__delete(struct map *self);
149struct map *map__clone(struct map *self);
150int map__overlap(struct map *l, struct map *r);
151size_t map__fprintf(struct map *self, FILE *fp);
152
153struct perf_session; 136struct perf_session;
154 137
155int map__load(struct map *self, struct perf_session *session, 138typedef int (*event__handler_t)(event_t *event, struct perf_session *session);
156 symbol_filter_t filter); 139
157struct symbol *map__find_symbol(struct map *self, struct perf_session *session, 140int event__synthesize_thread(pid_t pid, event__handler_t process,
158 u64 addr, symbol_filter_t filter);
159struct symbol *map__find_symbol_by_name(struct map *self, const char *name,
160 struct perf_session *session,
161 symbol_filter_t filter);
162void map__fixup_start(struct map *self);
163void map__fixup_end(struct map *self);
164
165int event__synthesize_thread(pid_t pid,
166 int (*process)(event_t *event,
167 struct perf_session *session),
168 struct perf_session *session); 141 struct perf_session *session);
169void event__synthesize_threads(int (*process)(event_t *event, 142void event__synthesize_threads(event__handler_t process,
170 struct perf_session *session),
171 struct perf_session *session); 143 struct perf_session *session);
144int event__synthesize_kernel_mmap(event__handler_t process,
145 struct perf_session *session,
146 struct machine *machine,
147 const char *symbol_name);
148
149int event__synthesize_modules(event__handler_t process,
150 struct perf_session *session,
151 struct machine *machine);
172 152
173int event__process_comm(event_t *self, struct perf_session *session); 153int event__process_comm(event_t *self, struct perf_session *session);
174int event__process_lost(event_t *self, struct perf_session *session); 154int event__process_lost(event_t *self, struct perf_session *session);
@@ -180,4 +160,6 @@ int event__preprocess_sample(const event_t *self, struct perf_session *session,
180 struct addr_location *al, symbol_filter_t filter); 160 struct addr_location *al, symbol_filter_t filter);
181int event__parse_sample(event_t *event, u64 type, struct sample_data *data); 161int event__parse_sample(event_t *event, u64 type, struct sample_data *data);
182 162
163extern const char *event__name[];
164
183#endif /* __PERF_RECORD_H */ 165#endif /* __PERF_RECORD_H */
diff --git a/tools/perf/util/exec_cmd.c b/tools/perf/util/exec_cmd.c
index 2745605dba11..67eeff571568 100644
--- a/tools/perf/util/exec_cmd.c
+++ b/tools/perf/util/exec_cmd.c
@@ -53,8 +53,8 @@ const char *perf_extract_argv0_path(const char *argv0)
53 slash--; 53 slash--;
54 54
55 if (slash >= argv0) { 55 if (slash >= argv0) {
56 argv0_path = xstrndup(argv0, slash - argv0); 56 argv0_path = strndup(argv0, slash - argv0);
57 return slash + 1; 57 return argv0_path ? slash + 1 : NULL;
58 } 58 }
59 59
60 return argv0; 60 return argv0;
@@ -116,7 +116,7 @@ void setup_path(void)
116 strbuf_release(&new_path); 116 strbuf_release(&new_path);
117} 117}
118 118
119const char **prepare_perf_cmd(const char **argv) 119static const char **prepare_perf_cmd(const char **argv)
120{ 120{
121 int argc; 121 int argc;
122 const char **nargv; 122 const char **nargv;
diff --git a/tools/perf/util/exec_cmd.h b/tools/perf/util/exec_cmd.h
index 31647ac92ed1..bc4b915963f5 100644
--- a/tools/perf/util/exec_cmd.h
+++ b/tools/perf/util/exec_cmd.h
@@ -5,7 +5,6 @@ extern void perf_set_argv_exec_path(const char *exec_path);
5extern const char *perf_extract_argv0_path(const char *path); 5extern const char *perf_extract_argv0_path(const char *path);
6extern const char *perf_exec_path(void); 6extern const char *perf_exec_path(void);
7extern void setup_path(void); 7extern void setup_path(void);
8extern const char **prepare_perf_cmd(const char **argv);
9extern int execv_perf_cmd(const char **argv); /* NULL terminated */ 8extern int execv_perf_cmd(const char **argv); /* NULL terminated */
10extern int execl_perf_cmd(const char *cmd, ...); 9extern int execl_perf_cmd(const char *cmd, ...);
11extern const char *system_path(const char *path); 10extern const char *system_path(const char *path);
diff --git a/tools/perf/util/header.c b/tools/perf/util/header.c
index 8a0bca55106f..1f62435f96c2 100644
--- a/tools/perf/util/header.c
+++ b/tools/perf/util/header.c
@@ -1,8 +1,12 @@
1#define _FILE_OFFSET_BITS 64
2
1#include <sys/types.h> 3#include <sys/types.h>
4#include <byteswap.h>
2#include <unistd.h> 5#include <unistd.h>
3#include <stdio.h> 6#include <stdio.h>
4#include <stdlib.h> 7#include <stdlib.h>
5#include <linux/list.h> 8#include <linux/list.h>
9#include <linux/kernel.h>
6 10
7#include "util.h" 11#include "util.h"
8#include "header.h" 12#include "header.h"
@@ -95,34 +99,31 @@ int perf_header__add_attr(struct perf_header *self,
95 return 0; 99 return 0;
96} 100}
97 101
98#define MAX_EVENT_NAME 64
99
100struct perf_trace_event_type {
101 u64 event_id;
102 char name[MAX_EVENT_NAME];
103};
104
105static int event_count; 102static int event_count;
106static struct perf_trace_event_type *events; 103static struct perf_trace_event_type *events;
107 104
108void perf_header__push_event(u64 id, const char *name) 105int perf_header__push_event(u64 id, const char *name)
109{ 106{
110 if (strlen(name) > MAX_EVENT_NAME) 107 if (strlen(name) > MAX_EVENT_NAME)
111 pr_warning("Event %s will be truncated\n", name); 108 pr_warning("Event %s will be truncated\n", name);
112 109
113 if (!events) { 110 if (!events) {
114 events = malloc(sizeof(struct perf_trace_event_type)); 111 events = malloc(sizeof(struct perf_trace_event_type));
115 if (!events) 112 if (events == NULL)
116 die("nomem"); 113 return -ENOMEM;
117 } else { 114 } else {
118 events = realloc(events, (event_count + 1) * sizeof(struct perf_trace_event_type)); 115 struct perf_trace_event_type *nevents;
119 if (!events) 116
120 die("nomem"); 117 nevents = realloc(events, (event_count + 1) * sizeof(*events));
118 if (nevents == NULL)
119 return -ENOMEM;
120 events = nevents;
121 } 121 }
122 memset(&events[event_count], 0, sizeof(struct perf_trace_event_type)); 122 memset(&events[event_count], 0, sizeof(struct perf_trace_event_type));
123 events[event_count].event_id = id; 123 events[event_count].event_id = id;
124 strncpy(events[event_count].name, name, MAX_EVENT_NAME - 1); 124 strncpy(events[event_count].name, name, MAX_EVENT_NAME - 1);
125 event_count++; 125 event_count++;
126 return 0;
126} 127}
127 128
128char *perf_header__find_event(u64 id) 129char *perf_header__find_event(u64 id)
@@ -169,31 +170,50 @@ static int do_write(int fd, const void *buf, size_t size)
169 return 0; 170 return 0;
170} 171}
171 172
172static int __dsos__write_buildid_table(struct list_head *head, int fd) 173#define NAME_ALIGN 64
174
175static int write_padded(int fd, const void *bf, size_t count,
176 size_t count_aligned)
173{ 177{
174#define NAME_ALIGN 64
175 struct dso *pos;
176 static const char zero_buf[NAME_ALIGN]; 178 static const char zero_buf[NAME_ALIGN];
179 int err = do_write(fd, bf, count);
180
181 if (!err)
182 err = do_write(fd, zero_buf, count_aligned - count);
177 183
178 list_for_each_entry(pos, head, node) { 184 return err;
185}
186
187#define dsos__for_each_with_build_id(pos, head) \
188 list_for_each_entry(pos, head, node) \
189 if (!pos->has_build_id) \
190 continue; \
191 else
192
193static int __dsos__write_buildid_table(struct list_head *head, pid_t pid,
194 u16 misc, int fd)
195{
196 struct dso *pos;
197
198 dsos__for_each_with_build_id(pos, head) {
179 int err; 199 int err;
180 struct build_id_event b; 200 struct build_id_event b;
181 size_t len; 201 size_t len;
182 202
183 if (!pos->has_build_id) 203 if (!pos->hit)
184 continue; 204 continue;
185 len = pos->long_name_len + 1; 205 len = pos->long_name_len + 1;
186 len = ALIGN(len, NAME_ALIGN); 206 len = ALIGN(len, NAME_ALIGN);
187 memset(&b, 0, sizeof(b)); 207 memset(&b, 0, sizeof(b));
188 memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id)); 208 memcpy(&b.build_id, pos->build_id, sizeof(pos->build_id));
209 b.pid = pid;
210 b.header.misc = misc;
189 b.header.size = sizeof(b) + len; 211 b.header.size = sizeof(b) + len;
190 err = do_write(fd, &b, sizeof(b)); 212 err = do_write(fd, &b, sizeof(b));
191 if (err < 0) 213 if (err < 0)
192 return err; 214 return err;
193 err = do_write(fd, pos->long_name, pos->long_name_len + 1); 215 err = write_padded(fd, pos->long_name,
194 if (err < 0) 216 pos->long_name_len + 1, len);
195 return err;
196 err = do_write(fd, zero_buf, len - pos->long_name_len - 1);
197 if (err < 0) 217 if (err < 0)
198 return err; 218 return err;
199 } 219 }
@@ -201,23 +221,216 @@ static int __dsos__write_buildid_table(struct list_head *head, int fd)
201 return 0; 221 return 0;
202} 222}
203 223
204static int dsos__write_buildid_table(int fd) 224static int machine__write_buildid_table(struct machine *self, int fd)
205{ 225{
206 int err = __dsos__write_buildid_table(&dsos__kernel, fd); 226 int err;
227 u16 kmisc = PERF_RECORD_MISC_KERNEL,
228 umisc = PERF_RECORD_MISC_USER;
229
230 if (!machine__is_host(self)) {
231 kmisc = PERF_RECORD_MISC_GUEST_KERNEL;
232 umisc = PERF_RECORD_MISC_GUEST_USER;
233 }
234
235 err = __dsos__write_buildid_table(&self->kernel_dsos, self->pid,
236 kmisc, fd);
207 if (err == 0) 237 if (err == 0)
208 err = __dsos__write_buildid_table(&dsos__user, fd); 238 err = __dsos__write_buildid_table(&self->user_dsos,
239 self->pid, umisc, fd);
240 return err;
241}
242
243static int dsos__write_buildid_table(struct perf_header *header, int fd)
244{
245 struct perf_session *session = container_of(header,
246 struct perf_session, header);
247 struct rb_node *nd;
248 int err = machine__write_buildid_table(&session->host_machine, fd);
249
250 if (err)
251 return err;
252
253 for (nd = rb_first(&session->machines); nd; nd = rb_next(nd)) {
254 struct machine *pos = rb_entry(nd, struct machine, rb_node);
255 err = machine__write_buildid_table(pos, fd);
256 if (err)
257 break;
258 }
259 return err;
260}
261
262int build_id_cache__add_s(const char *sbuild_id, const char *debugdir,
263 const char *name, bool is_kallsyms)
264{
265 const size_t size = PATH_MAX;
266 char *filename = malloc(size),
267 *linkname = malloc(size), *targetname;
268 int len, err = -1;
269
270 if (filename == NULL || linkname == NULL)
271 goto out_free;
272
273 len = snprintf(filename, size, "%s%s%s",
274 debugdir, is_kallsyms ? "/" : "", name);
275 if (mkdir_p(filename, 0755))
276 goto out_free;
277
278 snprintf(filename + len, sizeof(filename) - len, "/%s", sbuild_id);
279
280 if (access(filename, F_OK)) {
281 if (is_kallsyms) {
282 if (copyfile("/proc/kallsyms", filename))
283 goto out_free;
284 } else if (link(name, filename) && copyfile(name, filename))
285 goto out_free;
286 }
287
288 len = snprintf(linkname, size, "%s/.build-id/%.2s",
289 debugdir, sbuild_id);
290
291 if (access(linkname, X_OK) && mkdir_p(linkname, 0755))
292 goto out_free;
293
294 snprintf(linkname + len, size - len, "/%s", sbuild_id + 2);
295 targetname = filename + strlen(debugdir) - 5;
296 memcpy(targetname, "../..", 5);
297
298 if (symlink(targetname, linkname) == 0)
299 err = 0;
300out_free:
301 free(filename);
302 free(linkname);
303 return err;
304}
305
306static int build_id_cache__add_b(const u8 *build_id, size_t build_id_size,
307 const char *name, const char *debugdir,
308 bool is_kallsyms)
309{
310 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
311
312 build_id__sprintf(build_id, build_id_size, sbuild_id);
313
314 return build_id_cache__add_s(sbuild_id, debugdir, name, is_kallsyms);
315}
316
317int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir)
318{
319 const size_t size = PATH_MAX;
320 char *filename = malloc(size),
321 *linkname = malloc(size);
322 int err = -1;
323
324 if (filename == NULL || linkname == NULL)
325 goto out_free;
326
327 snprintf(linkname, size, "%s/.build-id/%.2s/%s",
328 debugdir, sbuild_id, sbuild_id + 2);
329
330 if (access(linkname, F_OK))
331 goto out_free;
332
333 if (readlink(linkname, filename, size) < 0)
334 goto out_free;
335
336 if (unlink(linkname))
337 goto out_free;
338
339 /*
340 * Since the link is relative, we must make it absolute:
341 */
342 snprintf(linkname, size, "%s/.build-id/%.2s/%s",
343 debugdir, sbuild_id, filename);
344
345 if (unlink(linkname))
346 goto out_free;
347
348 err = 0;
349out_free:
350 free(filename);
351 free(linkname);
352 return err;
353}
354
355static int dso__cache_build_id(struct dso *self, const char *debugdir)
356{
357 bool is_kallsyms = self->kernel && self->long_name[0] != '/';
358
359 return build_id_cache__add_b(self->build_id, sizeof(self->build_id),
360 self->long_name, debugdir, is_kallsyms);
361}
362
363static int __dsos__cache_build_ids(struct list_head *head, const char *debugdir)
364{
365 struct dso *pos;
366 int err = 0;
367
368 dsos__for_each_with_build_id(pos, head)
369 if (dso__cache_build_id(pos, debugdir))
370 err = -1;
371
209 return err; 372 return err;
210} 373}
211 374
375static int machine__cache_build_ids(struct machine *self, const char *debugdir)
376{
377 int ret = __dsos__cache_build_ids(&self->kernel_dsos, debugdir);
378 ret |= __dsos__cache_build_ids(&self->user_dsos, debugdir);
379 return ret;
380}
381
382static int perf_session__cache_build_ids(struct perf_session *self)
383{
384 struct rb_node *nd;
385 int ret;
386 char debugdir[PATH_MAX];
387
388 snprintf(debugdir, sizeof(debugdir), "%s/%s", getenv("HOME"),
389 DEBUG_CACHE_DIR);
390
391 if (mkdir(debugdir, 0755) != 0 && errno != EEXIST)
392 return -1;
393
394 ret = machine__cache_build_ids(&self->host_machine, debugdir);
395
396 for (nd = rb_first(&self->machines); nd; nd = rb_next(nd)) {
397 struct machine *pos = rb_entry(nd, struct machine, rb_node);
398 ret |= machine__cache_build_ids(pos, debugdir);
399 }
400 return ret ? -1 : 0;
401}
402
403static bool machine__read_build_ids(struct machine *self, bool with_hits)
404{
405 bool ret = __dsos__read_build_ids(&self->kernel_dsos, with_hits);
406 ret |= __dsos__read_build_ids(&self->user_dsos, with_hits);
407 return ret;
408}
409
410static bool perf_session__read_build_ids(struct perf_session *self, bool with_hits)
411{
412 struct rb_node *nd;
413 bool ret = machine__read_build_ids(&self->host_machine, with_hits);
414
415 for (nd = rb_first(&self->machines); nd; nd = rb_next(nd)) {
416 struct machine *pos = rb_entry(nd, struct machine, rb_node);
417 ret |= machine__read_build_ids(pos, with_hits);
418 }
419
420 return ret;
421}
422
212static int perf_header__adds_write(struct perf_header *self, int fd) 423static int perf_header__adds_write(struct perf_header *self, int fd)
213{ 424{
214 int nr_sections; 425 int nr_sections;
426 struct perf_session *session;
215 struct perf_file_section *feat_sec; 427 struct perf_file_section *feat_sec;
216 int sec_size; 428 int sec_size;
217 u64 sec_start; 429 u64 sec_start;
218 int idx = 0, err; 430 int idx = 0, err;
219 431
220 if (dsos__read_build_ids()) 432 session = container_of(self, struct perf_session, header);
433 if (perf_session__read_build_ids(session, true))
221 perf_header__set_feat(self, HEADER_BUILD_ID); 434 perf_header__set_feat(self, HEADER_BUILD_ID);
222 435
223 nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); 436 nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS);
@@ -244,7 +457,6 @@ static int perf_header__adds_write(struct perf_header *self, int fd)
244 trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset; 457 trace_sec->size = lseek(fd, 0, SEEK_CUR) - trace_sec->offset;
245 } 458 }
246 459
247
248 if (perf_header__has_feat(self, HEADER_BUILD_ID)) { 460 if (perf_header__has_feat(self, HEADER_BUILD_ID)) {
249 struct perf_file_section *buildid_sec; 461 struct perf_file_section *buildid_sec;
250 462
@@ -252,12 +464,14 @@ static int perf_header__adds_write(struct perf_header *self, int fd)
252 464
253 /* Write build-ids */ 465 /* Write build-ids */
254 buildid_sec->offset = lseek(fd, 0, SEEK_CUR); 466 buildid_sec->offset = lseek(fd, 0, SEEK_CUR);
255 err = dsos__write_buildid_table(fd); 467 err = dsos__write_buildid_table(self, fd);
256 if (err < 0) { 468 if (err < 0) {
257 pr_debug("failed to write buildid table\n"); 469 pr_debug("failed to write buildid table\n");
258 goto out_free; 470 goto out_free;
259 } 471 }
260 buildid_sec->size = lseek(fd, 0, SEEK_CUR) - buildid_sec->offset; 472 buildid_sec->size = lseek(fd, 0, SEEK_CUR) -
473 buildid_sec->offset;
474 perf_session__cache_build_ids(session);
261 } 475 }
262 476
263 lseek(fd, sec_start, SEEK_SET); 477 lseek(fd, sec_start, SEEK_SET);
@@ -269,6 +483,25 @@ out_free:
269 return err; 483 return err;
270} 484}
271 485
486int perf_header__write_pipe(int fd)
487{
488 struct perf_pipe_file_header f_header;
489 int err;
490
491 f_header = (struct perf_pipe_file_header){
492 .magic = PERF_MAGIC,
493 .size = sizeof(f_header),
494 };
495
496 err = do_write(fd, &f_header, sizeof(f_header));
497 if (err < 0) {
498 pr_debug("failed to write perf pipe header\n");
499 return err;
500 }
501
502 return 0;
503}
504
272int perf_header__write(struct perf_header *self, int fd, bool at_exit) 505int perf_header__write(struct perf_header *self, int fd, bool at_exit)
273{ 506{
274 struct perf_file_header f_header; 507 struct perf_file_header f_header;
@@ -278,7 +511,6 @@ int perf_header__write(struct perf_header *self, int fd, bool at_exit)
278 511
279 lseek(fd, sizeof(f_header), SEEK_SET); 512 lseek(fd, sizeof(f_header), SEEK_SET);
280 513
281
282 for (i = 0; i < self->attrs; i++) { 514 for (i = 0; i < self->attrs; i++) {
283 attr = self->attr[i]; 515 attr = self->attr[i];
284 516
@@ -360,30 +592,28 @@ int perf_header__write(struct perf_header *self, int fd, bool at_exit)
360 return 0; 592 return 0;
361} 593}
362 594
363static void do_read(int fd, void *buf, size_t size) 595static int perf_header__getbuffer64(struct perf_header *self,
596 int fd, void *buf, size_t size)
364{ 597{
365 while (size) { 598 if (do_read(fd, buf, size) <= 0)
366 int ret = read(fd, buf, size); 599 return -1;
367 600
368 if (ret < 0) 601 if (self->needs_swap)
369 die("failed to read"); 602 mem_bswap_64(buf, size);
370 if (ret == 0)
371 die("failed to read: missing data");
372 603
373 size -= ret; 604 return 0;
374 buf += ret;
375 }
376} 605}
377 606
378int perf_header__process_sections(struct perf_header *self, int fd, 607int perf_header__process_sections(struct perf_header *self, int fd,
379 int (*process)(struct perf_file_section *self, 608 int (*process)(struct perf_file_section *self,
609 struct perf_header *ph,
380 int feat, int fd)) 610 int feat, int fd))
381{ 611{
382 struct perf_file_section *feat_sec; 612 struct perf_file_section *feat_sec;
383 int nr_sections; 613 int nr_sections;
384 int sec_size; 614 int sec_size;
385 int idx = 0; 615 int idx = 0;
386 int err = 0, feat = 1; 616 int err = -1, feat = 1;
387 617
388 nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS); 618 nr_sections = bitmap_weight(self->adds_features, HEADER_FEAT_BITS);
389 if (!nr_sections) 619 if (!nr_sections)
@@ -397,33 +627,45 @@ int perf_header__process_sections(struct perf_header *self, int fd,
397 627
398 lseek(fd, self->data_offset + self->data_size, SEEK_SET); 628 lseek(fd, self->data_offset + self->data_size, SEEK_SET);
399 629
400 do_read(fd, feat_sec, sec_size); 630 if (perf_header__getbuffer64(self, fd, feat_sec, sec_size))
631 goto out_free;
401 632
633 err = 0;
402 while (idx < nr_sections && feat < HEADER_LAST_FEATURE) { 634 while (idx < nr_sections && feat < HEADER_LAST_FEATURE) {
403 if (perf_header__has_feat(self, feat)) { 635 if (perf_header__has_feat(self, feat)) {
404 struct perf_file_section *sec = &feat_sec[idx++]; 636 struct perf_file_section *sec = &feat_sec[idx++];
405 637
406 err = process(sec, feat, fd); 638 err = process(sec, self, feat, fd);
407 if (err < 0) 639 if (err < 0)
408 break; 640 break;
409 } 641 }
410 ++feat; 642 ++feat;
411 } 643 }
412 644out_free:
413 free(feat_sec); 645 free(feat_sec);
414 return err; 646 return err;
415}; 647}
416 648
417int perf_file_header__read(struct perf_file_header *self, 649int perf_file_header__read(struct perf_file_header *self,
418 struct perf_header *ph, int fd) 650 struct perf_header *ph, int fd)
419{ 651{
420 lseek(fd, 0, SEEK_SET); 652 lseek(fd, 0, SEEK_SET);
421 do_read(fd, self, sizeof(*self));
422 653
423 if (self->magic != PERF_MAGIC || 654 if (do_read(fd, self, sizeof(*self)) <= 0 ||
424 self->attr_size != sizeof(struct perf_file_attr)) 655 memcmp(&self->magic, __perf_magic, sizeof(self->magic)))
425 return -1; 656 return -1;
426 657
658 if (self->attr_size != sizeof(struct perf_file_attr)) {
659 u64 attr_size = bswap_64(self->attr_size);
660
661 if (attr_size != sizeof(struct perf_file_attr))
662 return -1;
663
664 mem_bswap_64(self, offsetof(struct perf_file_header,
665 adds_features));
666 ph->needs_swap = true;
667 }
668
427 if (self->size != sizeof(*self)) { 669 if (self->size != sizeof(*self)) {
428 /* Support the previous format */ 670 /* Support the previous format */
429 if (self->size == offsetof(typeof(*self), adds_features)) 671 if (self->size == offsetof(typeof(*self), adds_features))
@@ -433,19 +675,118 @@ int perf_file_header__read(struct perf_file_header *self,
433 } 675 }
434 676
435 memcpy(&ph->adds_features, &self->adds_features, 677 memcpy(&ph->adds_features, &self->adds_features,
436 sizeof(self->adds_features)); 678 sizeof(ph->adds_features));
679 /*
680 * FIXME: hack that assumes that if we need swap the perf.data file
681 * may be coming from an arch with a different word-size, ergo different
682 * DEFINE_BITMAP format, investigate more later, but for now its mostly
683 * safe to assume that we have a build-id section. Trace files probably
684 * have several other issues in this realm anyway...
685 */
686 if (ph->needs_swap) {
687 memset(&ph->adds_features, 0, sizeof(ph->adds_features));
688 perf_header__set_feat(ph, HEADER_BUILD_ID);
689 }
437 690
438 ph->event_offset = self->event_types.offset; 691 ph->event_offset = self->event_types.offset;
439 ph->event_size = self->event_types.size; 692 ph->event_size = self->event_types.size;
440 ph->data_offset = self->data.offset; 693 ph->data_offset = self->data.offset;
441 ph->data_size = self->data.size; 694 ph->data_size = self->data.size;
442 return 0; 695 return 0;
443} 696}
444 697
698static int __event_process_build_id(struct build_id_event *bev,
699 char *filename,
700 struct perf_session *session)
701{
702 int err = -1;
703 struct list_head *head;
704 struct machine *machine;
705 u16 misc;
706 struct dso *dso;
707 enum dso_kernel_type dso_type;
708
709 machine = perf_session__findnew_machine(session, bev->pid);
710 if (!machine)
711 goto out;
712
713 misc = bev->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
714
715 switch (misc) {
716 case PERF_RECORD_MISC_KERNEL:
717 dso_type = DSO_TYPE_KERNEL;
718 head = &machine->kernel_dsos;
719 break;
720 case PERF_RECORD_MISC_GUEST_KERNEL:
721 dso_type = DSO_TYPE_GUEST_KERNEL;
722 head = &machine->kernel_dsos;
723 break;
724 case PERF_RECORD_MISC_USER:
725 case PERF_RECORD_MISC_GUEST_USER:
726 dso_type = DSO_TYPE_USER;
727 head = &machine->user_dsos;
728 break;
729 default:
730 goto out;
731 }
732
733 dso = __dsos__findnew(head, filename);
734 if (dso != NULL) {
735 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
736
737 dso__set_build_id(dso, &bev->build_id);
738
739 if (filename[0] == '[')
740 dso->kernel = dso_type;
741
742 build_id__sprintf(dso->build_id, sizeof(dso->build_id),
743 sbuild_id);
744 pr_debug("build id event received for %s: %s\n",
745 dso->long_name, sbuild_id);
746 }
747
748 err = 0;
749out:
750 return err;
751}
752
753static int perf_header__read_build_ids(struct perf_header *self,
754 int input, u64 offset, u64 size)
755{
756 struct perf_session *session = container_of(self,
757 struct perf_session, header);
758 struct build_id_event bev;
759 char filename[PATH_MAX];
760 u64 limit = offset + size;
761 int err = -1;
762
763 while (offset < limit) {
764 ssize_t len;
765
766 if (read(input, &bev, sizeof(bev)) != sizeof(bev))
767 goto out;
768
769 if (self->needs_swap)
770 perf_event_header__bswap(&bev.header);
771
772 len = bev.header.size - sizeof(bev);
773 if (read(input, filename, len) != len)
774 goto out;
775
776 __event_process_build_id(&bev, filename, session);
777
778 offset += bev.header.size;
779 }
780 err = 0;
781out:
782 return err;
783}
784
445static int perf_file_section__process(struct perf_file_section *self, 785static int perf_file_section__process(struct perf_file_section *self,
786 struct perf_header *ph,
446 int feat, int fd) 787 int feat, int fd)
447{ 788{
448 if (lseek(fd, self->offset, SEEK_SET) < 0) { 789 if (lseek(fd, self->offset, SEEK_SET) == (off_t)-1) {
449 pr_debug("Failed to lseek to %Ld offset for feature %d, " 790 pr_debug("Failed to lseek to %Ld offset for feature %d, "
450 "continuing...\n", self->offset, feat); 791 "continuing...\n", self->offset, feat);
451 return 0; 792 return 0;
@@ -453,11 +794,11 @@ static int perf_file_section__process(struct perf_file_section *self,
453 794
454 switch (feat) { 795 switch (feat) {
455 case HEADER_TRACE_INFO: 796 case HEADER_TRACE_INFO:
456 trace_report(fd); 797 trace_report(fd, false);
457 break; 798 break;
458 799
459 case HEADER_BUILD_ID: 800 case HEADER_BUILD_ID:
460 if (perf_header__read_build_ids(fd, self->offset, self->size)) 801 if (perf_header__read_build_ids(ph, fd, self->offset, self->size))
461 pr_debug("Failed to read buildids, continuing...\n"); 802 pr_debug("Failed to read buildids, continuing...\n");
462 break; 803 break;
463 default: 804 default:
@@ -467,13 +808,56 @@ static int perf_file_section__process(struct perf_file_section *self,
467 return 0; 808 return 0;
468} 809}
469 810
470int perf_header__read(struct perf_header *self, int fd) 811static int perf_file_header__read_pipe(struct perf_pipe_file_header *self,
812 struct perf_header *ph, int fd,
813 bool repipe)
471{ 814{
472 struct perf_file_header f_header; 815 if (do_read(fd, self, sizeof(*self)) <= 0 ||
816 memcmp(&self->magic, __perf_magic, sizeof(self->magic)))
817 return -1;
818
819 if (repipe && do_write(STDOUT_FILENO, self, sizeof(*self)) < 0)
820 return -1;
821
822 if (self->size != sizeof(*self)) {
823 u64 size = bswap_64(self->size);
824
825 if (size != sizeof(*self))
826 return -1;
827
828 ph->needs_swap = true;
829 }
830
831 return 0;
832}
833
834static int perf_header__read_pipe(struct perf_session *session, int fd)
835{
836 struct perf_header *self = &session->header;
837 struct perf_pipe_file_header f_header;
838
839 if (perf_file_header__read_pipe(&f_header, self, fd,
840 session->repipe) < 0) {
841 pr_debug("incompatible file format\n");
842 return -EINVAL;
843 }
844
845 session->fd = fd;
846
847 return 0;
848}
849
850int perf_header__read(struct perf_session *session, int fd)
851{
852 struct perf_header *self = &session->header;
853 struct perf_file_header f_header;
473 struct perf_file_attr f_attr; 854 struct perf_file_attr f_attr;
474 u64 f_id; 855 u64 f_id;
475 int nr_attrs, nr_ids, i, j; 856 int nr_attrs, nr_ids, i, j;
476 857
858 if (session->fd_pipe)
859 return perf_header__read_pipe(session, fd);
860
477 if (perf_file_header__read(&f_header, self, fd) < 0) { 861 if (perf_file_header__read(&f_header, self, fd) < 0) {
478 pr_debug("incompatible file format\n"); 862 pr_debug("incompatible file format\n");
479 return -EINVAL; 863 return -EINVAL;
@@ -486,7 +870,9 @@ int perf_header__read(struct perf_header *self, int fd)
486 struct perf_header_attr *attr; 870 struct perf_header_attr *attr;
487 off_t tmp; 871 off_t tmp;
488 872
489 do_read(fd, &f_attr, sizeof(f_attr)); 873 if (perf_header__getbuffer64(self, fd, &f_attr, sizeof(f_attr)))
874 goto out_errno;
875
490 tmp = lseek(fd, 0, SEEK_CUR); 876 tmp = lseek(fd, 0, SEEK_CUR);
491 877
492 attr = perf_header_attr__new(&f_attr.attr); 878 attr = perf_header_attr__new(&f_attr.attr);
@@ -497,7 +883,8 @@ int perf_header__read(struct perf_header *self, int fd)
497 lseek(fd, f_attr.ids.offset, SEEK_SET); 883 lseek(fd, f_attr.ids.offset, SEEK_SET);
498 884
499 for (j = 0; j < nr_ids; j++) { 885 for (j = 0; j < nr_ids; j++) {
500 do_read(fd, &f_id, sizeof(f_id)); 886 if (perf_header__getbuffer64(self, fd, &f_id, sizeof(f_id)))
887 goto out_errno;
501 888
502 if (perf_header_attr__add_id(attr, f_id) < 0) { 889 if (perf_header_attr__add_id(attr, f_id) < 0) {
503 perf_header_attr__delete(attr); 890 perf_header_attr__delete(attr);
@@ -517,7 +904,9 @@ int perf_header__read(struct perf_header *self, int fd)
517 events = malloc(f_header.event_types.size); 904 events = malloc(f_header.event_types.size);
518 if (events == NULL) 905 if (events == NULL)
519 return -ENOMEM; 906 return -ENOMEM;
520 do_read(fd, events, f_header.event_types.size); 907 if (perf_header__getbuffer64(self, fd, events,
908 f_header.event_types.size))
909 goto out_errno;
521 event_count = f_header.event_types.size / sizeof(struct perf_trace_event_type); 910 event_count = f_header.event_types.size / sizeof(struct perf_trace_event_type);
522 } 911 }
523 912
@@ -527,6 +916,8 @@ int perf_header__read(struct perf_header *self, int fd)
527 916
528 self->frozen = 1; 917 self->frozen = 1;
529 return 0; 918 return 0;
919out_errno:
920 return -errno;
530} 921}
531 922
532u64 perf_header__sample_type(struct perf_header *header) 923u64 perf_header__sample_type(struct perf_header *header)
@@ -551,6 +942,14 @@ perf_header__find_attr(u64 id, struct perf_header *header)
551{ 942{
552 int i; 943 int i;
553 944
945 /*
946 * We set id to -1 if the data file doesn't contain sample
947 * ids. Check for this and avoid walking through the entire
948 * list of ids which may be large.
949 */
950 if (id == -1ULL)
951 return NULL;
952
554 for (i = 0; i < header->attrs; i++) { 953 for (i = 0; i < header->attrs; i++) {
555 struct perf_header_attr *attr = header->attr[i]; 954 struct perf_header_attr *attr = header->attr[i];
556 int j; 955 int j;
@@ -563,3 +962,231 @@ perf_header__find_attr(u64 id, struct perf_header *header)
563 962
564 return NULL; 963 return NULL;
565} 964}
965
966int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id,
967 event__handler_t process,
968 struct perf_session *session)
969{
970 event_t *ev;
971 size_t size;
972 int err;
973
974 size = sizeof(struct perf_event_attr);
975 size = ALIGN(size, sizeof(u64));
976 size += sizeof(struct perf_event_header);
977 size += ids * sizeof(u64);
978
979 ev = malloc(size);
980
981 ev->attr.attr = *attr;
982 memcpy(ev->attr.id, id, ids * sizeof(u64));
983
984 ev->attr.header.type = PERF_RECORD_HEADER_ATTR;
985 ev->attr.header.size = size;
986
987 err = process(ev, session);
988
989 free(ev);
990
991 return err;
992}
993
994int event__synthesize_attrs(struct perf_header *self,
995 event__handler_t process,
996 struct perf_session *session)
997{
998 struct perf_header_attr *attr;
999 int i, err = 0;
1000
1001 for (i = 0; i < self->attrs; i++) {
1002 attr = self->attr[i];
1003
1004 err = event__synthesize_attr(&attr->attr, attr->ids, attr->id,
1005 process, session);
1006 if (err) {
1007 pr_debug("failed to create perf header attribute\n");
1008 return err;
1009 }
1010 }
1011
1012 return err;
1013}
1014
1015int event__process_attr(event_t *self, struct perf_session *session)
1016{
1017 struct perf_header_attr *attr;
1018 unsigned int i, ids, n_ids;
1019
1020 attr = perf_header_attr__new(&self->attr.attr);
1021 if (attr == NULL)
1022 return -ENOMEM;
1023
1024 ids = self->header.size;
1025 ids -= (void *)&self->attr.id - (void *)self;
1026 n_ids = ids / sizeof(u64);
1027
1028 for (i = 0; i < n_ids; i++) {
1029 if (perf_header_attr__add_id(attr, self->attr.id[i]) < 0) {
1030 perf_header_attr__delete(attr);
1031 return -ENOMEM;
1032 }
1033 }
1034
1035 if (perf_header__add_attr(&session->header, attr) < 0) {
1036 perf_header_attr__delete(attr);
1037 return -ENOMEM;
1038 }
1039
1040 perf_session__update_sample_type(session);
1041
1042 return 0;
1043}
1044
1045int event__synthesize_event_type(u64 event_id, char *name,
1046 event__handler_t process,
1047 struct perf_session *session)
1048{
1049 event_t ev;
1050 size_t size = 0;
1051 int err = 0;
1052
1053 memset(&ev, 0, sizeof(ev));
1054
1055 ev.event_type.event_type.event_id = event_id;
1056 memset(ev.event_type.event_type.name, 0, MAX_EVENT_NAME);
1057 strncpy(ev.event_type.event_type.name, name, MAX_EVENT_NAME - 1);
1058
1059 ev.event_type.header.type = PERF_RECORD_HEADER_EVENT_TYPE;
1060 size = strlen(name);
1061 size = ALIGN(size, sizeof(u64));
1062 ev.event_type.header.size = sizeof(ev.event_type) -
1063 (sizeof(ev.event_type.event_type.name) - size);
1064
1065 err = process(&ev, session);
1066
1067 return err;
1068}
1069
1070int event__synthesize_event_types(event__handler_t process,
1071 struct perf_session *session)
1072{
1073 struct perf_trace_event_type *type;
1074 int i, err = 0;
1075
1076 for (i = 0; i < event_count; i++) {
1077 type = &events[i];
1078
1079 err = event__synthesize_event_type(type->event_id, type->name,
1080 process, session);
1081 if (err) {
1082 pr_debug("failed to create perf header event type\n");
1083 return err;
1084 }
1085 }
1086
1087 return err;
1088}
1089
1090int event__process_event_type(event_t *self,
1091 struct perf_session *session __unused)
1092{
1093 if (perf_header__push_event(self->event_type.event_type.event_id,
1094 self->event_type.event_type.name) < 0)
1095 return -ENOMEM;
1096
1097 return 0;
1098}
1099
1100int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs,
1101 int nb_events,
1102 event__handler_t process,
1103 struct perf_session *session __unused)
1104{
1105 event_t ev;
1106 ssize_t size = 0, aligned_size = 0, padding;
1107 int err = 0;
1108
1109 memset(&ev, 0, sizeof(ev));
1110
1111 ev.tracing_data.header.type = PERF_RECORD_HEADER_TRACING_DATA;
1112 size = read_tracing_data_size(fd, pattrs, nb_events);
1113 if (size <= 0)
1114 return size;
1115 aligned_size = ALIGN(size, sizeof(u64));
1116 padding = aligned_size - size;
1117 ev.tracing_data.header.size = sizeof(ev.tracing_data);
1118 ev.tracing_data.size = aligned_size;
1119
1120 process(&ev, session);
1121
1122 err = read_tracing_data(fd, pattrs, nb_events);
1123 write_padded(fd, NULL, 0, padding);
1124
1125 return aligned_size;
1126}
1127
1128int event__process_tracing_data(event_t *self,
1129 struct perf_session *session)
1130{
1131 ssize_t size_read, padding, size = self->tracing_data.size;
1132 off_t offset = lseek(session->fd, 0, SEEK_CUR);
1133 char buf[BUFSIZ];
1134
1135 /* setup for reading amidst mmap */
1136 lseek(session->fd, offset + sizeof(struct tracing_data_event),
1137 SEEK_SET);
1138
1139 size_read = trace_report(session->fd, session->repipe);
1140
1141 padding = ALIGN(size_read, sizeof(u64)) - size_read;
1142
1143 if (read(session->fd, buf, padding) < 0)
1144 die("reading input file");
1145 if (session->repipe) {
1146 int retw = write(STDOUT_FILENO, buf, padding);
1147 if (retw <= 0 || retw != padding)
1148 die("repiping tracing data padding");
1149 }
1150
1151 if (size_read + padding != size)
1152 die("tracing data size mismatch");
1153
1154 return size_read + padding;
1155}
1156
1157int event__synthesize_build_id(struct dso *pos, u16 misc,
1158 event__handler_t process,
1159 struct machine *machine,
1160 struct perf_session *session)
1161{
1162 event_t ev;
1163 size_t len;
1164 int err = 0;
1165
1166 if (!pos->hit)
1167 return err;
1168
1169 memset(&ev, 0, sizeof(ev));
1170
1171 len = pos->long_name_len + 1;
1172 len = ALIGN(len, NAME_ALIGN);
1173 memcpy(&ev.build_id.build_id, pos->build_id, sizeof(pos->build_id));
1174 ev.build_id.header.type = PERF_RECORD_HEADER_BUILD_ID;
1175 ev.build_id.header.misc = misc;
1176 ev.build_id.pid = machine->pid;
1177 ev.build_id.header.size = sizeof(ev.build_id) + len;
1178 memcpy(&ev.build_id.filename, pos->long_name, pos->long_name_len);
1179
1180 err = process(&ev, session);
1181
1182 return err;
1183}
1184
1185int event__process_build_id(event_t *self,
1186 struct perf_session *session)
1187{
1188 __event_process_build_id(&self->build_id,
1189 self->build_id.filename,
1190 session);
1191 return 0;
1192}
diff --git a/tools/perf/util/header.h b/tools/perf/util/header.h
index d118d05d3abe..402ac2454cf8 100644
--- a/tools/perf/util/header.h
+++ b/tools/perf/util/header.h
@@ -5,6 +5,7 @@
5#include <sys/types.h> 5#include <sys/types.h>
6#include <stdbool.h> 6#include <stdbool.h>
7#include "types.h" 7#include "types.h"
8#include "event.h"
8 9
9#include <linux/bitmap.h> 10#include <linux/bitmap.h>
10 11
@@ -38,6 +39,11 @@ struct perf_file_header {
38 DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS); 39 DECLARE_BITMAP(adds_features, HEADER_FEAT_BITS);
39}; 40};
40 41
42struct perf_pipe_file_header {
43 u64 magic;
44 u64 size;
45};
46
41struct perf_header; 47struct perf_header;
42 48
43int perf_file_header__read(struct perf_file_header *self, 49int perf_file_header__read(struct perf_file_header *self,
@@ -46,6 +52,7 @@ int perf_file_header__read(struct perf_file_header *self,
46struct perf_header { 52struct perf_header {
47 int frozen; 53 int frozen;
48 int attrs, size; 54 int attrs, size;
55 bool needs_swap;
49 struct perf_header_attr **attr; 56 struct perf_header_attr **attr;
50 s64 attr_offset; 57 s64 attr_offset;
51 u64 data_offset; 58 u64 data_offset;
@@ -58,13 +65,14 @@ struct perf_header {
58int perf_header__init(struct perf_header *self); 65int perf_header__init(struct perf_header *self);
59void perf_header__exit(struct perf_header *self); 66void perf_header__exit(struct perf_header *self);
60 67
61int perf_header__read(struct perf_header *self, int fd); 68int perf_header__read(struct perf_session *session, int fd);
62int perf_header__write(struct perf_header *self, int fd, bool at_exit); 69int perf_header__write(struct perf_header *self, int fd, bool at_exit);
70int perf_header__write_pipe(int fd);
63 71
64int perf_header__add_attr(struct perf_header *self, 72int perf_header__add_attr(struct perf_header *self,
65 struct perf_header_attr *attr); 73 struct perf_header_attr *attr);
66 74
67void perf_header__push_event(u64 id, const char *name); 75int perf_header__push_event(u64 id, const char *name);
68char *perf_header__find_event(u64 id); 76char *perf_header__find_event(u64 id);
69 77
70struct perf_header_attr *perf_header_attr__new(struct perf_event_attr *attr); 78struct perf_header_attr *perf_header_attr__new(struct perf_event_attr *attr);
@@ -80,6 +88,40 @@ bool perf_header__has_feat(const struct perf_header *self, int feat);
80 88
81int perf_header__process_sections(struct perf_header *self, int fd, 89int perf_header__process_sections(struct perf_header *self, int fd,
82 int (*process)(struct perf_file_section *self, 90 int (*process)(struct perf_file_section *self,
91 struct perf_header *ph,
83 int feat, int fd)); 92 int feat, int fd));
84 93
94int build_id_cache__add_s(const char *sbuild_id, const char *debugdir,
95 const char *name, bool is_kallsyms);
96int build_id_cache__remove_s(const char *sbuild_id, const char *debugdir);
97
98int event__synthesize_attr(struct perf_event_attr *attr, u16 ids, u64 *id,
99 event__handler_t process,
100 struct perf_session *session);
101int event__synthesize_attrs(struct perf_header *self,
102 event__handler_t process,
103 struct perf_session *session);
104int event__process_attr(event_t *self, struct perf_session *session);
105
106int event__synthesize_event_type(u64 event_id, char *name,
107 event__handler_t process,
108 struct perf_session *session);
109int event__synthesize_event_types(event__handler_t process,
110 struct perf_session *session);
111int event__process_event_type(event_t *self,
112 struct perf_session *session);
113
114int event__synthesize_tracing_data(int fd, struct perf_event_attr *pattrs,
115 int nb_events,
116 event__handler_t process,
117 struct perf_session *session);
118int event__process_tracing_data(event_t *self,
119 struct perf_session *session);
120
121int event__synthesize_build_id(struct dso *pos, u16 misc,
122 event__handler_t process,
123 struct machine *machine,
124 struct perf_session *session);
125int event__process_build_id(event_t *self, struct perf_session *session);
126
85#endif /* __PERF_HEADER_H */ 127#endif /* __PERF_HEADER_H */
diff --git a/tools/perf/util/help.c b/tools/perf/util/help.c
index fbb00978b2e2..6f2975a00358 100644
--- a/tools/perf/util/help.c
+++ b/tools/perf/util/help.c
@@ -4,28 +4,6 @@
4#include "levenshtein.h" 4#include "levenshtein.h"
5#include "help.h" 5#include "help.h"
6 6
7/* most GUI terminals set COLUMNS (although some don't export it) */
8static int term_columns(void)
9{
10 char *col_string = getenv("COLUMNS");
11 int n_cols;
12
13 if (col_string && (n_cols = atoi(col_string)) > 0)
14 return n_cols;
15
16#ifdef TIOCGWINSZ
17 {
18 struct winsize ws;
19 if (!ioctl(1, TIOCGWINSZ, &ws)) {
20 if (ws.ws_col)
21 return ws.ws_col;
22 }
23 }
24#endif
25
26 return 80;
27}
28
29void add_cmdname(struct cmdnames *cmds, const char *name, size_t len) 7void add_cmdname(struct cmdnames *cmds, const char *name, size_t len)
30{ 8{
31 struct cmdname *ent = malloc(sizeof(*ent) + len + 1); 9 struct cmdname *ent = malloc(sizeof(*ent) + len + 1);
@@ -96,9 +74,13 @@ static void pretty_print_string_list(struct cmdnames *cmds, int longest)
96{ 74{
97 int cols = 1, rows; 75 int cols = 1, rows;
98 int space = longest + 1; /* min 1 SP between words */ 76 int space = longest + 1; /* min 1 SP between words */
99 int max_cols = term_columns() - 1; /* don't print *on* the edge */ 77 struct winsize win;
78 int max_cols;
100 int i, j; 79 int i, j;
101 80
81 get_term_dimensions(&win);
82 max_cols = win.ws_col - 1; /* don't print *on* the edge */
83
102 if (space < max_cols) 84 if (space < max_cols)
103 cols = max_cols / space; 85 cols = max_cols / space;
104 rows = (cmds->cnt + cols - 1) / cols; 86 rows = (cmds->cnt + cols - 1) / cols;
@@ -324,7 +306,7 @@ const char *help_unknown_cmd(const char *cmd)
324 306
325 main_cmds.names[0] = NULL; 307 main_cmds.names[0] = NULL;
326 clean_cmdnames(&main_cmds); 308 clean_cmdnames(&main_cmds);
327 fprintf(stderr, "WARNING: You called a Git program named '%s', " 309 fprintf(stderr, "WARNING: You called a perf program named '%s', "
328 "which does not exist.\n" 310 "which does not exist.\n"
329 "Continuing under the assumption that you meant '%s'\n", 311 "Continuing under the assumption that you meant '%s'\n",
330 cmd, assumed); 312 cmd, assumed);
diff --git a/tools/perf/util/hist.c b/tools/perf/util/hist.c
index e8daf5ca6fd2..784ee0bdda77 100644
--- a/tools/perf/util/hist.c
+++ b/tools/perf/util/hist.c
@@ -1,3 +1,5 @@
1#include "util.h"
2#include "build-id.h"
1#include "hist.h" 3#include "hist.h"
2#include "session.h" 4#include "session.h"
3#include "sort.h" 5#include "sort.h"
@@ -8,25 +10,69 @@ struct callchain_param callchain_param = {
8 .min_percent = 0.5 10 .min_percent = 0.5
9}; 11};
10 12
13static void hist_entry__add_cpumode_period(struct hist_entry *self,
14 unsigned int cpumode, u64 period)
15{
16 switch (cpumode) {
17 case PERF_RECORD_MISC_KERNEL:
18 self->period_sys += period;
19 break;
20 case PERF_RECORD_MISC_USER:
21 self->period_us += period;
22 break;
23 case PERF_RECORD_MISC_GUEST_KERNEL:
24 self->period_guest_sys += period;
25 break;
26 case PERF_RECORD_MISC_GUEST_USER:
27 self->period_guest_us += period;
28 break;
29 default:
30 break;
31 }
32}
33
11/* 34/*
12 * histogram, sorted on item, collects counts 35 * histogram, sorted on item, collects periods
13 */ 36 */
14 37
15struct hist_entry *__perf_session__add_hist_entry(struct perf_session *self, 38static struct hist_entry *hist_entry__new(struct hist_entry *template)
16 struct addr_location *al,
17 struct symbol *sym_parent,
18 u64 count, bool *hit)
19{ 39{
20 struct rb_node **p = &self->hists.rb_node; 40 size_t callchain_size = symbol_conf.use_callchain ? sizeof(struct callchain_node) : 0;
41 struct hist_entry *self = malloc(sizeof(*self) + callchain_size);
42
43 if (self != NULL) {
44 *self = *template;
45 self->nr_events = 1;
46 if (symbol_conf.use_callchain)
47 callchain_init(self->callchain);
48 }
49
50 return self;
51}
52
53static void hists__inc_nr_entries(struct hists *self, struct hist_entry *entry)
54{
55 if (entry->ms.sym && self->max_sym_namelen < entry->ms.sym->namelen)
56 self->max_sym_namelen = entry->ms.sym->namelen;
57 ++self->nr_entries;
58}
59
60struct hist_entry *__hists__add_entry(struct hists *self,
61 struct addr_location *al,
62 struct symbol *sym_parent, u64 period)
63{
64 struct rb_node **p = &self->entries.rb_node;
21 struct rb_node *parent = NULL; 65 struct rb_node *parent = NULL;
22 struct hist_entry *he; 66 struct hist_entry *he;
23 struct hist_entry entry = { 67 struct hist_entry entry = {
24 .thread = al->thread, 68 .thread = al->thread,
25 .map = al->map, 69 .ms = {
26 .sym = al->sym, 70 .map = al->map,
71 .sym = al->sym,
72 },
27 .ip = al->addr, 73 .ip = al->addr,
28 .level = al->level, 74 .level = al->level,
29 .count = count, 75 .period = period,
30 .parent = sym_parent, 76 .parent = sym_parent,
31 }; 77 };
32 int cmp; 78 int cmp;
@@ -38,8 +84,9 @@ struct hist_entry *__perf_session__add_hist_entry(struct perf_session *self,
38 cmp = hist_entry__cmp(&entry, he); 84 cmp = hist_entry__cmp(&entry, he);
39 85
40 if (!cmp) { 86 if (!cmp) {
41 *hit = true; 87 he->period += period;
42 return he; 88 ++he->nr_events;
89 goto out;
43 } 90 }
44 91
45 if (cmp < 0) 92 if (cmp < 0)
@@ -48,13 +95,14 @@ struct hist_entry *__perf_session__add_hist_entry(struct perf_session *self,
48 p = &(*p)->rb_right; 95 p = &(*p)->rb_right;
49 } 96 }
50 97
51 he = malloc(sizeof(*he)); 98 he = hist_entry__new(&entry);
52 if (!he) 99 if (!he)
53 return NULL; 100 return NULL;
54 *he = entry;
55 rb_link_node(&he->rb_node, parent, p); 101 rb_link_node(&he->rb_node, parent, p);
56 rb_insert_color(&he->rb_node, &self->hists); 102 rb_insert_color(&he->rb_node, &self->entries);
57 *hit = false; 103 hists__inc_nr_entries(self, he);
104out:
105 hist_entry__add_cpumode_period(he, al->cpumode, period);
58 return he; 106 return he;
59} 107}
60 108
@@ -65,7 +113,7 @@ hist_entry__cmp(struct hist_entry *left, struct hist_entry *right)
65 int64_t cmp = 0; 113 int64_t cmp = 0;
66 114
67 list_for_each_entry(se, &hist_entry__sort_list, list) { 115 list_for_each_entry(se, &hist_entry__sort_list, list) {
68 cmp = se->cmp(left, right); 116 cmp = se->se_cmp(left, right);
69 if (cmp) 117 if (cmp)
70 break; 118 break;
71 } 119 }
@@ -82,7 +130,7 @@ hist_entry__collapse(struct hist_entry *left, struct hist_entry *right)
82 list_for_each_entry(se, &hist_entry__sort_list, list) { 130 list_for_each_entry(se, &hist_entry__sort_list, list) {
83 int64_t (*f)(struct hist_entry *, struct hist_entry *); 131 int64_t (*f)(struct hist_entry *, struct hist_entry *);
84 132
85 f = se->collapse ?: se->cmp; 133 f = se->se_collapse ?: se->se_cmp;
86 134
87 cmp = f(left, right); 135 cmp = f(left, right);
88 if (cmp) 136 if (cmp)
@@ -101,7 +149,7 @@ void hist_entry__free(struct hist_entry *he)
101 * collapse the histogram 149 * collapse the histogram
102 */ 150 */
103 151
104static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he) 152static bool collapse__insert_entry(struct rb_root *root, struct hist_entry *he)
105{ 153{
106 struct rb_node **p = &root->rb_node; 154 struct rb_node **p = &root->rb_node;
107 struct rb_node *parent = NULL; 155 struct rb_node *parent = NULL;
@@ -115,9 +163,9 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he)
115 cmp = hist_entry__collapse(iter, he); 163 cmp = hist_entry__collapse(iter, he);
116 164
117 if (!cmp) { 165 if (!cmp) {
118 iter->count += he->count; 166 iter->period += he->period;
119 hist_entry__free(he); 167 hist_entry__free(he);
120 return; 168 return false;
121 } 169 }
122 170
123 if (cmp < 0) 171 if (cmp < 0)
@@ -128,9 +176,10 @@ static void collapse__insert_entry(struct rb_root *root, struct hist_entry *he)
128 176
129 rb_link_node(&he->rb_node, parent, p); 177 rb_link_node(&he->rb_node, parent, p);
130 rb_insert_color(&he->rb_node, root); 178 rb_insert_color(&he->rb_node, root);
179 return true;
131} 180}
132 181
133void perf_session__collapse_resort(struct perf_session *self) 182void hists__collapse_resort(struct hists *self)
134{ 183{
135 struct rb_root tmp; 184 struct rb_root tmp;
136 struct rb_node *next; 185 struct rb_node *next;
@@ -140,72 +189,77 @@ void perf_session__collapse_resort(struct perf_session *self)
140 return; 189 return;
141 190
142 tmp = RB_ROOT; 191 tmp = RB_ROOT;
143 next = rb_first(&self->hists); 192 next = rb_first(&self->entries);
193 self->nr_entries = 0;
194 self->max_sym_namelen = 0;
144 195
145 while (next) { 196 while (next) {
146 n = rb_entry(next, struct hist_entry, rb_node); 197 n = rb_entry(next, struct hist_entry, rb_node);
147 next = rb_next(&n->rb_node); 198 next = rb_next(&n->rb_node);
148 199
149 rb_erase(&n->rb_node, &self->hists); 200 rb_erase(&n->rb_node, &self->entries);
150 collapse__insert_entry(&tmp, n); 201 if (collapse__insert_entry(&tmp, n))
202 hists__inc_nr_entries(self, n);
151 } 203 }
152 204
153 self->hists = tmp; 205 self->entries = tmp;
154} 206}
155 207
156/* 208/*
157 * reverse the map, sort on count. 209 * reverse the map, sort on period.
158 */ 210 */
159 211
160static void perf_session__insert_output_hist_entry(struct rb_root *root, 212static void __hists__insert_output_entry(struct rb_root *entries,
161 struct hist_entry *he, 213 struct hist_entry *he,
162 u64 min_callchain_hits) 214 u64 min_callchain_hits)
163{ 215{
164 struct rb_node **p = &root->rb_node; 216 struct rb_node **p = &entries->rb_node;
165 struct rb_node *parent = NULL; 217 struct rb_node *parent = NULL;
166 struct hist_entry *iter; 218 struct hist_entry *iter;
167 219
168 if (symbol_conf.use_callchain) 220 if (symbol_conf.use_callchain)
169 callchain_param.sort(&he->sorted_chain, &he->callchain, 221 callchain_param.sort(&he->sorted_chain, he->callchain,
170 min_callchain_hits, &callchain_param); 222 min_callchain_hits, &callchain_param);
171 223
172 while (*p != NULL) { 224 while (*p != NULL) {
173 parent = *p; 225 parent = *p;
174 iter = rb_entry(parent, struct hist_entry, rb_node); 226 iter = rb_entry(parent, struct hist_entry, rb_node);
175 227
176 if (he->count > iter->count) 228 if (he->period > iter->period)
177 p = &(*p)->rb_left; 229 p = &(*p)->rb_left;
178 else 230 else
179 p = &(*p)->rb_right; 231 p = &(*p)->rb_right;
180 } 232 }
181 233
182 rb_link_node(&he->rb_node, parent, p); 234 rb_link_node(&he->rb_node, parent, p);
183 rb_insert_color(&he->rb_node, root); 235 rb_insert_color(&he->rb_node, entries);
184} 236}
185 237
186void perf_session__output_resort(struct perf_session *self, u64 total_samples) 238void hists__output_resort(struct hists *self)
187{ 239{
188 struct rb_root tmp; 240 struct rb_root tmp;
189 struct rb_node *next; 241 struct rb_node *next;
190 struct hist_entry *n; 242 struct hist_entry *n;
191 u64 min_callchain_hits; 243 u64 min_callchain_hits;
192 244
193 min_callchain_hits = 245 min_callchain_hits = self->stats.total_period * (callchain_param.min_percent / 100);
194 total_samples * (callchain_param.min_percent / 100);
195 246
196 tmp = RB_ROOT; 247 tmp = RB_ROOT;
197 next = rb_first(&self->hists); 248 next = rb_first(&self->entries);
249
250 self->nr_entries = 0;
251 self->max_sym_namelen = 0;
198 252
199 while (next) { 253 while (next) {
200 n = rb_entry(next, struct hist_entry, rb_node); 254 n = rb_entry(next, struct hist_entry, rb_node);
201 next = rb_next(&n->rb_node); 255 next = rb_next(&n->rb_node);
202 256
203 rb_erase(&n->rb_node, &self->hists); 257 rb_erase(&n->rb_node, &self->entries);
204 perf_session__insert_output_hist_entry(&tmp, n, 258 __hists__insert_output_entry(&tmp, n, min_callchain_hits);
205 min_callchain_hits); 259 hists__inc_nr_entries(self, n);
206 } 260 }
207 261
208 self->hists = tmp; 262 self->entries = tmp;
209} 263}
210 264
211static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin) 265static size_t callchain__fprintf_left_margin(FILE *fp, int left_margin)
@@ -237,7 +291,7 @@ static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask,
237} 291}
238 292
239static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, 293static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain,
240 int depth, int depth_mask, int count, 294 int depth, int depth_mask, int period,
241 u64 total_samples, int hits, 295 u64 total_samples, int hits,
242 int left_margin) 296 int left_margin)
243{ 297{
@@ -250,7 +304,7 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain,
250 ret += fprintf(fp, "|"); 304 ret += fprintf(fp, "|");
251 else 305 else
252 ret += fprintf(fp, " "); 306 ret += fprintf(fp, " ");
253 if (!count && i == depth - 1) { 307 if (!period && i == depth - 1) {
254 double percent; 308 double percent;
255 309
256 percent = hits * 100.0 / total_samples; 310 percent = hits * 100.0 / total_samples;
@@ -258,8 +312,8 @@ static size_t ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain,
258 } else 312 } else
259 ret += fprintf(fp, "%s", " "); 313 ret += fprintf(fp, "%s", " ");
260 } 314 }
261 if (chain->sym) 315 if (chain->ms.sym)
262 ret += fprintf(fp, "%s\n", chain->sym->name); 316 ret += fprintf(fp, "%s\n", chain->ms.sym->name);
263 else 317 else
264 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip); 318 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip);
265 319
@@ -278,7 +332,7 @@ static void init_rem_hits(void)
278 } 332 }
279 333
280 strcpy(rem_sq_bracket->name, "[...]"); 334 strcpy(rem_sq_bracket->name, "[...]");
281 rem_hits.sym = rem_sq_bracket; 335 rem_hits.ms.sym = rem_sq_bracket;
282} 336}
283 337
284static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self, 338static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
@@ -293,6 +347,7 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
293 u64 remaining; 347 u64 remaining;
294 size_t ret = 0; 348 size_t ret = 0;
295 int i; 349 int i;
350 uint entries_printed = 0;
296 351
297 if (callchain_param.mode == CHAIN_GRAPH_REL) 352 if (callchain_param.mode == CHAIN_GRAPH_REL)
298 new_total = self->children_hit; 353 new_total = self->children_hit;
@@ -321,15 +376,13 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
321 new_depth_mask &= ~(1 << (depth - 1)); 376 new_depth_mask &= ~(1 << (depth - 1));
322 377
323 /* 378 /*
324 * But we keep the older depth mask for the line seperator 379 * But we keep the older depth mask for the line separator
325 * to keep the level link until we reach the last child 380 * to keep the level link until we reach the last child
326 */ 381 */
327 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask, 382 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask,
328 left_margin); 383 left_margin);
329 i = 0; 384 i = 0;
330 list_for_each_entry(chain, &child->val, list) { 385 list_for_each_entry(chain, &child->val, list) {
331 if (chain->ip >= PERF_CONTEXT_MAX)
332 continue;
333 ret += ipchain__fprintf_graph(fp, chain, depth, 386 ret += ipchain__fprintf_graph(fp, chain, depth,
334 new_depth_mask, i++, 387 new_depth_mask, i++,
335 new_total, 388 new_total,
@@ -341,6 +394,8 @@ static size_t __callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
341 new_depth_mask | (1 << depth), 394 new_depth_mask | (1 << depth),
342 left_margin); 395 left_margin);
343 node = next; 396 node = next;
397 if (++entries_printed == callchain_param.print_limit)
398 break;
344 } 399 }
345 400
346 if (callchain_param.mode == CHAIN_GRAPH_REL && 401 if (callchain_param.mode == CHAIN_GRAPH_REL &&
@@ -366,11 +421,9 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
366 bool printed = false; 421 bool printed = false;
367 int i = 0; 422 int i = 0;
368 int ret = 0; 423 int ret = 0;
424 u32 entries_printed = 0;
369 425
370 list_for_each_entry(chain, &self->val, list) { 426 list_for_each_entry(chain, &self->val, list) {
371 if (chain->ip >= PERF_CONTEXT_MAX)
372 continue;
373
374 if (!i++ && sort__first_dimension == SORT_SYM) 427 if (!i++ && sort__first_dimension == SORT_SYM)
375 continue; 428 continue;
376 429
@@ -385,10 +438,13 @@ static size_t callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
385 } else 438 } else
386 ret += callchain__fprintf_left_margin(fp, left_margin); 439 ret += callchain__fprintf_left_margin(fp, left_margin);
387 440
388 if (chain->sym) 441 if (chain->ms.sym)
389 ret += fprintf(fp, " %s\n", chain->sym->name); 442 ret += fprintf(fp, " %s\n", chain->ms.sym->name);
390 else 443 else
391 ret += fprintf(fp, " %p\n", (void *)(long)chain->ip); 444 ret += fprintf(fp, " %p\n", (void *)(long)chain->ip);
445
446 if (++entries_printed == callchain_param.print_limit)
447 break;
392 } 448 }
393 449
394 ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin); 450 ret += __callchain__fprintf_graph(fp, self, total_samples, 1, 1, left_margin);
@@ -411,8 +467,8 @@ static size_t callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
411 list_for_each_entry(chain, &self->val, list) { 467 list_for_each_entry(chain, &self->val, list) {
412 if (chain->ip >= PERF_CONTEXT_MAX) 468 if (chain->ip >= PERF_CONTEXT_MAX)
413 continue; 469 continue;
414 if (chain->sym) 470 if (chain->ms.sym)
415 ret += fprintf(fp, " %s\n", chain->sym->name); 471 ret += fprintf(fp, " %s\n", chain->ms.sym->name);
416 else 472 else
417 ret += fprintf(fp, " %p\n", 473 ret += fprintf(fp, " %p\n",
418 (void *)(long)chain->ip); 474 (void *)(long)chain->ip);
@@ -427,6 +483,7 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
427 struct rb_node *rb_node; 483 struct rb_node *rb_node;
428 struct callchain_node *chain; 484 struct callchain_node *chain;
429 size_t ret = 0; 485 size_t ret = 0;
486 u32 entries_printed = 0;
430 487
431 rb_node = rb_first(&self->sorted_chain); 488 rb_node = rb_first(&self->sorted_chain);
432 while (rb_node) { 489 while (rb_node) {
@@ -449,55 +506,88 @@ static size_t hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
449 break; 506 break;
450 } 507 }
451 ret += fprintf(fp, "\n"); 508 ret += fprintf(fp, "\n");
509 if (++entries_printed == callchain_param.print_limit)
510 break;
452 rb_node = rb_next(rb_node); 511 rb_node = rb_next(rb_node);
453 } 512 }
454 513
455 return ret; 514 return ret;
456} 515}
457 516
458static size_t hist_entry__fprintf(struct hist_entry *self, 517int hist_entry__snprintf(struct hist_entry *self, char *s, size_t size,
459 struct perf_session *session, 518 struct hists *pair_hists, bool show_displacement,
460 struct perf_session *pair_session, 519 long displacement, bool color, u64 session_total)
461 bool show_displacement,
462 long displacement, FILE *fp)
463{ 520{
464 struct sort_entry *se; 521 struct sort_entry *se;
465 u64 count, total; 522 u64 period, total, period_sys, period_us, period_guest_sys, period_guest_us;
466 const char *sep = symbol_conf.field_sep; 523 const char *sep = symbol_conf.field_sep;
467 size_t ret; 524 int ret;
468 525
469 if (symbol_conf.exclude_other && !self->parent) 526 if (symbol_conf.exclude_other && !self->parent)
470 return 0; 527 return 0;
471 528
472 if (pair_session) { 529 if (pair_hists) {
473 count = self->pair ? self->pair->count : 0; 530 period = self->pair ? self->pair->period : 0;
474 total = pair_session->events_stats.total; 531 total = pair_hists->stats.total_period;
532 period_sys = self->pair ? self->pair->period_sys : 0;
533 period_us = self->pair ? self->pair->period_us : 0;
534 period_guest_sys = self->pair ? self->pair->period_guest_sys : 0;
535 period_guest_us = self->pair ? self->pair->period_guest_us : 0;
475 } else { 536 } else {
476 count = self->count; 537 period = self->period;
477 total = session->events_stats.total; 538 total = session_total;
539 period_sys = self->period_sys;
540 period_us = self->period_us;
541 period_guest_sys = self->period_guest_sys;
542 period_guest_us = self->period_guest_us;
478 } 543 }
479 544
480 if (total) 545 if (total) {
481 ret = percent_color_fprintf(fp, sep ? "%.2f" : " %6.2f%%", 546 if (color)
482 (count * 100.0) / total); 547 ret = percent_color_snprintf(s, size,
483 else 548 sep ? "%.2f" : " %6.2f%%",
484 ret = fprintf(fp, sep ? "%lld" : "%12lld ", count); 549 (period * 100.0) / total);
550 else
551 ret = snprintf(s, size, sep ? "%.2f" : " %6.2f%%",
552 (period * 100.0) / total);
553 if (symbol_conf.show_cpu_utilization) {
554 ret += percent_color_snprintf(s + ret, size - ret,
555 sep ? "%.2f" : " %6.2f%%",
556 (period_sys * 100.0) / total);
557 ret += percent_color_snprintf(s + ret, size - ret,
558 sep ? "%.2f" : " %6.2f%%",
559 (period_us * 100.0) / total);
560 if (perf_guest) {
561 ret += percent_color_snprintf(s + ret,
562 size - ret,
563 sep ? "%.2f" : " %6.2f%%",
564 (period_guest_sys * 100.0) /
565 total);
566 ret += percent_color_snprintf(s + ret,
567 size - ret,
568 sep ? "%.2f" : " %6.2f%%",
569 (period_guest_us * 100.0) /
570 total);
571 }
572 }
573 } else
574 ret = snprintf(s, size, sep ? "%lld" : "%12lld ", period);
485 575
486 if (symbol_conf.show_nr_samples) { 576 if (symbol_conf.show_nr_samples) {
487 if (sep) 577 if (sep)
488 fprintf(fp, "%c%lld", *sep, count); 578 ret += snprintf(s + ret, size - ret, "%c%lld", *sep, period);
489 else 579 else
490 fprintf(fp, "%11lld", count); 580 ret += snprintf(s + ret, size - ret, "%11lld", period);
491 } 581 }
492 582
493 if (pair_session) { 583 if (pair_hists) {
494 char bf[32]; 584 char bf[32];
495 double old_percent = 0, new_percent = 0, diff; 585 double old_percent = 0, new_percent = 0, diff;
496 586
497 if (total > 0) 587 if (total > 0)
498 old_percent = (count * 100.0) / total; 588 old_percent = (period * 100.0) / total;
499 if (session->events_stats.total > 0) 589 if (session_total > 0)
500 new_percent = (self->count * 100.0) / session->events_stats.total; 590 new_percent = (self->period * 100.0) / session_total;
501 591
502 diff = new_percent - old_percent; 592 diff = new_percent - old_percent;
503 593
@@ -507,9 +597,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self,
507 snprintf(bf, sizeof(bf), " "); 597 snprintf(bf, sizeof(bf), " ");
508 598
509 if (sep) 599 if (sep)
510 ret += fprintf(fp, "%c%s", *sep, bf); 600 ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf);
511 else 601 else
512 ret += fprintf(fp, "%11.11s", bf); 602 ret += snprintf(s + ret, size - ret, "%11.11s", bf);
513 603
514 if (show_displacement) { 604 if (show_displacement) {
515 if (displacement) 605 if (displacement)
@@ -518,9 +608,9 @@ static size_t hist_entry__fprintf(struct hist_entry *self,
518 snprintf(bf, sizeof(bf), " "); 608 snprintf(bf, sizeof(bf), " ");
519 609
520 if (sep) 610 if (sep)
521 fprintf(fp, "%c%s", *sep, bf); 611 ret += snprintf(s + ret, size - ret, "%c%s", *sep, bf);
522 else 612 else
523 fprintf(fp, "%6.6s", bf); 613 ret += snprintf(s + ret, size - ret, "%6.6s", bf);
524 } 614 }
525 } 615 }
526 616
@@ -528,32 +618,48 @@ static size_t hist_entry__fprintf(struct hist_entry *self,
528 if (se->elide) 618 if (se->elide)
529 continue; 619 continue;
530 620
531 fprintf(fp, "%s", sep ?: " "); 621 ret += snprintf(s + ret, size - ret, "%s", sep ?: " ");
532 ret += se->print(fp, self, se->width ? *se->width : 0); 622 ret += se->se_snprintf(self, s + ret, size - ret,
623 se->se_width ? *se->se_width : 0);
533 } 624 }
534 625
535 ret += fprintf(fp, "\n"); 626 return ret;
627}
536 628
537 if (symbol_conf.use_callchain) { 629int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists,
538 int left_margin = 0; 630 bool show_displacement, long displacement, FILE *fp,
631 u64 session_total)
632{
633 char bf[512];
634 int ret;
539 635
540 if (sort__first_dimension == SORT_COMM) { 636 ret = hist_entry__snprintf(self, bf, sizeof(bf), pair_hists,
541 se = list_first_entry(&hist_entry__sort_list, typeof(*se), 637 show_displacement, displacement,
542 list); 638 true, session_total);
543 left_margin = se->width ? *se->width : 0; 639 if (!ret)
544 left_margin -= thread__comm_len(self->thread); 640 return 0;
545 } 641
642 return fprintf(fp, "%s\n", bf);
643}
644
645static size_t hist_entry__fprintf_callchain(struct hist_entry *self, FILE *fp,
646 u64 session_total)
647{
648 int left_margin = 0;
546 649
547 hist_entry_callchain__fprintf(fp, self, session->events_stats.total, 650 if (sort__first_dimension == SORT_COMM) {
548 left_margin); 651 struct sort_entry *se = list_first_entry(&hist_entry__sort_list,
652 typeof(*se), list);
653 left_margin = se->se_width ? *se->se_width : 0;
654 left_margin -= thread__comm_len(self->thread);
549 } 655 }
550 656
551 return ret; 657 return hist_entry_callchain__fprintf(fp, self, session_total,
658 left_margin);
552} 659}
553 660
554size_t perf_session__fprintf_hists(struct perf_session *self, 661size_t hists__fprintf(struct hists *self, struct hists *pair,
555 struct perf_session *pair, 662 bool show_displacement, FILE *fp)
556 bool show_displacement, FILE *fp)
557{ 663{
558 struct sort_entry *se; 664 struct sort_entry *se;
559 struct rb_node *nd; 665 struct rb_node *nd;
@@ -562,7 +668,7 @@ size_t perf_session__fprintf_hists(struct perf_session *self,
562 long displacement = 0; 668 long displacement = 0;
563 unsigned int width; 669 unsigned int width;
564 const char *sep = symbol_conf.field_sep; 670 const char *sep = symbol_conf.field_sep;
565 char *col_width = symbol_conf.col_width_list_str; 671 const char *col_width = symbol_conf.col_width_list_str;
566 672
567 init_rem_hits(); 673 init_rem_hits();
568 674
@@ -575,6 +681,24 @@ size_t perf_session__fprintf_hists(struct perf_session *self,
575 fputs(" Samples ", fp); 681 fputs(" Samples ", fp);
576 } 682 }
577 683
684 if (symbol_conf.show_cpu_utilization) {
685 if (sep) {
686 ret += fprintf(fp, "%csys", *sep);
687 ret += fprintf(fp, "%cus", *sep);
688 if (perf_guest) {
689 ret += fprintf(fp, "%cguest sys", *sep);
690 ret += fprintf(fp, "%cguest us", *sep);
691 }
692 } else {
693 ret += fprintf(fp, " sys ");
694 ret += fprintf(fp, " us ");
695 if (perf_guest) {
696 ret += fprintf(fp, " guest sys ");
697 ret += fprintf(fp, " guest us ");
698 }
699 }
700 }
701
578 if (pair) { 702 if (pair) {
579 if (sep) 703 if (sep)
580 ret += fprintf(fp, "%cDelta", *sep); 704 ret += fprintf(fp, "%cDelta", *sep);
@@ -593,22 +717,22 @@ size_t perf_session__fprintf_hists(struct perf_session *self,
593 if (se->elide) 717 if (se->elide)
594 continue; 718 continue;
595 if (sep) { 719 if (sep) {
596 fprintf(fp, "%c%s", *sep, se->header); 720 fprintf(fp, "%c%s", *sep, se->se_header);
597 continue; 721 continue;
598 } 722 }
599 width = strlen(se->header); 723 width = strlen(se->se_header);
600 if (se->width) { 724 if (se->se_width) {
601 if (symbol_conf.col_width_list_str) { 725 if (symbol_conf.col_width_list_str) {
602 if (col_width) { 726 if (col_width) {
603 *se->width = atoi(col_width); 727 *se->se_width = atoi(col_width);
604 col_width = strchr(col_width, ','); 728 col_width = strchr(col_width, ',');
605 if (col_width) 729 if (col_width)
606 ++col_width; 730 ++col_width;
607 } 731 }
608 } 732 }
609 width = *se->width = max(*se->width, width); 733 width = *se->se_width = max(*se->se_width, width);
610 } 734 }
611 fprintf(fp, " %*s", width, se->header); 735 fprintf(fp, " %*s", width, se->se_header);
612 } 736 }
613 fprintf(fp, "\n"); 737 fprintf(fp, "\n");
614 738
@@ -630,10 +754,10 @@ size_t perf_session__fprintf_hists(struct perf_session *self,
630 continue; 754 continue;
631 755
632 fprintf(fp, " "); 756 fprintf(fp, " ");
633 if (se->width) 757 if (se->se_width)
634 width = *se->width; 758 width = *se->se_width;
635 else 759 else
636 width = strlen(se->header); 760 width = strlen(se->se_header);
637 for (i = 0; i < width; i++) 761 for (i = 0; i < width; i++)
638 fprintf(fp, "."); 762 fprintf(fp, ".");
639 } 763 }
@@ -641,8 +765,9 @@ size_t perf_session__fprintf_hists(struct perf_session *self,
641 fprintf(fp, "\n#\n"); 765 fprintf(fp, "\n#\n");
642 766
643print_entries: 767print_entries:
644 for (nd = rb_first(&self->hists); nd; nd = rb_next(nd)) { 768 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
645 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node); 769 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
770 int cnt;
646 771
647 if (show_displacement) { 772 if (show_displacement) {
648 if (h->pair != NULL) 773 if (h->pair != NULL)
@@ -652,11 +777,320 @@ print_entries:
652 displacement = 0; 777 displacement = 0;
653 ++position; 778 ++position;
654 } 779 }
655 ret += hist_entry__fprintf(h, self, pair, show_displacement, 780 cnt = hist_entry__fprintf(h, pair, show_displacement,
656 displacement, fp); 781 displacement, fp, self->stats.total_period);
782 /* Ignore those that didn't match the parent filter */
783 if (!cnt)
784 continue;
785
786 ret += cnt;
787
788 if (symbol_conf.use_callchain)
789 ret += hist_entry__fprintf_callchain(h, fp, self->stats.total_period);
790
791 if (h->ms.map == NULL && verbose > 1) {
792 __map_groups__fprintf_maps(&h->thread->mg,
793 MAP__FUNCTION, verbose, fp);
794 fprintf(fp, "%.10s end\n", graph_dotted_line);
795 }
657 } 796 }
658 797
659 free(rem_sq_bracket); 798 free(rem_sq_bracket);
660 799
661 return ret; 800 return ret;
662} 801}
802
/*
 * Bit positions used in hist_entry->filtered: each filter owns one bit,
 * set as (1 << HIST_FILTER__xxx) while the entry is hidden by that filter.
 */
803enum hist_filter {
804 HIST_FILTER__DSO, /* bit toggled by hists__filter_by_dso() */
805 HIST_FILTER__THREAD, /* bit toggled by hists__filter_by_thread() */
806};
807
808void hists__filter_by_dso(struct hists *self, const struct dso *dso)
809{
810 struct rb_node *nd;
811
812 self->nr_entries = self->stats.total_period = 0;
813 self->stats.nr_events[PERF_RECORD_SAMPLE] = 0;
814 self->max_sym_namelen = 0;
815
816 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
817 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
818
819 if (symbol_conf.exclude_other && !h->parent)
820 continue;
821
822 if (dso != NULL && (h->ms.map == NULL || h->ms.map->dso != dso)) {
823 h->filtered |= (1 << HIST_FILTER__DSO);
824 continue;
825 }
826
827 h->filtered &= ~(1 << HIST_FILTER__DSO);
828 if (!h->filtered) {
829 ++self->nr_entries;
830 self->stats.total_period += h->period;
831 self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events;
832 if (h->ms.sym &&
833 self->max_sym_namelen < h->ms.sym->namelen)
834 self->max_sym_namelen = h->ms.sym->namelen;
835 }
836 }
837}
838
839void hists__filter_by_thread(struct hists *self, const struct thread *thread)
840{
841 struct rb_node *nd;
842
843 self->nr_entries = self->stats.total_period = 0;
844 self->stats.nr_events[PERF_RECORD_SAMPLE] = 0;
845 self->max_sym_namelen = 0;
846
847 for (nd = rb_first(&self->entries); nd; nd = rb_next(nd)) {
848 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
849
850 if (thread != NULL && h->thread != thread) {
851 h->filtered |= (1 << HIST_FILTER__THREAD);
852 continue;
853 }
854 h->filtered &= ~(1 << HIST_FILTER__THREAD);
855 if (!h->filtered) {
856 ++self->nr_entries;
857 self->stats.total_period += h->period;
858 self->stats.nr_events[PERF_RECORD_SAMPLE] += h->nr_events;
859 if (h->ms.sym &&
860 self->max_sym_namelen < h->ms.sym->namelen)
861 self->max_sym_namelen = h->ms.sym->namelen;
862 }
863 }
864}
865
866static int symbol__alloc_hist(struct symbol *self)
867{
868 struct sym_priv *priv = symbol__priv(self);
869 const int size = (sizeof(*priv->hist) +
870 (self->end - self->start) * sizeof(u64));
871
872 priv->hist = zalloc(size);
873 return priv->hist == NULL ? -1 : 0;
874}
875
876int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip)
877{
878 unsigned int sym_size, offset;
879 struct symbol *sym = self->ms.sym;
880 struct sym_priv *priv;
881 struct sym_hist *h;
882
883 if (!sym || !self->ms.map)
884 return 0;
885
886 priv = symbol__priv(sym);
887 if (priv->hist == NULL && symbol__alloc_hist(sym) < 0)
888 return -ENOMEM;
889
890 sym_size = sym->end - sym->start;
891 offset = ip - sym->start;
892
893 pr_debug3("%s: ip=%#Lx\n", __func__, self->ms.map->unmap_ip(self->ms.map, ip));
894
895 if (offset >= sym_size)
896 return 0;
897
898 h = priv->hist;
899 h->sum++;
900 h->ip[offset]++;
901
902 pr_debug3("%#Lx %s: period++ [ip: %#Lx, %#Lx] => %Ld\n", self->ms.sym->start,
903 self->ms.sym->name, ip, ip - self->ms.sym->start, h->ip[offset]);
904 return 0;
905}
906
907static struct objdump_line *objdump_line__new(s64 offset, char *line)
908{
909 struct objdump_line *self = malloc(sizeof(*self));
910
911 if (self != NULL) {
912 self->offset = offset;
913 self->line = line;
914 }
915
916 return self;
917}
918
919void objdump_line__free(struct objdump_line *self)
920{
921 free(self->line);
922 free(self);
923}
924
925static void objdump__add_line(struct list_head *head, struct objdump_line *line)
926{
927 list_add_tail(&line->node, head);
928}
929
930struct objdump_line *objdump__get_next_ip_line(struct list_head *head,
931 struct objdump_line *pos)
932{
933 list_for_each_entry_continue(pos, head, node)
934 if (pos->offset >= 0)
935 return pos;
936
937 return NULL;
938}
939
940static int hist_entry__parse_objdump_line(struct hist_entry *self, FILE *file,
941 struct list_head *head)
942{
943 struct symbol *sym = self->ms.sym;
944 struct objdump_line *objdump_line;
945 char *line = NULL, *tmp, *tmp2, *c;
946 size_t line_len;
947 s64 line_ip, offset = -1;
948
949 if (getline(&line, &line_len, file) < 0)
950 return -1;
951
952 if (!line)
953 return -1;
954
955 while (line_len != 0 && isspace(line[line_len - 1]))
956 line[--line_len] = '\0';
957
958 c = strchr(line, '\n');
959 if (c)
960 *c = 0;
961
962 line_ip = -1;
963
964 /*
965 * Strip leading spaces:
966 */
967 tmp = line;
968 while (*tmp) {
969 if (*tmp != ' ')
970 break;
971 tmp++;
972 }
973
974 if (*tmp) {
975 /*
976 * Parse hexa addresses followed by ':'
977 */
978 line_ip = strtoull(tmp, &tmp2, 16);
979 if (*tmp2 != ':' || tmp == tmp2 || tmp2[1] == '\0')
980 line_ip = -1;
981 }
982
983 if (line_ip != -1) {
984 u64 start = map__rip_2objdump(self->ms.map, sym->start),
985 end = map__rip_2objdump(self->ms.map, sym->end);
986
987 offset = line_ip - start;
988 if (offset < 0 || (u64)line_ip > end)
989 offset = -1;
990 }
991
992 objdump_line = objdump_line__new(offset, line);
993 if (objdump_line == NULL) {
994 free(line);
995 return -1;
996 }
997 objdump__add_line(head, objdump_line);
998
999 return 0;
1000}
1001
1002int hist_entry__annotate(struct hist_entry *self, struct list_head *head)
1003{
1004 struct symbol *sym = self->ms.sym;
1005 struct map *map = self->ms.map;
1006 struct dso *dso = map->dso;
1007 char *filename = dso__build_id_filename(dso, NULL, 0);
1008 bool free_filename = true;
1009 char command[PATH_MAX * 2];
1010 FILE *file;
1011 int err = 0;
1012 u64 len;
1013
1014 if (filename == NULL) {
1015 if (dso->has_build_id) {
1016 pr_err("Can't annotate %s: not enough memory\n",
1017 sym->name);
1018 return -ENOMEM;
1019 }
1020 goto fallback;
1021 } else if (readlink(filename, command, sizeof(command)) < 0 ||
1022 strstr(command, "[kernel.kallsyms]") ||
1023 access(filename, R_OK)) {
1024 free(filename);
1025fallback:
1026 /*
1027 * If we don't have build-ids or the build-id file isn't in the
1028 * cache, or is just a kallsyms file, well, lets hope that this
1029 * DSO is the same as when 'perf record' ran.
1030 */
1031 filename = dso->long_name;
1032 free_filename = false;
1033 }
1034
1035 if (dso->origin == DSO__ORIG_KERNEL) {
1036 if (dso->annotate_warned)
1037 goto out_free_filename;
1038 err = -ENOENT;
1039 dso->annotate_warned = 1;
1040 pr_err("Can't annotate %s: No vmlinux file was found in the "
1041 "path\n", sym->name);
1042 goto out_free_filename;
1043 }
1044
1045 pr_debug("%s: filename=%s, sym=%s, start=%#Lx, end=%#Lx\n", __func__,
1046 filename, sym->name, map->unmap_ip(map, sym->start),
1047 map->unmap_ip(map, sym->end));
1048
1049 len = sym->end - sym->start;
1050
1051 pr_debug("annotating [%p] %30s : [%p] %30s\n",
1052 dso, dso->long_name, sym, sym->name);
1053
1054 snprintf(command, sizeof(command),
1055 "objdump --start-address=0x%016Lx --stop-address=0x%016Lx -dS %s|grep -v %s|expand",
1056 map__rip_2objdump(map, sym->start),
1057 map__rip_2objdump(map, sym->end),
1058 filename, filename);
1059
1060 pr_debug("Executing: %s\n", command);
1061
1062 file = popen(command, "r");
1063 if (!file)
1064 goto out_free_filename;
1065
1066 while (!feof(file))
1067 if (hist_entry__parse_objdump_line(self, file, head) < 0)
1068 break;
1069
1070 pclose(file);
1071out_free_filename:
1072 if (free_filename)
1073 free(filename);
1074 return err;
1075}
1076
1077void hists__inc_nr_events(struct hists *self, u32 type)
1078{
1079 ++self->stats.nr_events[0];
1080 ++self->stats.nr_events[type];
1081}
1082
1083size_t hists__fprintf_nr_events(struct hists *self, FILE *fp)
1084{
1085 int i;
1086 size_t ret = 0;
1087
1088 for (i = 0; i < PERF_RECORD_HEADER_MAX; ++i) {
1089 if (!event__name[i])
1090 continue;
1091 ret += fprintf(fp, "%10s events: %10d\n",
1092 event__name[i], self->stats.nr_events[i]);
1093 }
1094
1095 return ret;
1096}
diff --git a/tools/perf/util/hist.h b/tools/perf/util/hist.h
index e5f99b24048b..83fa33a7b38b 100644
--- a/tools/perf/util/hist.h
+++ b/tools/perf/util/hist.h
@@ -6,22 +6,124 @@
6 6
7extern struct callchain_param callchain_param; 7extern struct callchain_param callchain_param;
8 8
9struct perf_session;
10struct hist_entry; 9struct hist_entry;
11struct addr_location; 10struct addr_location;
12struct symbol; 11struct symbol;
12struct rb_root;
13 13
14struct hist_entry *__perf_session__add_hist_entry(struct perf_session *self, 14struct objdump_line {
15 struct addr_location *al, 15 struct list_head node;
16 struct symbol *parent, 16 s64 offset;
17 u64 count, bool *hit); 17 char *line;
18};
19
20void objdump_line__free(struct objdump_line *self);
21struct objdump_line *objdump__get_next_ip_line(struct list_head *head,
22 struct objdump_line *pos);
23
24struct sym_hist {
25 u64 sum;
26 u64 ip[0];
27};
28
29struct sym_ext {
30 struct rb_node node;
31 double percent;
32 char *path;
33};
34
35struct sym_priv {
36 struct sym_hist *hist;
37 struct sym_ext *ext;
38};
39
40/*
41 * The kernel collects the number of events it couldn't send in a stretch and
42 * when possible sends this number in a PERF_RECORD_LOST event. The number of
43 * such "chunks" of lost events is stored in .nr_events[PERF_RECORD_LOST] while
44 * total_lost tells exactly how many events the kernel in fact lost, i.e. it is
45 * the sum of all struct lost_event.lost fields reported.
46 *
47 * The total_period is needed because by default auto-freq is used, so
48 * multiplying nr_events[PERF_RECORD_SAMPLE] by a frequency isn't possible to get
49 * the total number of low level events, it is necessary to sum all struct
50 * sample_event.period and stash the result in total_period.
51 */
52struct events_stats {
53 u64 total_period;
54 u64 total_lost;
55 u32 nr_events[PERF_RECORD_HEADER_MAX];
56 u32 nr_unknown_events;
57};
58
59struct hists {
60 struct rb_node rb_node;
61 struct rb_root entries;
62 u64 nr_entries;
63 struct events_stats stats;
64 u64 config;
65 u64 event_stream;
66 u32 type;
67 u32 max_sym_namelen;
68};
69
70struct hist_entry *__hists__add_entry(struct hists *self,
71 struct addr_location *al,
72 struct symbol *parent, u64 period);
18extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *); 73extern int64_t hist_entry__cmp(struct hist_entry *, struct hist_entry *);
19extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *); 74extern int64_t hist_entry__collapse(struct hist_entry *, struct hist_entry *);
75int hist_entry__fprintf(struct hist_entry *self, struct hists *pair_hists,
76 bool show_displacement, long displacement, FILE *fp,
77 u64 total);
78int hist_entry__snprintf(struct hist_entry *self, char *bf, size_t size,
79 struct hists *pair_hists, bool show_displacement,
80 long displacement, bool color, u64 total);
20void hist_entry__free(struct hist_entry *); 81void hist_entry__free(struct hist_entry *);
21 82
22void perf_session__output_resort(struct perf_session *self, u64 total_samples); 83void hists__output_resort(struct hists *self);
23void perf_session__collapse_resort(struct perf_session *self); 84void hists__collapse_resort(struct hists *self);
24size_t perf_session__fprintf_hists(struct perf_session *self, 85
25 struct perf_session *pair, 86void hists__inc_nr_events(struct hists *self, u32 type);
26 bool show_displacement, FILE *fp); 87size_t hists__fprintf_nr_events(struct hists *self, FILE *fp);
88
89size_t hists__fprintf(struct hists *self, struct hists *pair,
90 bool show_displacement, FILE *fp);
91
92int hist_entry__inc_addr_samples(struct hist_entry *self, u64 ip);
93int hist_entry__annotate(struct hist_entry *self, struct list_head *head);
94
95void hists__filter_by_dso(struct hists *self, const struct dso *dso);
96void hists__filter_by_thread(struct hists *self, const struct thread *thread);
97
98#ifdef NO_NEWT_SUPPORT
99static inline int hists__browse(struct hists *self __used,
100 const char *helpline __used,
101 const char *ev_name __used)
102{
103 return 0;
104}
105
106static inline int hists__tui_browse_tree(struct rb_root *self __used,
107 const char *help __used)
108{
109 return 0;
110}
111
112static inline int hist_entry__tui_annotate(struct hist_entry *self __used)
113{
114 return 0;
115}
116#define KEY_LEFT -1
117#define KEY_RIGHT -2
118#else
119#include <newt.h>
120int hists__browse(struct hists *self, const char *helpline,
121 const char *ev_name);
122int hist_entry__tui_annotate(struct hist_entry *self);
123
124#define KEY_LEFT NEWT_KEY_LEFT
125#define KEY_RIGHT NEWT_KEY_RIGHT
126
127int hists__tui_browse_tree(struct rb_root *self, const char *help);
128#endif
27#endif /* __PERF_HIST_H */ 129#endif /* __PERF_HIST_H */
diff --git a/tools/perf/util/hweight.c b/tools/perf/util/hweight.c
new file mode 100644
index 000000000000..5c1d0d099f0d
--- /dev/null
+++ b/tools/perf/util/hweight.c
@@ -0,0 +1,31 @@
1#include <linux/bitops.h>
2
3/**
4 * hweightN - returns the hamming weight of a N-bit word
5 * @x: the word to weigh
6 *
7 * The Hamming Weight of a number is the total number of bits set in it.
8 */
9
/* Count the bits set in @w by summing ever wider bit fields in parallel. */
unsigned int hweight32(unsigned int w)
{
	unsigned int pairs, nibbles, bytes, halves;

	/* every 2-bit field now holds the number of bits set in it */
	pairs = w - ((w >> 1) & 0x55555555);
	/* fold neighbouring 2-bit counts into 4-bit counts */
	nibbles = (pairs & 0x33333333) + ((pairs >> 2) & 0x33333333);
	/* fold neighbouring 4-bit counts into per-byte counts */
	bytes = (nibbles + (nibbles >> 4)) & 0x0F0F0F0F;
	/* add the byte counts together; the total ends up in the low byte */
	halves = bytes + (bytes >> 8);
	return (halves + (halves >> 16)) & 0x000000FF;
}
18
/*
 * Count the bits set in the 64-bit word @w.
 *
 * The computation is done on a 64-bit value with unsigned long long
 * constants, so it does not depend on BITS_PER_LONG: the previous
 * preprocessor selection left the function without a return statement
 * whenever BITS_PER_LONG was neither 32 nor 64 (or not defined at all).
 */
unsigned long hweight64(__u64 w)
{
	__u64 res = w - ((w >> 1) & 0x5555555555555555ull);

	res = (res & 0x3333333333333333ull) + ((res >> 2) & 0x3333333333333333ull);
	res = (res + (res >> 4)) & 0x0F0F0F0F0F0F0F0Full;
	res = res + (res >> 8);
	res = res + (res >> 16);
	return (res + (res >> 32)) & 0x00000000000000FFull;
}
diff --git a/tools/perf/util/include/asm/bitops.h b/tools/perf/util/include/asm/bitops.h
deleted file mode 100644
index 58e9817ffae0..000000000000
--- a/tools/perf/util/include/asm/bitops.h
+++ /dev/null
@@ -1,18 +0,0 @@
1#ifndef _PERF_ASM_BITOPS_H_
2#define _PERF_ASM_BITOPS_H_
3
4#include <sys/types.h>
5#include "../../types.h"
6#include <linux/compiler.h>
7
8/* CHECKME: Not sure both always match */
9#define BITS_PER_LONG __WORDSIZE
10
11#include "../../../../include/asm-generic/bitops/__fls.h"
12#include "../../../../include/asm-generic/bitops/fls.h"
13#include "../../../../include/asm-generic/bitops/fls64.h"
14#include "../../../../include/asm-generic/bitops/__ffs.h"
15#include "../../../../include/asm-generic/bitops/ffz.h"
16#include "../../../../include/asm-generic/bitops/hweight.h"
17
18#endif
diff --git a/tools/perf/util/include/asm/hweight.h b/tools/perf/util/include/asm/hweight.h
new file mode 100644
index 000000000000..36cf26d434a5
--- /dev/null
+++ b/tools/perf/util/include/asm/hweight.h
@@ -0,0 +1,8 @@
1#ifndef PERF_HWEIGHT_H
2#define PERF_HWEIGHT_H
3
4#include <linux/types.h>
5unsigned int hweight32(unsigned int w);
6unsigned long hweight64(__u64 w);
7
8#endif /* PERF_HWEIGHT_H */
diff --git a/tools/perf/util/include/dwarf-regs.h b/tools/perf/util/include/dwarf-regs.h
new file mode 100644
index 000000000000..cf6727e99c44
--- /dev/null
+++ b/tools/perf/util/include/dwarf-regs.h
@@ -0,0 +1,8 @@
1#ifndef _PERF_DWARF_REGS_H_
2#define _PERF_DWARF_REGS_H_
3
4#ifdef DWARF_SUPPORT
5const char *get_arch_regstr(unsigned int n);
6#endif
7
8#endif
diff --git a/tools/perf/util/include/linux/bitmap.h b/tools/perf/util/include/linux/bitmap.h
index 94507639a8c4..eda4416efa0a 100644
--- a/tools/perf/util/include/linux/bitmap.h
+++ b/tools/perf/util/include/linux/bitmap.h
@@ -1,3 +1,35 @@
1#include "../../../../include/linux/bitmap.h" 1#ifndef _PERF_BITOPS_H
2#include "../../../../include/asm-generic/bitops/find.h" 2#define _PERF_BITOPS_H
3#include <linux/errno.h> 3
4#include <string.h>
5#include <linux/bitops.h>
6
7int __bitmap_weight(const unsigned long *bitmap, int bits);
8
9#define BITMAP_LAST_WORD_MASK(nbits) \
10( \
11 ((nbits) % BITS_PER_LONG) ? \
12 (1UL<<((nbits) % BITS_PER_LONG))-1 : ~0UL \
13)
14
15#define small_const_nbits(nbits) \
16 (__builtin_constant_p(nbits) && (nbits) <= BITS_PER_LONG)
17
/*
 * Clear the first @nbits bits of @dst. The storage is cleared in whole
 * unsigned long words.
 */
static inline void bitmap_zero(unsigned long *dst, int nbits)
{
	if (!small_const_nbits(nbits)) {
		int len = BITS_TO_LONGS(nbits) * sizeof(unsigned long);

		memset(dst, 0, len);
		return;
	}

	/* compile-time constant that fits in one word: a plain store */
	*dst = 0UL;
}
27
/* Return the number of bits set among the first @nbits bits of @src. */
static inline int bitmap_weight(const unsigned long *src, int nbits)
{
	if (!small_const_nbits(nbits))
		return __bitmap_weight(src, nbits);

	/* single word: mask off the bits beyond nbits and count the rest */
	return hweight_long(*src & BITMAP_LAST_WORD_MASK(nbits));
}
34
35#endif /* _PERF_BITOPS_H */
diff --git a/tools/perf/util/include/linux/bitops.h b/tools/perf/util/include/linux/bitops.h
index 8d63116e9435..bb4ac2e05385 100644
--- a/tools/perf/util/include/linux/bitops.h
+++ b/tools/perf/util/include/linux/bitops.h
@@ -1,13 +1,12 @@
1#ifndef _PERF_LINUX_BITOPS_H_ 1#ifndef _PERF_LINUX_BITOPS_H_
2#define _PERF_LINUX_BITOPS_H_ 2#define _PERF_LINUX_BITOPS_H_
3 3
4#define __KERNEL__ 4#include <linux/kernel.h>
5#include <asm/hweight.h>
5 6
6#define CONFIG_GENERIC_FIND_NEXT_BIT 7#define BITS_PER_LONG __WORDSIZE
7#define CONFIG_GENERIC_FIND_FIRST_BIT 8#define BITS_PER_BYTE 8
8#include "../../../../include/linux/bitops.h" 9#define BITS_TO_LONGS(nr) DIV_ROUND_UP(nr, BITS_PER_BYTE * sizeof(long))
9
10#undef __KERNEL__
11 10
12static inline void set_bit(int nr, unsigned long *addr) 11static inline void set_bit(int nr, unsigned long *addr)
13{ 12{
@@ -20,10 +19,9 @@ static __always_inline int test_bit(unsigned int nr, const unsigned long *addr)
20 (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0; 19 (((unsigned long *)addr)[nr / BITS_PER_LONG])) != 0;
21} 20}
22 21
23unsigned long generic_find_next_zero_le_bit(const unsigned long *addr, unsigned 22static inline unsigned long hweight_long(unsigned long w)
24 long size, unsigned long offset); 23{
25 24 return sizeof(w) == 4 ? hweight32(w) : hweight64(w);
26unsigned long generic_find_next_le_bit(const unsigned long *addr, unsigned 25}
27 long size, unsigned long offset);
28 26
29#endif 27#endif
diff --git a/tools/perf/util/include/linux/compiler.h b/tools/perf/util/include/linux/compiler.h
index dfb0713ed47f..791f9dd27ebf 100644
--- a/tools/perf/util/include/linux/compiler.h
+++ b/tools/perf/util/include/linux/compiler.h
@@ -7,4 +7,6 @@
7#define __user 7#define __user
8#define __attribute_const__ 8#define __attribute_const__
9 9
10#define __used __attribute__((__unused__))
11
10#endif 12#endif
diff --git a/tools/perf/util/include/linux/hash.h b/tools/perf/util/include/linux/hash.h
new file mode 100644
index 000000000000..201f57397997
--- /dev/null
+++ b/tools/perf/util/include/linux/hash.h
@@ -0,0 +1,5 @@
1#include "../../../../include/linux/hash.h"
2
3#ifndef PERF_HASH_H
4#define PERF_HASH_H
5#endif
diff --git a/tools/perf/util/include/linux/kernel.h b/tools/perf/util/include/linux/kernel.h
index 21c0274c02fa..1eb804fd3fbf 100644
--- a/tools/perf/util/include/linux/kernel.h
+++ b/tools/perf/util/include/linux/kernel.h
@@ -28,6 +28,8 @@
28 (type *)((char *)__mptr - offsetof(type, member)); }) 28 (type *)((char *)__mptr - offsetof(type, member)); })
29#endif 29#endif
30 30
31#define BUILD_BUG_ON_ZERO(e) (sizeof(struct { int:-!!(e); }))
32
31#ifndef max 33#ifndef max
32#define max(x, y) ({ \ 34#define max(x, y) ({ \
33 typeof(x) _max1 = (x); \ 35 typeof(x) _max1 = (x); \
@@ -85,21 +87,25 @@ simple_strtoul(const char *nptr, char **endptr, int base)
85 return strtoul(nptr, endptr, base); 87 return strtoul(nptr, endptr, base);
86} 88}
87 89
90int eprintf(int level,
91 const char *fmt, ...) __attribute__((format(printf, 2, 3)));
92
88#ifndef pr_fmt 93#ifndef pr_fmt
89#define pr_fmt(fmt) fmt 94#define pr_fmt(fmt) fmt
90#endif 95#endif
91 96
92#define pr_err(fmt, ...) \ 97#define pr_err(fmt, ...) \
93 do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) 98 eprintf(0, pr_fmt(fmt), ##__VA_ARGS__)
94#define pr_warning(fmt, ...) \ 99#define pr_warning(fmt, ...) \
95 do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) 100 eprintf(0, pr_fmt(fmt), ##__VA_ARGS__)
96#define pr_info(fmt, ...) \ 101#define pr_info(fmt, ...) \
97 do { fprintf(stderr, pr_fmt(fmt), ##__VA_ARGS__); } while (0) 102 eprintf(0, pr_fmt(fmt), ##__VA_ARGS__)
98#define pr_debug(fmt, ...) \ 103#define pr_debug(fmt, ...) \
99 eprintf(1, pr_fmt(fmt), ##__VA_ARGS__) 104 eprintf(1, pr_fmt(fmt), ##__VA_ARGS__)
100#define pr_debugN(n, fmt, ...) \ 105#define pr_debugN(n, fmt, ...) \
101 eprintf(n, pr_fmt(fmt), ##__VA_ARGS__) 106 eprintf(n, pr_fmt(fmt), ##__VA_ARGS__)
102#define pr_debug2(fmt, ...) pr_debugN(2, pr_fmt(fmt), ##__VA_ARGS__) 107#define pr_debug2(fmt, ...) pr_debugN(2, pr_fmt(fmt), ##__VA_ARGS__)
103#define pr_debug3(fmt, ...) pr_debugN(3, pr_fmt(fmt), ##__VA_ARGS__) 108#define pr_debug3(fmt, ...) pr_debugN(3, pr_fmt(fmt), ##__VA_ARGS__)
109#define pr_debug4(fmt, ...) pr_debugN(4, pr_fmt(fmt), ##__VA_ARGS__)
104 110
105#endif 111#endif
diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c
index c4d55a0da2ea..e672f2fef65b 100644
--- a/tools/perf/util/map.c
+++ b/tools/perf/util/map.c
@@ -1,9 +1,16 @@
1#include "event.h"
2#include "symbol.h" 1#include "symbol.h"
2#include <errno.h>
3#include <limits.h>
3#include <stdlib.h> 4#include <stdlib.h>
4#include <string.h> 5#include <string.h>
5#include <stdio.h> 6#include <stdio.h>
6#include "debug.h" 7#include <unistd.h>
8#include "map.h"
9
10const char *map_type__name[MAP__NR_TYPES] = {
11 [MAP__FUNCTION] = "Functions",
12 [MAP__VARIABLE] = "Variables",
13};
7 14
8static inline int is_anon_memory(const char *filename) 15static inline int is_anon_memory(const char *filename)
9{ 16{
@@ -31,15 +38,16 @@ void map__init(struct map *self, enum map_type type,
31 self->map_ip = map__map_ip; 38 self->map_ip = map__map_ip;
32 self->unmap_ip = map__unmap_ip; 39 self->unmap_ip = map__unmap_ip;
33 RB_CLEAR_NODE(&self->rb_node); 40 RB_CLEAR_NODE(&self->rb_node);
41 self->groups = NULL;
34} 42}
35 43
36struct map *map__new(struct mmap_event *event, enum map_type type, 44struct map *map__new(struct list_head *dsos__list, u64 start, u64 len,
37 char *cwd, int cwdlen) 45 u64 pgoff, u32 pid, char *filename,
46 enum map_type type, char *cwd, int cwdlen)
38{ 47{
39 struct map *self = malloc(sizeof(*self)); 48 struct map *self = malloc(sizeof(*self));
40 49
41 if (self != NULL) { 50 if (self != NULL) {
42 const char *filename = event->filename;
43 char newfilename[PATH_MAX]; 51 char newfilename[PATH_MAX];
44 struct dso *dso; 52 struct dso *dso;
45 int anon; 53 int anon;
@@ -57,19 +65,23 @@ struct map *map__new(struct mmap_event *event, enum map_type type,
57 anon = is_anon_memory(filename); 65 anon = is_anon_memory(filename);
58 66
59 if (anon) { 67 if (anon) {
60 snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", event->pid); 68 snprintf(newfilename, sizeof(newfilename), "/tmp/perf-%d.map", pid);
61 filename = newfilename; 69 filename = newfilename;
62 } 70 }
63 71
64 dso = dsos__findnew(filename); 72 dso = __dsos__findnew(dsos__list, filename);
65 if (dso == NULL) 73 if (dso == NULL)
66 goto out_delete; 74 goto out_delete;
67 75
68 map__init(self, type, event->start, event->start + event->len, 76 map__init(self, type, start, start + len, pgoff, dso);
69 event->pgoff, dso);
70 77
71 if (self->dso == vdso || anon) 78 if (anon) {
79set_identity:
72 self->map_ip = self->unmap_ip = identity__map_ip; 80 self->map_ip = self->unmap_ip = identity__map_ip;
81 } else if (strcmp(filename, "[vdso]") == 0) {
82 dso__set_loaded(dso, self->type);
83 goto set_identity;
84 }
73 } 85 }
74 return self; 86 return self;
75out_delete: 87out_delete:
@@ -104,8 +116,7 @@ void map__fixup_end(struct map *self)
104 116
105#define DSO__DELETED "(deleted)" 117#define DSO__DELETED "(deleted)"
106 118
107int map__load(struct map *self, struct perf_session *session, 119int map__load(struct map *self, symbol_filter_t filter)
108 symbol_filter_t filter)
109{ 120{
110 const char *name = self->dso->long_name; 121 const char *name = self->dso->long_name;
111 int nr; 122 int nr;
@@ -113,7 +124,7 @@ int map__load(struct map *self, struct perf_session *session,
113 if (dso__loaded(self->dso, self->type)) 124 if (dso__loaded(self->dso, self->type))
114 return 0; 125 return 0;
115 126
116 nr = dso__load(self->dso, self, session, filter); 127 nr = dso__load(self->dso, self, filter);
117 if (nr < 0) { 128 if (nr < 0) {
118 if (self->dso->has_build_id) { 129 if (self->dso->has_build_id) {
119 char sbuild_id[BUILD_ID_SIZE * 2 + 1]; 130 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
@@ -144,24 +155,29 @@ int map__load(struct map *self, struct perf_session *session,
144 155
145 return -1; 156 return -1;
146 } 157 }
158 /*
159 * Only applies to the kernel, as its symtabs aren't relative like the
160 * module ones.
161 */
162 if (self->dso->kernel)
163 map__reloc_vmlinux(self);
147 164
148 return 0; 165 return 0;
149} 166}
150 167
151struct symbol *map__find_symbol(struct map *self, struct perf_session *session, 168struct symbol *map__find_symbol(struct map *self, u64 addr,
152 u64 addr, symbol_filter_t filter) 169 symbol_filter_t filter)
153{ 170{
154 if (map__load(self, session, filter) < 0) 171 if (map__load(self, filter) < 0)
155 return NULL; 172 return NULL;
156 173
157 return dso__find_symbol(self->dso, self->type, addr); 174 return dso__find_symbol(self->dso, self->type, addr);
158} 175}
159 176
160struct symbol *map__find_symbol_by_name(struct map *self, const char *name, 177struct symbol *map__find_symbol_by_name(struct map *self, const char *name,
161 struct perf_session *session,
162 symbol_filter_t filter) 178 symbol_filter_t filter)
163{ 179{
164 if (map__load(self, session, filter) < 0) 180 if (map__load(self, filter) < 0)
165 return NULL; 181 return NULL;
166 182
167 if (!dso__sorted_by_name(self->dso, self->type)) 183 if (!dso__sorted_by_name(self->dso, self->type))
@@ -201,3 +217,412 @@ size_t map__fprintf(struct map *self, FILE *fp)
201 return fprintf(fp, " %Lx-%Lx %Lx %s\n", 217 return fprintf(fp, " %Lx-%Lx %Lx %s\n",
202 self->start, self->end, self->pgoff, self->dso->name); 218 self->start, self->end, self->pgoff, self->dso->name);
203} 219}
220
221/*
222 * objdump wants/reports absolute IPs for ET_EXEC, and RIPs for ET_DYN.
223 * map->dso->adjust_symbols==1 for ET_EXEC-like cases.
224 */
225u64 map__rip_2objdump(struct map *map, u64 rip)
226{
227 u64 addr = map->dso->adjust_symbols ?
228 map->unmap_ip(map, rip) : /* RIP -> IP */
229 rip;
230 return addr;
231}
232
233u64 map__objdump_2ip(struct map *map, u64 addr)
234{
235 u64 ip = map->dso->adjust_symbols ?
236 addr :
237 map->unmap_ip(map, addr); /* RIP -> IP */
238 return ip;
239}
240
241void map_groups__init(struct map_groups *self)
242{
243 int i;
244 for (i = 0; i < MAP__NR_TYPES; ++i) {
245 self->maps[i] = RB_ROOT;
246 INIT_LIST_HEAD(&self->removed_maps[i]);
247 }
248 self->machine = NULL;
249}
250
251void map_groups__flush(struct map_groups *self)
252{
253 int type;
254
255 for (type = 0; type < MAP__NR_TYPES; type++) {
256 struct rb_root *root = &self->maps[type];
257 struct rb_node *next = rb_first(root);
258
259 while (next) {
260 struct map *pos = rb_entry(next, struct map, rb_node);
261 next = rb_next(&pos->rb_node);
262 rb_erase(&pos->rb_node, root);
263 /*
264 * We may have references to this map, for
265 * instance in some hist_entry instances, so
266 * just move them to a separate list.
267 */
268 list_add_tail(&pos->node, &self->removed_maps[pos->type]);
269 }
270 }
271}
272
273struct symbol *map_groups__find_symbol(struct map_groups *self,
274 enum map_type type, u64 addr,
275 struct map **mapp,
276 symbol_filter_t filter)
277{
278 struct map *map = map_groups__find(self, type, addr);
279
280 if (map != NULL) {
281 if (mapp != NULL)
282 *mapp = map;
283 return map__find_symbol(map, map->map_ip(map, addr), filter);
284 }
285
286 return NULL;
287}
288
289struct symbol *map_groups__find_symbol_by_name(struct map_groups *self,
290 enum map_type type,
291 const char *name,
292 struct map **mapp,
293 symbol_filter_t filter)
294{
295 struct rb_node *nd;
296
297 for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) {
298 struct map *pos = rb_entry(nd, struct map, rb_node);
299 struct symbol *sym = map__find_symbol_by_name(pos, name, filter);
300
301 if (sym == NULL)
302 continue;
303 if (mapp != NULL)
304 *mapp = pos;
305 return sym;
306 }
307
308 return NULL;
309}
310
311size_t __map_groups__fprintf_maps(struct map_groups *self,
312 enum map_type type, int verbose, FILE *fp)
313{
314 size_t printed = fprintf(fp, "%s:\n", map_type__name[type]);
315 struct rb_node *nd;
316
317 for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) {
318 struct map *pos = rb_entry(nd, struct map, rb_node);
319 printed += fprintf(fp, "Map:");
320 printed += map__fprintf(pos, fp);
321 if (verbose > 2) {
322 printed += dso__fprintf(pos->dso, type, fp);
323 printed += fprintf(fp, "--\n");
324 }
325 }
326
327 return printed;
328}
329
330size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp)
331{
332 size_t printed = 0, i;
333 for (i = 0; i < MAP__NR_TYPES; ++i)
334 printed += __map_groups__fprintf_maps(self, i, verbose, fp);
335 return printed;
336}
337
338static size_t __map_groups__fprintf_removed_maps(struct map_groups *self,
339 enum map_type type,
340 int verbose, FILE *fp)
341{
342 struct map *pos;
343 size_t printed = 0;
344
345 list_for_each_entry(pos, &self->removed_maps[type], node) {
346 printed += fprintf(fp, "Map:");
347 printed += map__fprintf(pos, fp);
348 if (verbose > 1) {
349 printed += dso__fprintf(pos->dso, type, fp);
350 printed += fprintf(fp, "--\n");
351 }
352 }
353 return printed;
354}
355
356static size_t map_groups__fprintf_removed_maps(struct map_groups *self,
357 int verbose, FILE *fp)
358{
359 size_t printed = 0, i;
360 for (i = 0; i < MAP__NR_TYPES; ++i)
361 printed += __map_groups__fprintf_removed_maps(self, i, verbose, fp);
362 return printed;
363}
364
/*
 * Print the live maps, a "Removed maps:" heading, then the removed maps.
 * Returns the accumulated result of all print calls.
 */
size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp)
{
	size_t total;

	total  = map_groups__fprintf_maps(self, verbose, fp);
	total += fprintf(fp, "Removed maps:\n");
	total += map_groups__fprintf_removed_maps(self, verbose, fp);

	return total;
}
371
372int map_groups__fixup_overlappings(struct map_groups *self, struct map *map,
373 int verbose, FILE *fp)
374{
375 struct rb_root *root = &self->maps[map->type];
376 struct rb_node *next = rb_first(root);
377
378 while (next) {
379 struct map *pos = rb_entry(next, struct map, rb_node);
380 next = rb_next(&pos->rb_node);
381
382 if (!map__overlap(pos, map))
383 continue;
384
385 if (verbose >= 2) {
386 fputs("overlapping maps:\n", fp);
387 map__fprintf(map, fp);
388 map__fprintf(pos, fp);
389 }
390
391 rb_erase(&pos->rb_node, root);
392 /*
393 * We may have references to this map, for instance in some
394 * hist_entry instances, so just move them to a separate
395 * list.
396 */
397 list_add_tail(&pos->node, &self->removed_maps[map->type]);
398 /*
399 * Now check if we need to create new maps for areas not
400 * overlapped by the new map:
401 */
402 if (map->start > pos->start) {
403 struct map *before = map__clone(pos);
404
405 if (before == NULL)
406 return -ENOMEM;
407
408 before->end = map->start - 1;
409 map_groups__insert(self, before);
410 if (verbose >= 2)
411 map__fprintf(before, fp);
412 }
413
414 if (map->end < pos->end) {
415 struct map *after = map__clone(pos);
416
417 if (after == NULL)
418 return -ENOMEM;
419
420 after->start = map->end + 1;
421 map_groups__insert(self, after);
422 if (verbose >= 2)
423 map__fprintf(after, fp);
424 }
425 }
426
427 return 0;
428}
429
430/*
431 * XXX This should not really _copy_ the maps, but refcount them.
432 */
433int map_groups__clone(struct map_groups *self,
434 struct map_groups *parent, enum map_type type)
435{
436 struct rb_node *nd;
437 for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) {
438 struct map *map = rb_entry(nd, struct map, rb_node);
439 struct map *new = map__clone(map);
440 if (new == NULL)
441 return -ENOMEM;
442 map_groups__insert(self, new);
443 }
444 return 0;
445}
446
447static u64 map__reloc_map_ip(struct map *map, u64 ip)
448{
449 return ip + (s64)map->pgoff;
450}
451
452static u64 map__reloc_unmap_ip(struct map *map, u64 ip)
453{
454 return ip - (s64)map->pgoff;
455}
456
457void map__reloc_vmlinux(struct map *self)
458{
459 struct kmap *kmap = map__kmap(self);
460 s64 reloc;
461
462 if (!kmap->ref_reloc_sym || !kmap->ref_reloc_sym->unrelocated_addr)
463 return;
464
465 reloc = (kmap->ref_reloc_sym->unrelocated_addr -
466 kmap->ref_reloc_sym->addr);
467
468 if (!reloc)
469 return;
470
471 self->map_ip = map__reloc_map_ip;
472 self->unmap_ip = map__reloc_unmap_ip;
473 self->pgoff = reloc;
474}
475
476void maps__insert(struct rb_root *maps, struct map *map)
477{
478 struct rb_node **p = &maps->rb_node;
479 struct rb_node *parent = NULL;
480 const u64 ip = map->start;
481 struct map *m;
482
483 while (*p != NULL) {
484 parent = *p;
485 m = rb_entry(parent, struct map, rb_node);
486 if (ip < m->start)
487 p = &(*p)->rb_left;
488 else
489 p = &(*p)->rb_right;
490 }
491
492 rb_link_node(&map->rb_node, parent, p);
493 rb_insert_color(&map->rb_node, maps);
494}
495
496struct map *maps__find(struct rb_root *maps, u64 ip)
497{
498 struct rb_node **p = &maps->rb_node;
499 struct rb_node *parent = NULL;
500 struct map *m;
501
502 while (*p != NULL) {
503 parent = *p;
504 m = rb_entry(parent, struct map, rb_node);
505 if (ip < m->start)
506 p = &(*p)->rb_left;
507 else if (ip > m->end)
508 p = &(*p)->rb_right;
509 else
510 return m;
511 }
512
513 return NULL;
514}
515
516int machine__init(struct machine *self, const char *root_dir, pid_t pid)
517{
518 map_groups__init(&self->kmaps);
519 RB_CLEAR_NODE(&self->rb_node);
520 INIT_LIST_HEAD(&self->user_dsos);
521 INIT_LIST_HEAD(&self->kernel_dsos);
522
523 self->kmaps.machine = self;
524 self->pid = pid;
525 self->root_dir = strdup(root_dir);
526 return self->root_dir == NULL ? -ENOMEM : 0;
527}
528
529struct machine *machines__add(struct rb_root *self, pid_t pid,
530 const char *root_dir)
531{
532 struct rb_node **p = &self->rb_node;
533 struct rb_node *parent = NULL;
534 struct machine *pos, *machine = malloc(sizeof(*machine));
535
536 if (!machine)
537 return NULL;
538
539 if (machine__init(machine, root_dir, pid) != 0) {
540 free(machine);
541 return NULL;
542 }
543
544 while (*p != NULL) {
545 parent = *p;
546 pos = rb_entry(parent, struct machine, rb_node);
547 if (pid < pos->pid)
548 p = &(*p)->rb_left;
549 else
550 p = &(*p)->rb_right;
551 }
552
553 rb_link_node(&machine->rb_node, parent, p);
554 rb_insert_color(&machine->rb_node, self);
555
556 return machine;
557}
558
559struct machine *machines__find(struct rb_root *self, pid_t pid)
560{
561 struct rb_node **p = &self->rb_node;
562 struct rb_node *parent = NULL;
563 struct machine *machine;
564 struct machine *default_machine = NULL;
565
566 while (*p != NULL) {
567 parent = *p;
568 machine = rb_entry(parent, struct machine, rb_node);
569 if (pid < machine->pid)
570 p = &(*p)->rb_left;
571 else if (pid > machine->pid)
572 p = &(*p)->rb_right;
573 else
574 return machine;
575 if (!machine->pid)
576 default_machine = machine;
577 }
578
579 return default_machine;
580}
581
582struct machine *machines__findnew(struct rb_root *self, pid_t pid)
583{
584 char path[PATH_MAX];
585 const char *root_dir;
586 struct machine *machine = machines__find(self, pid);
587
588 if (!machine || machine->pid != pid) {
589 if (pid == HOST_KERNEL_ID || pid == DEFAULT_GUEST_KERNEL_ID)
590 root_dir = "";
591 else {
592 if (!symbol_conf.guestmount)
593 goto out;
594 sprintf(path, "%s/%d", symbol_conf.guestmount, pid);
595 if (access(path, R_OK)) {
596 pr_err("Can't access file %s\n", path);
597 goto out;
598 }
599 root_dir = path;
600 }
601 machine = machines__add(self, pid, root_dir);
602 }
603
604out:
605 return machine;
606}
607
608void machines__process(struct rb_root *self, machine__process_t process, void *data)
609{
610 struct rb_node *nd;
611
612 for (nd = rb_first(self); nd; nd = rb_next(nd)) {
613 struct machine *pos = rb_entry(nd, struct machine, rb_node);
614 process(pos, data);
615 }
616}
617
618char *machine__mmap_name(struct machine *self, char *bf, size_t size)
619{
620 if (machine__is_host(self))
621 snprintf(bf, size, "[%s]", "kernel.kallsyms");
622 else if (machine__is_default_guest(self))
623 snprintf(bf, size, "[%s]", "guest.kernel.kallsyms");
624 else
625 snprintf(bf, size, "[%s.%d]", "guest.kernel.kallsyms", self->pid);
626
627 return bf;
628}
diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h
new file mode 100644
index 000000000000..f39134512829
--- /dev/null
+++ b/tools/perf/util/map.h
@@ -0,0 +1,217 @@
1#ifndef __PERF_MAP_H
2#define __PERF_MAP_H
3
4#include <linux/compiler.h>
5#include <linux/list.h>
6#include <linux/rbtree.h>
7#include <stdio.h>
8#include <stdbool.h>
9#include "types.h"
10
11enum map_type {
12 MAP__FUNCTION = 0,
13 MAP__VARIABLE,
14};
15
16#define MAP__NR_TYPES (MAP__VARIABLE + 1)
17
18extern const char *map_type__name[MAP__NR_TYPES];
19
20struct dso;
21struct ref_reloc_sym;
22struct map_groups;
23struct machine;
24
/* One address range backed by a dso, with callbacks translating addresses in and out of it. */
25struct map {
26 union {
27 struct rb_node rb_node; /* linkage while the map sits in a map_groups tree */
28 struct list_head node; /* linkage once moved to a removed_maps list */
29 };
30 u64 start; /* sort key used by maps__insert() */
31 u64 end; /* maps__find() treats addresses up to and including end as inside the map */
32 enum map_type type; /* selects the per-type tree/list in struct map_groups */
33 u32 priv;
34 u64 pgoff; /* offset applied by map__map_ip(); map__reloc_vmlinux() stores a relocation delta here */
35
36 /* ip -> dso rip */
37 u64 (*map_ip)(struct map *, u64);
38 /* dso rip -> ip */
39 u64 (*unmap_ip)(struct map *, u64);
40
41 struct dso *dso;
42 struct map_groups *groups; /* set by map_groups__insert() */
43};
44
45struct kmap {
46 struct ref_reloc_sym *ref_reloc_sym;
47 struct map_groups *kmaps;
48};
49
/* Per-type collections of maps. */
50struct map_groups {
51 struct rb_root maps[MAP__NR_TYPES]; /* live maps, one tree per map type */
52 struct list_head removed_maps[MAP__NR_TYPES]; /* maps taken out of the trees but not freed */
53 struct machine *machine; /* cleared by map_groups__init(); machine__init() points its kmaps back at the machine */
54};
55
56/* Native host kernel uses -1 as pid index in machine */
57#define HOST_KERNEL_ID (-1)
58#define DEFAULT_GUEST_KERNEL_ID (0)
59
/* State kept per machine (host or guest), stored in an rb-tree keyed by pid. */
60struct machine {
61 struct rb_node rb_node; /* linkage in the machines tree */
62 pid_t pid; /* tree key; HOST_KERNEL_ID and DEFAULT_GUEST_KERNEL_ID are the special values */
63 char *root_dir; /* private copy made by machine__init() */
64 struct list_head user_dsos;
65 struct list_head kernel_dsos;
66 struct map_groups kmaps; /* searched by machine__find_kernel_symbol() */
67 struct map *vmlinux_maps[MAP__NR_TYPES]; /* per-type map returned by machine__kernel_map() */
68};
69
/* Return the entry of @self->vmlinux_maps[] for the given map @type. */
70static inline
71struct map *machine__kernel_map(struct machine *self, enum map_type type)
72{
73 return self->vmlinux_maps[type];
74}
75
76static inline struct kmap *map__kmap(struct map *self)
77{
78 return (struct kmap *)(self + 1);
79}
80
81static inline u64 map__map_ip(struct map *map, u64 ip)
82{
83 return ip - map->start + map->pgoff;
84}
85
86static inline u64 map__unmap_ip(struct map *map, u64 ip)
87{
88 return ip + map->start - map->pgoff;
89}
90
/* map_ip/unmap_ip callback that leaves the address unchanged; the map argument is ignored. */
91static inline u64 identity__map_ip(struct map *map __used, u64 ip)
92{
93 return ip;
94}
95
96
97/* rip/ip <-> addr suitable for passing to `objdump --start-address=` */
98u64 map__rip_2objdump(struct map *map, u64 rip);
99u64 map__objdump_2ip(struct map *map, u64 addr);
100
101struct symbol;
102
103typedef int (*symbol_filter_t)(struct map *map, struct symbol *sym);
104
105void map__init(struct map *self, enum map_type type,
106 u64 start, u64 end, u64 pgoff, struct dso *dso);
107struct map *map__new(struct list_head *dsos__list, u64 start, u64 len,
108 u64 pgoff, u32 pid, char *filename,
109 enum map_type type, char *cwd, int cwdlen);
110void map__delete(struct map *self);
111struct map *map__clone(struct map *self);
112int map__overlap(struct map *l, struct map *r);
113size_t map__fprintf(struct map *self, FILE *fp);
114
115int map__load(struct map *self, symbol_filter_t filter);
116struct symbol *map__find_symbol(struct map *self,
117 u64 addr, symbol_filter_t filter);
118struct symbol *map__find_symbol_by_name(struct map *self, const char *name,
119 symbol_filter_t filter);
120void map__fixup_start(struct map *self);
121void map__fixup_end(struct map *self);
122
123void map__reloc_vmlinux(struct map *self);
124
125size_t __map_groups__fprintf_maps(struct map_groups *self,
126 enum map_type type, int verbose, FILE *fp);
127void maps__insert(struct rb_root *maps, struct map *map);
128struct map *maps__find(struct rb_root *maps, u64 addr);
129void map_groups__init(struct map_groups *self);
130int map_groups__clone(struct map_groups *self,
131 struct map_groups *parent, enum map_type type);
132size_t map_groups__fprintf(struct map_groups *self, int verbose, FILE *fp);
133size_t map_groups__fprintf_maps(struct map_groups *self, int verbose, FILE *fp);
134
135typedef void (*machine__process_t)(struct machine *self, void *data);
136
137void machines__process(struct rb_root *self, machine__process_t process, void *data);
138struct machine *machines__add(struct rb_root *self, pid_t pid,
139 const char *root_dir);
140struct machine *machines__find_host(struct rb_root *self);
141struct machine *machines__find(struct rb_root *self, pid_t pid);
142struct machine *machines__findnew(struct rb_root *self, pid_t pid);
143char *machine__mmap_name(struct machine *self, char *bf, size_t size);
144int machine__init(struct machine *self, const char *root_dir, pid_t pid);
145
146/*
147 * Default guest kernel is defined by parameter --guestkallsyms
148 * and --guestmodules
149 */
150static inline bool machine__is_default_guest(struct machine *self)
151{
152 return self ? self->pid == DEFAULT_GUEST_KERNEL_ID : false;
153}
154
155static inline bool machine__is_host(struct machine *self)
156{
157 return self ? self->pid == HOST_KERNEL_ID : false;
158}
159
160static inline void map_groups__insert(struct map_groups *self, struct map *map)
161{
162 maps__insert(&self->maps[map->type], map);
163 map->groups = self;
164}
165
166static inline struct map *map_groups__find(struct map_groups *self,
167 enum map_type type, u64 addr)
168{
169 return maps__find(&self->maps[type], addr);
170}
171
172struct symbol *map_groups__find_symbol(struct map_groups *self,
173 enum map_type type, u64 addr,
174 struct map **mapp,
175 symbol_filter_t filter);
176
177struct symbol *map_groups__find_symbol_by_name(struct map_groups *self,
178 enum map_type type,
179 const char *name,
180 struct map **mapp,
181 symbol_filter_t filter);
182
183static inline
184struct symbol *machine__find_kernel_symbol(struct machine *self,
185 enum map_type type, u64 addr,
186 struct map **mapp,
187 symbol_filter_t filter)
188{
189 return map_groups__find_symbol(&self->kmaps, type, addr, mapp, filter);
190}
191
/* Same as machine__find_kernel_symbol() with the map type fixed to MAP__FUNCTION. */
192static inline
193struct symbol *machine__find_kernel_function(struct machine *self, u64 addr,
194 struct map **mapp,
195 symbol_filter_t filter)
196{
197 return machine__find_kernel_symbol(self, MAP__FUNCTION, addr, mapp, filter);
198}
199
/* Same as map_groups__find_symbol_by_name() with the map type fixed to MAP__FUNCTION. */
200static inline
201struct symbol *map_groups__find_function_by_name(struct map_groups *self,
202 const char *name, struct map **mapp,
203 symbol_filter_t filter)
204{
205 return map_groups__find_symbol_by_name(self, MAP__FUNCTION, name, mapp, filter);
206}
207
208int map_groups__fixup_overlappings(struct map_groups *self, struct map *map,
209 int verbose, FILE *fp);
210
211struct map *map_groups__find_by_name(struct map_groups *self,
212 enum map_type type, const char *name);
213struct map *machine__new_module(struct machine *self, u64 start, const char *filename);
214
215void map_groups__flush(struct map_groups *self);
216
217#endif /* __PERF_MAP_H */
diff --git a/tools/perf/util/newt.c b/tools/perf/util/newt.c
new file mode 100644
index 000000000000..7537ca15900b
--- /dev/null
+++ b/tools/perf/util/newt.c
@@ -0,0 +1,1178 @@
1#define _GNU_SOURCE
2#include <stdio.h>
3#undef _GNU_SOURCE
4/*
5 * slang versions <= 2.0.6 have a "#if HAVE_LONG_LONG" that breaks
6 * the build if it isn't defined. Use the equivalent one that glibc
7 * has on features.h.
8 */
9#include <features.h>
10#ifndef HAVE_LONG_LONG
11#define HAVE_LONG_LONG __GLIBC_HAVE_LONG_LONG
12#endif
13#include <slang.h>
14#include <stdlib.h>
15#include <newt.h>
16#include <sys/ttydefaults.h>
17
18#include "cache.h"
19#include "hist.h"
20#include "pstack.h"
21#include "session.h"
22#include "sort.h"
23#include "symbol.h"
24
25#if SLANG_VERSION < 20104
26#define slsmg_printf(msg, args...) SLsmg_printf((char *)msg, ##args)
27#define slsmg_write_nstring(msg, len) SLsmg_write_nstring((char *)msg, len)
28#define sltt_set_color(obj, name, fg, bg) SLtt_set_color(obj,(char *)name,\
29 (char *)fg, (char *)bg)
30#else
31#define slsmg_printf SLsmg_printf
32#define slsmg_write_nstring SLsmg_write_nstring
33#define sltt_set_color SLtt_set_color
34#endif
35
36struct ui_progress {
37 newtComponent form, scale;
38};
39
40struct ui_progress *ui_progress__new(const char *title, u64 total)
41{
42 struct ui_progress *self = malloc(sizeof(*self));
43
44 if (self != NULL) {
45 int cols;
46
47 if (use_browser <= 0)
48 return self;
49 newtGetScreenSize(&cols, NULL);
50 cols -= 4;
51 newtCenteredWindow(cols, 1, title);
52 self->form = newtForm(NULL, NULL, 0);
53 if (self->form == NULL)
54 goto out_free_self;
55 self->scale = newtScale(0, 0, cols, total);
56 if (self->scale == NULL)
57 goto out_free_form;
58 newtFormAddComponent(self->form, self->scale);
59 newtRefresh();
60 }
61
62 return self;
63
64out_free_form:
65 newtFormDestroy(self->form);
66out_free_self:
67 free(self);
68 return NULL;
69}
70
71void ui_progress__update(struct ui_progress *self, u64 curr)
72{
73 /*
74 * FIXME: We should have a per UI backend way of showing progress,
75 * stdio will just show a percentage as NN%, etc.
76 */
77 if (use_browser <= 0)
78 return;
79 newtScaleSet(self->scale, curr);
80 newtRefresh();
81}
82
83void ui_progress__delete(struct ui_progress *self)
84{
85 if (use_browser > 0) {
86 newtFormDestroy(self->form);
87 newtPopWindow();
88 }
89 free(self);
90}
91
/* Thin wrapper around newtPopHelpLine(). */
92static void ui_helpline__pop(void)
93{
94 newtPopHelpLine();
95}
96
/* Thin wrapper around newtPushHelpLine(): makes @msg the current help line. */
97static void ui_helpline__push(const char *msg)
98{
99 newtPushHelpLine(msg);
100}
101
/*
 * Format @fmt with the arguments in @ap and push the result as the new
 * help line. If the message cannot be allocated it is written to stderr
 * instead.
 */
static void ui_helpline__vpush(const char *fmt, va_list ap)
{
	char *s;
	va_list fallback;

	/*
	 * vasprintf() consumes @ap, and reusing a consumed va_list is
	 * undefined behaviour, so take a copy for the fallback path first.
	 */
	va_copy(fallback, ap);

	if (vasprintf(&s, fmt, ap) < 0) {
		vfprintf(stderr, fmt, fallback);
	} else {
		ui_helpline__push(s);
		free(s);
	}

	va_end(fallback);
}
113
/* printf-style front end to ui_helpline__vpush(): collects the variadic arguments and forwards them. */
114static void ui_helpline__fpush(const char *fmt, ...)
115{
116 va_list ap;
117
118 va_start(ap, fmt);
119 ui_helpline__vpush(fmt, ap);
120 va_end(ap);
121}
122
/* Replace the current help line: pop the top entry, then push @msg. */
123static void ui_helpline__puts(const char *msg)
124{
125 ui_helpline__pop();
126 ui_helpline__push(msg);
127}
128
129static char browser__last_msg[1024];
130
131int browser__show_help(const char *format, va_list ap)
132{
133 int ret;
134 static int backlog;
135
136 ret = vsnprintf(browser__last_msg + backlog,
137 sizeof(browser__last_msg) - backlog, format, ap);
138 backlog += ret;
139
140 if (browser__last_msg[backlog - 1] == '\n') {
141 ui_helpline__puts(browser__last_msg);
142 newtRefresh();
143 backlog = 0;
144 }
145
146 return ret;
147}
148
149static void newt_form__set_exit_keys(newtComponent self)
150{
151 newtFormAddHotKey(self, NEWT_KEY_LEFT);
152 newtFormAddHotKey(self, NEWT_KEY_ESCAPE);
153 newtFormAddHotKey(self, 'Q');
154 newtFormAddHotKey(self, 'q');
155 newtFormAddHotKey(self, CTRL('c'));
156}
157
158static newtComponent newt_form__new(void)
159{
160 newtComponent self = newtForm(NULL, NULL, 0);
161 if (self)
162 newt_form__set_exit_keys(self);
163 return self;
164}
165
166static int popup_menu(int argc, char * const argv[])
167{
168 struct newtExitStruct es;
169 int i, rc = -1, max_len = 5;
170 newtComponent listbox, form = newt_form__new();
171
172 if (form == NULL)
173 return -1;
174
175 listbox = newtListbox(0, 0, argc, NEWT_FLAG_RETURNEXIT);
176 if (listbox == NULL)
177 goto out_destroy_form;
178
179 newtFormAddComponent(form, listbox);
180
181 for (i = 0; i < argc; ++i) {
182 int len = strlen(argv[i]);
183 if (len > max_len)
184 max_len = len;
185 if (newtListboxAddEntry(listbox, argv[i], (void *)(long)i))
186 goto out_destroy_form;
187 }
188
189 newtCenteredWindow(max_len, argc, NULL);
190 newtFormRun(form, &es);
191 rc = newtListboxGetCurrent(listbox) - NULL;
192 if (es.reason == NEWT_EXIT_HOTKEY)
193 rc = -1;
194 newtPopWindow();
195out_destroy_form:
196 newtFormDestroy(form);
197 return rc;
198}
199
200static int ui__help_window(const char *text)
201{
202 struct newtExitStruct es;
203 newtComponent tb, form = newt_form__new();
204 int rc = -1;
205 int max_len = 0, nr_lines = 0;
206 const char *t;
207
208 if (form == NULL)
209 return -1;
210
211 t = text;
212 while (1) {
213 const char *sep = strchr(t, '\n');
214 int len;
215
216 if (sep == NULL)
217 sep = strchr(t, '\0');
218 len = sep - t;
219 if (max_len < len)
220 max_len = len;
221 ++nr_lines;
222 if (*sep == '\0')
223 break;
224 t = sep + 1;
225 }
226
227 tb = newtTextbox(0, 0, max_len, nr_lines, 0);
228 if (tb == NULL)
229 goto out_destroy_form;
230
231 newtTextboxSetText(tb, text);
232 newtFormAddComponent(form, tb);
233 newtCenteredWindow(max_len, nr_lines, NULL);
234 newtFormRun(form, &es);
235 newtPopWindow();
236 rc = 0;
237out_destroy_form:
238 newtFormDestroy(form);
239 return rc;
240}
241
242static bool dialog_yesno(const char *msg)
243{
244 /* newtWinChoice should really be accepting const char pointers... */
245 char yes[] = "Yes", no[] = "No";
246 return newtWinChoice(NULL, yes, no, (char *)msg) == 1;
247}
248
/*
 * Pop up an "Error" message window with an "Ok" button; @fmt and the
 * following arguments are forwarded to newtWinMessagev().
 */
static void ui__error_window(const char *fmt, ...)
{
	va_list args;

	va_start(args, fmt);
	newtWinMessagev((char *)"Error", (char *)"Ok", (char *)fmt, args);
	va_end(args);
}
257
258#define HE_COLORSET_TOP 50
259#define HE_COLORSET_MEDIUM 51
260#define HE_COLORSET_NORMAL 52
261#define HE_COLORSET_SELECTED 53
262#define HE_COLORSET_CODE 54
263
264static int ui_browser__percent_color(double percent, bool current)
265{
266 if (current)
267 return HE_COLORSET_SELECTED;
268 if (percent >= MIN_RED)
269 return HE_COLORSET_TOP;
270 if (percent >= MIN_GREEN)
271 return HE_COLORSET_MEDIUM;
272 return HE_COLORSET_NORMAL;
273}
274
275struct ui_browser {
276 newtComponent form, sb;
277 u64 index, first_visible_entry_idx;
278 void *first_visible_entry, *entries;
279 u16 top, left, width, height;
280 void *priv;
281 u32 nr_entries;
282};
283
284static void ui_browser__refresh_dimensions(struct ui_browser *self)
285{
286 int cols, rows;
287 newtGetScreenSize(&cols, &rows);
288
289 if (self->width > cols - 4)
290 self->width = cols - 4;
291 self->height = rows - 5;
292 if (self->height > self->nr_entries)
293 self->height = self->nr_entries;
294 self->top = (rows - self->height) / 2;
295 self->left = (cols - self->width) / 2;
296}
297
298static void ui_browser__reset_index(struct ui_browser *self)
299{
300 self->index = self->first_visible_entry_idx = 0;
301 self->first_visible_entry = NULL;
302}
303
304static int objdump_line__show(struct objdump_line *self, struct list_head *head,
305 int width, struct hist_entry *he, int len,
306 bool current_entry)
307{
308 if (self->offset != -1) {
309 struct symbol *sym = he->ms.sym;
310 unsigned int hits = 0;
311 double percent = 0.0;
312 int color;
313 struct sym_priv *priv = symbol__priv(sym);
314 struct sym_ext *sym_ext = priv->ext;
315 struct sym_hist *h = priv->hist;
316 s64 offset = self->offset;
317 struct objdump_line *next = objdump__get_next_ip_line(head, self);
318
319 while (offset < (s64)len &&
320 (next == NULL || offset < next->offset)) {
321 if (sym_ext) {
322 percent += sym_ext[offset].percent;
323 } else
324 hits += h->ip[offset];
325
326 ++offset;
327 }
328
329 if (sym_ext == NULL && h->sum)
330 percent = 100.0 * hits / h->sum;
331
332 color = ui_browser__percent_color(percent, current_entry);
333 SLsmg_set_color(color);
334 slsmg_printf(" %7.2f ", percent);
335 if (!current_entry)
336 SLsmg_set_color(HE_COLORSET_CODE);
337 } else {
338 int color = ui_browser__percent_color(0, current_entry);
339 SLsmg_set_color(color);
340 slsmg_write_nstring(" ", 9);
341 }
342
343 SLsmg_write_char(':');
344 slsmg_write_nstring(" ", 8);
345 if (!*self->line)
346 slsmg_write_nstring(" ", width - 18);
347 else
348 slsmg_write_nstring(self->line, width - 18);
349
350 return 0;
351}
352
353static int ui_browser__refresh_entries(struct ui_browser *self)
354{
355 struct objdump_line *pos;
356 struct list_head *head = self->entries;
357 struct hist_entry *he = self->priv;
358 int row = 0;
359 int len = he->ms.sym->end - he->ms.sym->start;
360
361 if (self->first_visible_entry == NULL || self->first_visible_entry == self->entries)
362 self->first_visible_entry = head->next;
363
364 pos = list_entry(self->first_visible_entry, struct objdump_line, node);
365
366 list_for_each_entry_from(pos, head, node) {
367 bool current_entry = (self->first_visible_entry_idx + row) == self->index;
368 SLsmg_gotorc(self->top + row, self->left);
369 objdump_line__show(pos, head, self->width,
370 he, len, current_entry);
371 if (++row == self->height)
372 break;
373 }
374
375 SLsmg_set_color(HE_COLORSET_NORMAL);
376 SLsmg_fill_region(self->top + row, self->left,
377 self->height - row, self->width, ' ');
378
379 return 0;
380}
381
382static int ui_browser__run(struct ui_browser *self, const char *title,
383 struct newtExitStruct *es)
384{
385 if (self->form) {
386 newtFormDestroy(self->form);
387 newtPopWindow();
388 }
389
390 ui_browser__refresh_dimensions(self);
391 newtCenteredWindow(self->width + 2, self->height, title);
392 self->form = newt_form__new();
393 if (self->form == NULL)
394 return -1;
395
396 self->sb = newtVerticalScrollbar(self->width + 1, 0, self->height,
397 HE_COLORSET_NORMAL,
398 HE_COLORSET_SELECTED);
399 if (self->sb == NULL)
400 return -1;
401
402 newtFormAddHotKey(self->form, NEWT_KEY_UP);
403 newtFormAddHotKey(self->form, NEWT_KEY_DOWN);
404 newtFormAddHotKey(self->form, NEWT_KEY_PGUP);
405 newtFormAddHotKey(self->form, NEWT_KEY_PGDN);
406 newtFormAddHotKey(self->form, ' ');
407 newtFormAddHotKey(self->form, NEWT_KEY_HOME);
408 newtFormAddHotKey(self->form, NEWT_KEY_END);
409 newtFormAddHotKey(self->form, NEWT_KEY_TAB);
410 newtFormAddHotKey(self->form, NEWT_KEY_RIGHT);
411
412 if (ui_browser__refresh_entries(self) < 0)
413 return -1;
414 newtFormAddComponent(self->form, self->sb);
415
416 while (1) {
417 unsigned int offset;
418
419 newtFormRun(self->form, es);
420
421 if (es->reason != NEWT_EXIT_HOTKEY)
422 break;
423 if (is_exit_key(es->u.key))
424 return es->u.key;
425 switch (es->u.key) {
426 case NEWT_KEY_DOWN:
427 if (self->index == self->nr_entries - 1)
428 break;
429 ++self->index;
430 if (self->index == self->first_visible_entry_idx + self->height) {
431 struct list_head *pos = self->first_visible_entry;
432 ++self->first_visible_entry_idx;
433 self->first_visible_entry = pos->next;
434 }
435 break;
436 case NEWT_KEY_UP:
437 if (self->index == 0)
438 break;
439 --self->index;
440 if (self->index < self->first_visible_entry_idx) {
441 struct list_head *pos = self->first_visible_entry;
442 --self->first_visible_entry_idx;
443 self->first_visible_entry = pos->prev;
444 }
445 break;
446 case NEWT_KEY_PGDN:
447 case ' ':
448 if (self->first_visible_entry_idx + self->height > self->nr_entries - 1)
449 break;
450
451 offset = self->height;
452 if (self->index + offset > self->nr_entries - 1)
453 offset = self->nr_entries - 1 - self->index;
454 self->index += offset;
455 self->first_visible_entry_idx += offset;
456
457 while (offset--) {
458 struct list_head *pos = self->first_visible_entry;
459 self->first_visible_entry = pos->next;
460 }
461
462 break;
463 case NEWT_KEY_PGUP:
464 if (self->first_visible_entry_idx == 0)
465 break;
466
467 if (self->first_visible_entry_idx < self->height)
468 offset = self->first_visible_entry_idx;
469 else
470 offset = self->height;
471
472 self->index -= offset;
473 self->first_visible_entry_idx -= offset;
474
475 while (offset--) {
476 struct list_head *pos = self->first_visible_entry;
477 self->first_visible_entry = pos->prev;
478 }
479 break;
480 case NEWT_KEY_HOME:
481 ui_browser__reset_index(self);
482 break;
483 case NEWT_KEY_END: {
484 struct list_head *head = self->entries;
485 offset = self->height - 1;
486
487 if (offset > self->nr_entries)
488 offset = self->nr_entries;
489
490 self->index = self->first_visible_entry_idx = self->nr_entries - 1 - offset;
491 self->first_visible_entry = head->prev;
492 while (offset-- != 0) {
493 struct list_head *pos = self->first_visible_entry;
494 self->first_visible_entry = pos->prev;
495 }
496 }
497 break;
498 case NEWT_KEY_RIGHT:
499 case NEWT_KEY_LEFT:
500 case NEWT_KEY_TAB:
501 return es->u.key;
502 default:
503 continue;
504 }
505 if (ui_browser__refresh_entries(self) < 0)
506 return -1;
507 }
508 return 0;
509}
510
511/*
512 * When debugging newt problems it was useful to be able to "unroll"
513 * the calls to newtCheckBoxTreeAdd{Array,Item}, so that we can generate
514 * a source file with the sequence of calls to these methods, to then
515 * tweak the arrays to get the intended results, so I'm keeping this code
516 * here, may be useful again in the future.
517 */
518#undef NEWT_DEBUG
519
520static void newt_checkbox_tree__add(newtComponent tree, const char *str,
521 void *priv, int *indexes)
522{
523#ifdef NEWT_DEBUG
524 /* Print the newtCheckboxTreeAddArray to tinker with its index arrays */
525 int i = 0, len = 40 - strlen(str);
526
527 fprintf(stderr,
528 "\tnewtCheckboxTreeAddItem(tree, %*.*s\"%s\", (void *)%p, 0, ",
529 len, len, " ", str, priv);
530 while (indexes[i] != NEWT_ARG_LAST) {
531 if (indexes[i] != NEWT_ARG_APPEND)
532 fprintf(stderr, " %d,", indexes[i]);
533 else
534 fprintf(stderr, " %s,", "NEWT_ARG_APPEND");
535 ++i;
536 }
537 fprintf(stderr, " %s", " NEWT_ARG_LAST);\n");
538 fflush(stderr);
539#endif
540 newtCheckboxTreeAddArray(tree, str, priv, 0, indexes);
541}
542
543static char *callchain_list__sym_name(struct callchain_list *self,
544 char *bf, size_t bfsize)
545{
546 if (self->ms.sym)
547 return self->ms.sym->name;
548
549 snprintf(bf, bfsize, "%#Lx", self->ip);
550 return bf;
551}
552
553static void __callchain__append_graph_browser(struct callchain_node *self,
554 newtComponent tree, u64 total,
555 int *indexes, int depth)
556{
557 struct rb_node *node;
558 u64 new_total, remaining;
559 int idx = 0;
560
561 if (callchain_param.mode == CHAIN_GRAPH_REL)
562 new_total = self->children_hit;
563 else
564 new_total = total;
565
566 remaining = new_total;
567 node = rb_first(&self->rb_root);
568 while (node) {
569 struct callchain_node *child = rb_entry(node, struct callchain_node, rb_node);
570 struct rb_node *next = rb_next(node);
571 u64 cumul = cumul_hits(child);
572 struct callchain_list *chain;
573 int first = true, printed = 0;
574 int chain_idx = -1;
575 remaining -= cumul;
576
577 indexes[depth] = NEWT_ARG_APPEND;
578 indexes[depth + 1] = NEWT_ARG_LAST;
579
580 list_for_each_entry(chain, &child->val, list) {
581 char ipstr[BITS_PER_LONG / 4 + 1],
582 *alloc_str = NULL;
583 const char *str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr));
584
585 if (first) {
586 double percent = cumul * 100.0 / new_total;
587
588 first = false;
589 if (asprintf(&alloc_str, "%2.2f%% %s", percent, str) < 0)
590 str = "Not enough memory!";
591 else
592 str = alloc_str;
593 } else {
594 indexes[depth] = idx;
595 indexes[depth + 1] = NEWT_ARG_APPEND;
596 indexes[depth + 2] = NEWT_ARG_LAST;
597 ++chain_idx;
598 }
599 newt_checkbox_tree__add(tree, str, &chain->ms, indexes);
600 free(alloc_str);
601 ++printed;
602 }
603
604 indexes[depth] = idx;
605 if (chain_idx != -1)
606 indexes[depth + 1] = chain_idx;
607 if (printed != 0)
608 ++idx;
609 __callchain__append_graph_browser(child, tree, new_total, indexes,
610 depth + (chain_idx != -1 ? 2 : 1));
611 node = next;
612 }
613}
614
615static void callchain__append_graph_browser(struct callchain_node *self,
616 newtComponent tree, u64 total,
617 int *indexes, int parent_idx)
618{
619 struct callchain_list *chain;
620 int i = 0;
621
622 indexes[1] = NEWT_ARG_APPEND;
623 indexes[2] = NEWT_ARG_LAST;
624
625 list_for_each_entry(chain, &self->val, list) {
626 char ipstr[BITS_PER_LONG / 4 + 1], *str;
627
628 if (chain->ip >= PERF_CONTEXT_MAX)
629 continue;
630
631 if (!i++ && sort__first_dimension == SORT_SYM)
632 continue;
633
634 str = callchain_list__sym_name(chain, ipstr, sizeof(ipstr));
635 newt_checkbox_tree__add(tree, str, &chain->ms, indexes);
636 }
637
638 indexes[1] = parent_idx;
639 indexes[2] = NEWT_ARG_APPEND;
640 indexes[3] = NEWT_ARG_LAST;
641 __callchain__append_graph_browser(self, tree, total, indexes, 2);
642}
643
644static void hist_entry__append_callchain_browser(struct hist_entry *self,
645 newtComponent tree, u64 total, int parent_idx)
646{
647 struct rb_node *rb_node;
648 int indexes[1024] = { [0] = parent_idx, };
649 int idx = 0;
650 struct callchain_node *chain;
651
652 rb_node = rb_first(&self->sorted_chain);
653 while (rb_node) {
654 chain = rb_entry(rb_node, struct callchain_node, rb_node);
655 switch (callchain_param.mode) {
656 case CHAIN_FLAT:
657 break;
658 case CHAIN_GRAPH_ABS: /* falldown */
659 case CHAIN_GRAPH_REL:
660 callchain__append_graph_browser(chain, tree, total, indexes, idx++);
661 break;
662 case CHAIN_NONE:
663 default:
664 break;
665 }
666 rb_node = rb_next(rb_node);
667 }
668}
669
670static size_t hist_entry__append_browser(struct hist_entry *self,
671 newtComponent tree, u64 total)
672{
673 char s[256];
674 size_t ret;
675
676 if (symbol_conf.exclude_other && !self->parent)
677 return 0;
678
679 ret = hist_entry__snprintf(self, s, sizeof(s), NULL,
680 false, 0, false, total);
681 if (symbol_conf.use_callchain) {
682 int indexes[2];
683
684 indexes[0] = NEWT_ARG_APPEND;
685 indexes[1] = NEWT_ARG_LAST;
686 newt_checkbox_tree__add(tree, s, &self->ms, indexes);
687 } else
688 newtListboxAppendEntry(tree, s, &self->ms);
689
690 return ret;
691}
692
693int hist_entry__tui_annotate(struct hist_entry *self)
694{
695 struct ui_browser browser;
696 struct newtExitStruct es;
697 struct objdump_line *pos, *n;
698 LIST_HEAD(head);
699 int ret;
700
701 if (self->ms.sym == NULL)
702 return -1;
703
704 if (self->ms.map->dso->annotate_warned)
705 return -1;
706
707 if (hist_entry__annotate(self, &head) < 0) {
708 ui__error_window(browser__last_msg);
709 return -1;
710 }
711
712 ui_helpline__push("Press <- or ESC to exit");
713
714 memset(&browser, 0, sizeof(browser));
715 browser.entries = &head;
716 browser.priv = self;
717 list_for_each_entry(pos, &head, node) {
718 size_t line_len = strlen(pos->line);
719 if (browser.width < line_len)
720 browser.width = line_len;
721 ++browser.nr_entries;
722 }
723
724 browser.width += 18; /* Percentage */
725 ret = ui_browser__run(&browser, self->ms.sym->name, &es);
726 newtFormDestroy(browser.form);
727 newtPopWindow();
728 list_for_each_entry_safe(pos, n, &head, node) {
729 list_del(&pos->node);
730 objdump_line__free(pos);
731 }
732 ui_helpline__pop();
733 return ret;
734}
735
736static const void *newt__symbol_tree_get_current(newtComponent self)
737{
738 if (symbol_conf.use_callchain)
739 return newtCheckboxTreeGetCurrent(self);
740 return newtListboxGetCurrent(self);
741}
742
743static void hist_browser__selection(newtComponent self, void *data)
744{
745 const struct map_symbol **symbol_ptr = data;
746 *symbol_ptr = newt__symbol_tree_get_current(self);
747}
748
749struct hist_browser {
750 newtComponent form, tree;
751 const struct map_symbol *selection;
752};
753
754static struct hist_browser *hist_browser__new(void)
755{
756 struct hist_browser *self = malloc(sizeof(*self));
757
758 if (self != NULL)
759 self->form = NULL;
760
761 return self;
762}
763
764static void hist_browser__delete(struct hist_browser *self)
765{
766 newtFormDestroy(self->form);
767 newtPopWindow();
768 free(self);
769}
770
771static int hist_browser__populate(struct hist_browser *self, struct hists *hists,
772 const char *title)
773{
774 int max_len = 0, idx, cols, rows;
775 struct ui_progress *progress;
776 struct rb_node *nd;
777 u64 curr_hist = 0;
778 char seq[] = ".", unit;
779 char str[256];
780 unsigned long nr_events = hists->stats.nr_events[PERF_RECORD_SAMPLE];
781
782 if (self->form) {
783 newtFormDestroy(self->form);
784 newtPopWindow();
785 }
786
787 nr_events = convert_unit(nr_events, &unit);
788 snprintf(str, sizeof(str), "Events: %lu%c ",
789 nr_events, unit);
790 newtDrawRootText(0, 0, str);
791
792 newtGetScreenSize(NULL, &rows);
793
794 if (symbol_conf.use_callchain)
795 self->tree = newtCheckboxTreeMulti(0, 0, rows - 5, seq,
796 NEWT_FLAG_SCROLL);
797 else
798 self->tree = newtListbox(0, 0, rows - 5,
799 (NEWT_FLAG_SCROLL |
800 NEWT_FLAG_RETURNEXIT));
801
802 newtComponentAddCallback(self->tree, hist_browser__selection,
803 &self->selection);
804
805 progress = ui_progress__new("Adding entries to the browser...",
806 hists->nr_entries);
807 if (progress == NULL)
808 return -1;
809
810 idx = 0;
811 for (nd = rb_first(&hists->entries); nd; nd = rb_next(nd)) {
812 struct hist_entry *h = rb_entry(nd, struct hist_entry, rb_node);
813 int len;
814
815 if (h->filtered)
816 continue;
817
818 len = hist_entry__append_browser(h, self->tree, hists->stats.total_period);
819 if (len > max_len)
820 max_len = len;
821 if (symbol_conf.use_callchain)
822 hist_entry__append_callchain_browser(h, self->tree,
823 hists->stats.total_period, idx++);
824 ++curr_hist;
825 if (curr_hist % 5)
826 ui_progress__update(progress, curr_hist);
827 }
828
829 ui_progress__delete(progress);
830
831 newtGetScreenSize(&cols, &rows);
832
833 if (max_len > cols)
834 max_len = cols - 3;
835
836 if (!symbol_conf.use_callchain)
837 newtListboxSetWidth(self->tree, max_len);
838
839 newtCenteredWindow(max_len + (symbol_conf.use_callchain ? 5 : 0),
840 rows - 5, title);
841 self->form = newt_form__new();
842 if (self->form == NULL)
843 return -1;
844
845 newtFormAddHotKey(self->form, 'A');
846 newtFormAddHotKey(self->form, 'a');
847 newtFormAddHotKey(self->form, 'D');
848 newtFormAddHotKey(self->form, 'd');
849 newtFormAddHotKey(self->form, 'T');
850 newtFormAddHotKey(self->form, 't');
851 newtFormAddHotKey(self->form, '?');
852 newtFormAddHotKey(self->form, 'H');
853 newtFormAddHotKey(self->form, 'h');
854 newtFormAddHotKey(self->form, NEWT_KEY_F1);
855 newtFormAddHotKey(self->form, NEWT_KEY_RIGHT);
856 newtFormAddHotKey(self->form, NEWT_KEY_TAB);
857 newtFormAddHotKey(self->form, NEWT_KEY_UNTAB);
858 newtFormAddComponents(self->form, self->tree, NULL);
859 self->selection = newt__symbol_tree_get_current(self->tree);
860
861 return 0;
862}
863
864static struct hist_entry *hist_browser__selected_entry(struct hist_browser *self)
865{
866 int *indexes;
867
868 if (!symbol_conf.use_callchain)
869 goto out;
870
871 indexes = newtCheckboxTreeFindItem(self->tree, (void *)self->selection);
872 if (indexes) {
873 bool is_hist_entry = indexes[1] == NEWT_ARG_LAST;
874 free(indexes);
875 if (is_hist_entry)
876 goto out;
877 }
878 return NULL;
879out:
880 return container_of(self->selection, struct hist_entry, ms);
881}
882
883static struct thread *hist_browser__selected_thread(struct hist_browser *self)
884{
885 struct hist_entry *he = hist_browser__selected_entry(self);
886 return he ? he->thread : NULL;
887}
888
889static int hist_browser__title(char *bf, size_t size, const char *ev_name,
890 const struct dso *dso, const struct thread *thread)
891{
892 int printed = 0;
893
894 if (thread)
895 printed += snprintf(bf + printed, size - printed,
896 "Thread: %s(%d)",
897 (thread->comm_set ? thread->comm : ""),
898 thread->pid);
899 if (dso)
900 printed += snprintf(bf + printed, size - printed,
901 "%sDSO: %s", thread ? " " : "",
902 dso->short_name);
903 return printed ?: snprintf(bf, size, "Event: %s", ev_name);
904}
905
906int hists__browse(struct hists *self, const char *helpline, const char *ev_name)
907{
908 struct hist_browser *browser = hist_browser__new();
909 struct pstack *fstack;
910 const struct thread *thread_filter = NULL;
911 const struct dso *dso_filter = NULL;
912 struct newtExitStruct es;
913 char msg[160];
914 int key = -1;
915
916 if (browser == NULL)
917 return -1;
918
919 fstack = pstack__new(2);
920 if (fstack == NULL)
921 goto out;
922
923 ui_helpline__push(helpline);
924
925 hist_browser__title(msg, sizeof(msg), ev_name,
926 dso_filter, thread_filter);
927 if (hist_browser__populate(browser, self, msg) < 0)
928 goto out_free_stack;
929
930 while (1) {
931 const struct thread *thread;
932 const struct dso *dso;
933 char *options[16];
934 int nr_options = 0, choice = 0, i,
935 annotate = -2, zoom_dso = -2, zoom_thread = -2;
936
937 newtFormRun(browser->form, &es);
938
939 thread = hist_browser__selected_thread(browser);
940 dso = browser->selection->map ? browser->selection->map->dso : NULL;
941
942 if (es.reason == NEWT_EXIT_HOTKEY) {
943 key = es.u.key;
944
945 switch (key) {
946 case NEWT_KEY_F1:
947 goto do_help;
948 case NEWT_KEY_TAB:
949 case NEWT_KEY_UNTAB:
950 /*
951 * Exit the browser, let hists__browser_tree
952 * go to the next or previous
953 */
954 goto out_free_stack;
955 default:;
956 }
957
958 key = toupper(key);
959 switch (key) {
960 case 'A':
961 if (browser->selection->map == NULL &&
962 browser->selection->map->dso->annotate_warned)
963 continue;
964 goto do_annotate;
965 case 'D':
966 goto zoom_dso;
967 case 'T':
968 goto zoom_thread;
969 case 'H':
970 case '?':
971do_help:
972 ui__help_window("-> Zoom into DSO/Threads & Annotate current symbol\n"
973 "<- Zoom out\n"
974 "a Annotate current symbol\n"
975 "h/?/F1 Show this window\n"
976 "d Zoom into current DSO\n"
977 "t Zoom into current Thread\n"
978 "q/CTRL+C Exit browser");
979 continue;
980 default:;
981 }
982 if (is_exit_key(key)) {
983 if (key == NEWT_KEY_ESCAPE) {
984 if (dialog_yesno("Do you really want to exit?"))
985 break;
986 else
987 continue;
988 } else
989 break;
990 }
991
992 if (es.u.key == NEWT_KEY_LEFT) {
993 const void *top;
994
995 if (pstack__empty(fstack))
996 continue;
997 top = pstack__pop(fstack);
998 if (top == &dso_filter)
999 goto zoom_out_dso;
1000 if (top == &thread_filter)
1001 goto zoom_out_thread;
1002 continue;
1003 }
1004 }
1005
1006 if (browser->selection->sym != NULL &&
1007 !browser->selection->map->dso->annotate_warned &&
1008 asprintf(&options[nr_options], "Annotate %s",
1009 browser->selection->sym->name) > 0)
1010 annotate = nr_options++;
1011
1012 if (thread != NULL &&
1013 asprintf(&options[nr_options], "Zoom %s %s(%d) thread",
1014 (thread_filter ? "out of" : "into"),
1015 (thread->comm_set ? thread->comm : ""),
1016 thread->pid) > 0)
1017 zoom_thread = nr_options++;
1018
1019 if (dso != NULL &&
1020 asprintf(&options[nr_options], "Zoom %s %s DSO",
1021 (dso_filter ? "out of" : "into"),
1022 (dso->kernel ? "the Kernel" : dso->short_name)) > 0)
1023 zoom_dso = nr_options++;
1024
1025 options[nr_options++] = (char *)"Exit";
1026
1027 choice = popup_menu(nr_options, options);
1028
1029 for (i = 0; i < nr_options - 1; ++i)
1030 free(options[i]);
1031
1032 if (choice == nr_options - 1)
1033 break;
1034
1035 if (choice == -1)
1036 continue;
1037
1038 if (choice == annotate) {
1039 struct hist_entry *he;
1040do_annotate:
1041 if (browser->selection->map->dso->origin == DSO__ORIG_KERNEL) {
1042 browser->selection->map->dso->annotate_warned = 1;
1043 ui_helpline__puts("No vmlinux file found, can't "
1044 "annotate with just a "
1045 "kallsyms file");
1046 continue;
1047 }
1048
1049 he = hist_browser__selected_entry(browser);
1050 if (he == NULL)
1051 continue;
1052
1053 hist_entry__tui_annotate(he);
1054 } else if (choice == zoom_dso) {
1055zoom_dso:
1056 if (dso_filter) {
1057 pstack__remove(fstack, &dso_filter);
1058zoom_out_dso:
1059 ui_helpline__pop();
1060 dso_filter = NULL;
1061 } else {
1062 if (dso == NULL)
1063 continue;
1064 ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s DSO\"",
1065 dso->kernel ? "the Kernel" : dso->short_name);
1066 dso_filter = dso;
1067 pstack__push(fstack, &dso_filter);
1068 }
1069 hists__filter_by_dso(self, dso_filter);
1070 hist_browser__title(msg, sizeof(msg), ev_name,
1071 dso_filter, thread_filter);
1072 if (hist_browser__populate(browser, self, msg) < 0)
1073 goto out;
1074 } else if (choice == zoom_thread) {
1075zoom_thread:
1076 if (thread_filter) {
1077 pstack__remove(fstack, &thread_filter);
1078zoom_out_thread:
1079 ui_helpline__pop();
1080 thread_filter = NULL;
1081 } else {
1082 ui_helpline__fpush("To zoom out press <- or -> + \"Zoom out of %s(%d) thread\"",
1083 thread->comm_set ? thread->comm : "",
1084 thread->pid);
1085 thread_filter = thread;
1086 pstack__push(fstack, &thread_filter);
1087 }
1088 hists__filter_by_thread(self, thread_filter);
1089 hist_browser__title(msg, sizeof(msg), ev_name,
1090 dso_filter, thread_filter);
1091 if (hist_browser__populate(browser, self, msg) < 0)
1092 goto out;
1093 }
1094 }
1095out_free_stack:
1096 pstack__delete(fstack);
1097out:
1098 hist_browser__delete(browser);
1099 return key;
1100}
1101
1102int hists__tui_browse_tree(struct rb_root *self, const char *help)
1103{
1104 struct rb_node *first = rb_first(self), *nd = first, *next;
1105 int key = 0;
1106
1107 while (nd) {
1108 struct hists *hists = rb_entry(nd, struct hists, rb_node);
1109 const char *ev_name = __event_name(hists->type, hists->config);
1110
1111 key = hists__browse(hists, help, ev_name);
1112
1113 if (is_exit_key(key))
1114 break;
1115
1116 switch (key) {
1117 case NEWT_KEY_TAB:
1118 next = rb_next(nd);
1119 if (next)
1120 nd = next;
1121 break;
1122 case NEWT_KEY_UNTAB:
1123 if (nd == first)
1124 continue;
1125 nd = rb_prev(nd);
1126 default:
1127 break;
1128 }
1129 }
1130
1131 return key;
1132}
1133
/*
 * Foreground/background color names for each HE_COLORSET_* entry, as
 * handed to sltt_set_color() by setup_browser().
 */
static struct newtPercentTreeColors {
	const char *topColorFg, *topColorBg;
	const char *mediumColorFg, *mediumColorBg;
	const char *normalColorFg, *normalColorBg;
	const char *selColorFg, *selColorBg;
	const char *codeColorFg, *codeColorBg;
} defaultPercentTreeColors = {
	.topColorFg	= "red",
	.topColorBg	= "lightgray",
	.mediumColorFg	= "green",
	.mediumColorBg	= "lightgray",
	.normalColorFg	= "black",
	.normalColorBg	= "lightgray",
	.selColorFg	= "lightgray",
	.selColorBg	= "magenta",
	.codeColorFg	= "blue",
	.codeColorBg	= "lightgray",
};
1147
1148void setup_browser(void)
1149{
1150 struct newtPercentTreeColors *c = &defaultPercentTreeColors;
1151
1152 if (!isatty(1) || !use_browser || dump_trace) {
1153 use_browser = 0;
1154 setup_pager();
1155 return;
1156 }
1157
1158 use_browser = 1;
1159 newtInit();
1160 newtCls();
1161 ui_helpline__puts(" ");
1162 sltt_set_color(HE_COLORSET_TOP, NULL, c->topColorFg, c->topColorBg);
1163 sltt_set_color(HE_COLORSET_MEDIUM, NULL, c->mediumColorFg, c->mediumColorBg);
1164 sltt_set_color(HE_COLORSET_NORMAL, NULL, c->normalColorFg, c->normalColorBg);
1165 sltt_set_color(HE_COLORSET_SELECTED, NULL, c->selColorFg, c->selColorBg);
1166 sltt_set_color(HE_COLORSET_CODE, NULL, c->codeColorFg, c->codeColorBg);
1167}
1168
1169void exit_browser(bool wait_for_ok)
1170{
1171 if (use_browser > 0) {
1172 if (wait_for_ok) {
1173 char title[] = "Fatal Error", ok[] = "Ok";
1174 newtWinMessage(title, ok, browser__last_msg);
1175 }
1176 newtFinished();
1177 }
1178}
diff --git a/tools/perf/util/parse-events.c b/tools/perf/util/parse-events.c
index e5bc0fb016b2..9bf0f402ca73 100644
--- a/tools/perf/util/parse-events.c
+++ b/tools/perf/util/parse-events.c
@@ -5,6 +5,7 @@
5#include "parse-events.h" 5#include "parse-events.h"
6#include "exec_cmd.h" 6#include "exec_cmd.h"
7#include "string.h" 7#include "string.h"
8#include "symbol.h"
8#include "cache.h" 9#include "cache.h"
9#include "header.h" 10#include "header.h"
10#include "debugfs.h" 11#include "debugfs.h"
@@ -409,7 +410,6 @@ static enum event_result
409parse_single_tracepoint_event(char *sys_name, 410parse_single_tracepoint_event(char *sys_name,
410 const char *evt_name, 411 const char *evt_name,
411 unsigned int evt_length, 412 unsigned int evt_length,
412 char *flags,
413 struct perf_event_attr *attr, 413 struct perf_event_attr *attr,
414 const char **strp) 414 const char **strp)
415{ 415{
@@ -418,14 +418,6 @@ parse_single_tracepoint_event(char *sys_name,
418 u64 id; 418 u64 id;
419 int fd; 419 int fd;
420 420
421 if (flags) {
422 if (!strncmp(flags, "record", strlen(flags))) {
423 attr->sample_type |= PERF_SAMPLE_RAW;
424 attr->sample_type |= PERF_SAMPLE_TIME;
425 attr->sample_type |= PERF_SAMPLE_CPU;
426 }
427 }
428
429 snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path, 421 snprintf(evt_path, MAXPATHLEN, "%s/%s/%s/id", debugfs_path,
430 sys_name, evt_name); 422 sys_name, evt_name);
431 423
@@ -444,13 +436,21 @@ parse_single_tracepoint_event(char *sys_name,
444 attr->type = PERF_TYPE_TRACEPOINT; 436 attr->type = PERF_TYPE_TRACEPOINT;
445 *strp = evt_name + evt_length; 437 *strp = evt_name + evt_length;
446 438
439 attr->sample_type |= PERF_SAMPLE_RAW;
440 attr->sample_type |= PERF_SAMPLE_TIME;
441 attr->sample_type |= PERF_SAMPLE_CPU;
442
443 attr->sample_period = 1;
444
445
447 return EVT_HANDLED; 446 return EVT_HANDLED;
448} 447}
449 448
450/* sys + ':' + event + ':' + flags*/ 449/* sys + ':' + event + ':' + flags*/
451#define MAX_EVOPT_LEN (MAX_EVENT_LENGTH * 2 + 2 + 128) 450#define MAX_EVOPT_LEN (MAX_EVENT_LENGTH * 2 + 2 + 128)
452static enum event_result 451static enum event_result
453parse_subsystem_tracepoint_event(char *sys_name, char *flags) 452parse_multiple_tracepoint_event(char *sys_name, const char *evt_exp,
453 char *flags)
454{ 454{
455 char evt_path[MAXPATHLEN]; 455 char evt_path[MAXPATHLEN];
456 struct dirent *evt_ent; 456 struct dirent *evt_ent;
@@ -474,6 +474,9 @@ parse_subsystem_tracepoint_event(char *sys_name, char *flags)
474 || !strcmp(evt_ent->d_name, "filter")) 474 || !strcmp(evt_ent->d_name, "filter"))
475 continue; 475 continue;
476 476
477 if (!strglobmatch(evt_ent->d_name, evt_exp))
478 continue;
479
477 len = snprintf(event_opt, MAX_EVOPT_LEN, "%s:%s%s%s", sys_name, 480 len = snprintf(event_opt, MAX_EVOPT_LEN, "%s:%s%s%s", sys_name,
478 evt_ent->d_name, flags ? ":" : "", 481 evt_ent->d_name, flags ? ":" : "",
479 flags ?: ""); 482 flags ?: "");
@@ -522,13 +525,13 @@ static enum event_result parse_tracepoint_event(const char **strp,
522 if (evt_length >= MAX_EVENT_LENGTH) 525 if (evt_length >= MAX_EVENT_LENGTH)
523 return EVT_FAILED; 526 return EVT_FAILED;
524 527
525 if (!strcmp(evt_name, "*")) { 528 if (strpbrk(evt_name, "*?")) {
526 *strp = evt_name + evt_length; 529 *strp = evt_name + evt_length;
527 return parse_subsystem_tracepoint_event(sys_name, flags); 530 return parse_multiple_tracepoint_event(sys_name, evt_name,
531 flags);
528 } else 532 } else
529 return parse_single_tracepoint_event(sys_name, evt_name, 533 return parse_single_tracepoint_event(sys_name, evt_name,
530 evt_length, flags, 534 evt_length, attr, strp);
531 attr, strp);
532} 535}
533 536
534static enum event_result 537static enum event_result
@@ -685,19 +688,29 @@ static enum event_result
685parse_event_modifier(const char **strp, struct perf_event_attr *attr) 688parse_event_modifier(const char **strp, struct perf_event_attr *attr)
686{ 689{
687 const char *str = *strp; 690 const char *str = *strp;
688 int eu = 1, ek = 1, eh = 1; 691 int exclude = 0;
692 int eu = 0, ek = 0, eh = 0, precise = 0;
689 693
690 if (*str++ != ':') 694 if (*str++ != ':')
691 return 0; 695 return 0;
692 while (*str) { 696 while (*str) {
693 if (*str == 'u') 697 if (*str == 'u') {
698 if (!exclude)
699 exclude = eu = ek = eh = 1;
694 eu = 0; 700 eu = 0;
695 else if (*str == 'k') 701 } else if (*str == 'k') {
702 if (!exclude)
703 exclude = eu = ek = eh = 1;
696 ek = 0; 704 ek = 0;
697 else if (*str == 'h') 705 } else if (*str == 'h') {
706 if (!exclude)
707 exclude = eu = ek = eh = 1;
698 eh = 0; 708 eh = 0;
699 else 709 } else if (*str == 'p') {
710 precise++;
711 } else
700 break; 712 break;
713
701 ++str; 714 ++str;
702 } 715 }
703 if (str >= *strp + 2) { 716 if (str >= *strp + 2) {
@@ -705,6 +718,7 @@ parse_event_modifier(const char **strp, struct perf_event_attr *attr)
705 attr->exclude_user = eu; 718 attr->exclude_user = eu;
706 attr->exclude_kernel = ek; 719 attr->exclude_kernel = ek;
707 attr->exclude_hv = eh; 720 attr->exclude_hv = eh;
721 attr->precise_ip = precise;
708 return 1; 722 return 1;
709 } 723 }
710 return 0; 724 return 0;
@@ -753,11 +767,11 @@ modifier:
753 return ret; 767 return ret;
754} 768}
755 769
756static void store_event_type(const char *orgname) 770static int store_event_type(const char *orgname)
757{ 771{
758 char filename[PATH_MAX], *c; 772 char filename[PATH_MAX], *c;
759 FILE *file; 773 FILE *file;
760 int id; 774 int id, n;
761 775
762 sprintf(filename, "%s/", debugfs_path); 776 sprintf(filename, "%s/", debugfs_path);
763 strncat(filename, orgname, strlen(orgname)); 777 strncat(filename, orgname, strlen(orgname));
@@ -769,11 +783,14 @@ static void store_event_type(const char *orgname)
769 783
770 file = fopen(filename, "r"); 784 file = fopen(filename, "r");
771 if (!file) 785 if (!file)
772 return; 786 return 0;
773 if (fscanf(file, "%i", &id) < 1) 787 n = fscanf(file, "%i", &id);
774 die("cannot store event ID");
775 fclose(file); 788 fclose(file);
776 perf_header__push_event(id, orgname); 789 if (n < 1) {
790 pr_err("cannot store event ID\n");
791 return -EINVAL;
792 }
793 return perf_header__push_event(id, orgname);
777} 794}
778 795
779int parse_events(const struct option *opt __used, const char *str, int unset __used) 796int parse_events(const struct option *opt __used, const char *str, int unset __used)
@@ -782,7 +799,8 @@ int parse_events(const struct option *opt __used, const char *str, int unset __u
782 enum event_result ret; 799 enum event_result ret;
783 800
784 if (strchr(str, ':')) 801 if (strchr(str, ':'))
785 store_event_type(str); 802 if (store_event_type(str) < 0)
803 return -1;
786 804
787 for (;;) { 805 for (;;) {
788 if (nr_counters == MAX_COUNTERS) 806 if (nr_counters == MAX_COUNTERS)
@@ -835,11 +853,12 @@ int parse_filter(const struct option *opt __used, const char *str,
835} 853}
836 854
837static const char * const event_type_descriptors[] = { 855static const char * const event_type_descriptors[] = {
838 "",
839 "Hardware event", 856 "Hardware event",
840 "Software event", 857 "Software event",
841 "Tracepoint event", 858 "Tracepoint event",
842 "Hardware cache event", 859 "Hardware cache event",
860 "Raw hardware event descriptor",
861 "Hardware breakpoint",
843}; 862};
844 863
845/* 864/*
@@ -872,7 +891,7 @@ static void print_tracepoint_events(void)
872 snprintf(evt_path, MAXPATHLEN, "%s:%s", 891 snprintf(evt_path, MAXPATHLEN, "%s:%s",
873 sys_dirent.d_name, evt_dirent.d_name); 892 sys_dirent.d_name, evt_dirent.d_name);
874 printf(" %-42s [%s]\n", evt_path, 893 printf(" %-42s [%s]\n", evt_path,
875 event_type_descriptors[PERF_TYPE_TRACEPOINT+1]); 894 event_type_descriptors[PERF_TYPE_TRACEPOINT]);
876 } 895 }
877 closedir(evt_dir); 896 closedir(evt_dir);
878 } 897 }
@@ -892,9 +911,7 @@ void print_events(void)
892 printf("List of pre-defined events (to be used in -e):\n"); 911 printf("List of pre-defined events (to be used in -e):\n");
893 912
894 for (i = 0; i < ARRAY_SIZE(event_symbols); i++, syms++) { 913 for (i = 0; i < ARRAY_SIZE(event_symbols); i++, syms++) {
895 type = syms->type + 1; 914 type = syms->type;
896 if (type >= ARRAY_SIZE(event_type_descriptors))
897 type = 0;
898 915
899 if (type != prev_type) 916 if (type != prev_type)
900 printf("\n"); 917 printf("\n");
@@ -919,17 +936,20 @@ void print_events(void)
919 for (i = 0; i < PERF_COUNT_HW_CACHE_RESULT_MAX; i++) { 936 for (i = 0; i < PERF_COUNT_HW_CACHE_RESULT_MAX; i++) {
920 printf(" %-42s [%s]\n", 937 printf(" %-42s [%s]\n",
921 event_cache_name(type, op, i), 938 event_cache_name(type, op, i),
922 event_type_descriptors[4]); 939 event_type_descriptors[PERF_TYPE_HW_CACHE]);
923 } 940 }
924 } 941 }
925 } 942 }
926 943
927 printf("\n"); 944 printf("\n");
928 printf(" %-42s [raw hardware event descriptor]\n", 945 printf(" %-42s [%s]\n",
929 "rNNN"); 946 "rNNN (see 'perf list --help' on how to encode it)",
947 event_type_descriptors[PERF_TYPE_RAW]);
930 printf("\n"); 948 printf("\n");
931 949
932 printf(" %-42s [hardware breakpoint]\n", "mem:<addr>[:access]"); 950 printf(" %-42s [%s]\n",
951 "mem:<addr>[:access]",
952 event_type_descriptors[PERF_TYPE_BREAKPOINT]);
933 printf("\n"); 953 printf("\n");
934 954
935 print_tracepoint_events(); 955 print_tracepoint_events();
diff --git a/tools/perf/util/parse-events.h b/tools/perf/util/parse-events.h
index b8c1f64bc935..fc4ab3fe877a 100644
--- a/tools/perf/util/parse-events.h
+++ b/tools/perf/util/parse-events.h
@@ -13,6 +13,7 @@ struct tracepoint_path {
13}; 13};
14 14
15extern struct tracepoint_path *tracepoint_id_to_path(u64 config); 15extern struct tracepoint_path *tracepoint_id_to_path(u64 config);
16extern bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events);
16 17
17extern int nr_counters; 18extern int nr_counters;
18 19
diff --git a/tools/perf/util/parse-options.c b/tools/perf/util/parse-options.c
index efebd5b476b3..99d02aa57dbf 100644
--- a/tools/perf/util/parse-options.c
+++ b/tools/perf/util/parse-options.c
@@ -49,8 +49,9 @@ static int get_value(struct parse_opt_ctx_t *p,
49 break; 49 break;
50 /* FALLTHROUGH */ 50 /* FALLTHROUGH */
51 case OPTION_BOOLEAN: 51 case OPTION_BOOLEAN:
52 case OPTION_INCR:
52 case OPTION_BIT: 53 case OPTION_BIT:
53 case OPTION_SET_INT: 54 case OPTION_SET_UINT:
54 case OPTION_SET_PTR: 55 case OPTION_SET_PTR:
55 return opterror(opt, "takes no value", flags); 56 return opterror(opt, "takes no value", flags);
56 case OPTION_END: 57 case OPTION_END:
@@ -58,7 +59,9 @@ static int get_value(struct parse_opt_ctx_t *p,
58 case OPTION_GROUP: 59 case OPTION_GROUP:
59 case OPTION_STRING: 60 case OPTION_STRING:
60 case OPTION_INTEGER: 61 case OPTION_INTEGER:
62 case OPTION_UINTEGER:
61 case OPTION_LONG: 63 case OPTION_LONG:
64 case OPTION_U64:
62 default: 65 default:
63 break; 66 break;
64 } 67 }
@@ -73,11 +76,15 @@ static int get_value(struct parse_opt_ctx_t *p,
73 return 0; 76 return 0;
74 77
75 case OPTION_BOOLEAN: 78 case OPTION_BOOLEAN:
79 *(bool *)opt->value = unset ? false : true;
80 return 0;
81
82 case OPTION_INCR:
76 *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1; 83 *(int *)opt->value = unset ? 0 : *(int *)opt->value + 1;
77 return 0; 84 return 0;
78 85
79 case OPTION_SET_INT: 86 case OPTION_SET_UINT:
80 *(int *)opt->value = unset ? 0 : opt->defval; 87 *(unsigned int *)opt->value = unset ? 0 : opt->defval;
81 return 0; 88 return 0;
82 89
83 case OPTION_SET_PTR: 90 case OPTION_SET_PTR:
@@ -120,6 +127,22 @@ static int get_value(struct parse_opt_ctx_t *p,
120 return opterror(opt, "expects a numerical value", flags); 127 return opterror(opt, "expects a numerical value", flags);
121 return 0; 128 return 0;
122 129
130 case OPTION_UINTEGER:
131 if (unset) {
132 *(unsigned int *)opt->value = 0;
133 return 0;
134 }
135 if (opt->flags & PARSE_OPT_OPTARG && !p->opt) {
136 *(unsigned int *)opt->value = opt->defval;
137 return 0;
138 }
139 if (get_arg(p, opt, flags, &arg))
140 return -1;
141 *(unsigned int *)opt->value = strtol(arg, (char **)&s, 10);
142 if (*s)
143 return opterror(opt, "expects a numerical value", flags);
144 return 0;
145
123 case OPTION_LONG: 146 case OPTION_LONG:
124 if (unset) { 147 if (unset) {
125 *(long *)opt->value = 0; 148 *(long *)opt->value = 0;
@@ -136,6 +159,22 @@ static int get_value(struct parse_opt_ctx_t *p,
136 return opterror(opt, "expects a numerical value", flags); 159 return opterror(opt, "expects a numerical value", flags);
137 return 0; 160 return 0;
138 161
162 case OPTION_U64:
163 if (unset) {
164 *(u64 *)opt->value = 0;
165 return 0;
166 }
167 if (opt->flags & PARSE_OPT_OPTARG && !p->opt) {
168 *(u64 *)opt->value = opt->defval;
169 return 0;
170 }
171 if (get_arg(p, opt, flags, &arg))
172 return -1;
173 *(u64 *)opt->value = strtoull(arg, (char **)&s, 10);
174 if (*s)
175 return opterror(opt, "expects a numerical value", flags);
176 return 0;
177
139 case OPTION_END: 178 case OPTION_END:
140 case OPTION_ARGUMENT: 179 case OPTION_ARGUMENT:
141 case OPTION_GROUP: 180 case OPTION_GROUP:
@@ -441,7 +480,10 @@ int usage_with_options_internal(const char * const *usagestr,
441 switch (opts->type) { 480 switch (opts->type) {
442 case OPTION_ARGUMENT: 481 case OPTION_ARGUMENT:
443 break; 482 break;
483 case OPTION_LONG:
484 case OPTION_U64:
444 case OPTION_INTEGER: 485 case OPTION_INTEGER:
486 case OPTION_UINTEGER:
445 if (opts->flags & PARSE_OPT_OPTARG) 487 if (opts->flags & PARSE_OPT_OPTARG)
446 if (opts->long_name) 488 if (opts->long_name)
447 pos += fprintf(stderr, "[=<n>]"); 489 pos += fprintf(stderr, "[=<n>]");
@@ -473,14 +515,14 @@ int usage_with_options_internal(const char * const *usagestr,
473 pos += fprintf(stderr, " ..."); 515 pos += fprintf(stderr, " ...");
474 } 516 }
475 break; 517 break;
476 default: /* OPTION_{BIT,BOOLEAN,SET_INT,SET_PTR} */ 518 default: /* OPTION_{BIT,BOOLEAN,SET_UINT,SET_PTR} */
477 case OPTION_END: 519 case OPTION_END:
478 case OPTION_GROUP: 520 case OPTION_GROUP:
479 case OPTION_BIT: 521 case OPTION_BIT:
480 case OPTION_BOOLEAN: 522 case OPTION_BOOLEAN:
481 case OPTION_SET_INT: 523 case OPTION_INCR:
524 case OPTION_SET_UINT:
482 case OPTION_SET_PTR: 525 case OPTION_SET_PTR:
483 case OPTION_LONG:
484 break; 526 break;
485 } 527 }
486 528
@@ -500,6 +542,7 @@ int usage_with_options_internal(const char * const *usagestr,
500void usage_with_options(const char * const *usagestr, 542void usage_with_options(const char * const *usagestr,
501 const struct option *opts) 543 const struct option *opts)
502{ 544{
545 exit_browser(false);
503 usage_with_options_internal(usagestr, opts, 0); 546 usage_with_options_internal(usagestr, opts, 0);
504 exit(129); 547 exit(129);
505} 548}
diff --git a/tools/perf/util/parse-options.h b/tools/perf/util/parse-options.h
index 948805af43c2..c7d72dce54b2 100644
--- a/tools/perf/util/parse-options.h
+++ b/tools/perf/util/parse-options.h
@@ -1,6 +1,9 @@
1#ifndef __PERF_PARSE_OPTIONS_H 1#ifndef __PERF_PARSE_OPTIONS_H
2#define __PERF_PARSE_OPTIONS_H 2#define __PERF_PARSE_OPTIONS_H
3 3
4#include <linux/kernel.h>
5#include <stdbool.h>
6
4enum parse_opt_type { 7enum parse_opt_type {
5 /* special types */ 8 /* special types */
6 OPTION_END, 9 OPTION_END,
@@ -8,14 +11,17 @@ enum parse_opt_type {
8 OPTION_GROUP, 11 OPTION_GROUP,
9 /* options with no arguments */ 12 /* options with no arguments */
10 OPTION_BIT, 13 OPTION_BIT,
11 OPTION_BOOLEAN, /* _INCR would have been a better name */ 14 OPTION_BOOLEAN,
12 OPTION_SET_INT, 15 OPTION_INCR,
16 OPTION_SET_UINT,
13 OPTION_SET_PTR, 17 OPTION_SET_PTR,
14 /* options with arguments (usually) */ 18 /* options with arguments (usually) */
15 OPTION_STRING, 19 OPTION_STRING,
16 OPTION_INTEGER, 20 OPTION_INTEGER,
17 OPTION_LONG, 21 OPTION_LONG,
18 OPTION_CALLBACK, 22 OPTION_CALLBACK,
23 OPTION_U64,
24 OPTION_UINTEGER,
19}; 25};
20 26
21enum parse_opt_flags { 27enum parse_opt_flags {
@@ -73,7 +79,7 @@ typedef int parse_opt_cb(const struct option *, const char *arg, int unset);
73 * 79 *
74 * `defval`:: 80 * `defval`::
75 * default value to fill (*->value) with for PARSE_OPT_OPTARG. 81 * default value to fill (*->value) with for PARSE_OPT_OPTARG.
76 * OPTION_{BIT,SET_INT,SET_PTR} store the {mask,integer,pointer} to put in 82 * OPTION_{BIT,SET_UINT,SET_PTR} store the {mask,integer,pointer} to put in
77 * the value when met. 83 * the value when met.
78 * CALLBACKS can use it like they want. 84 * CALLBACKS can use it like they want.
79 */ 85 */
@@ -90,16 +96,21 @@ struct option {
90 intptr_t defval; 96 intptr_t defval;
91}; 97};
92 98
99#define check_vtype(v, type) ( BUILD_BUG_ON_ZERO(!__builtin_types_compatible_p(typeof(v), type)) + v )
100
93#define OPT_END() { .type = OPTION_END } 101#define OPT_END() { .type = OPTION_END }
94#define OPT_ARGUMENT(l, h) { .type = OPTION_ARGUMENT, .long_name = (l), .help = (h) } 102#define OPT_ARGUMENT(l, h) { .type = OPTION_ARGUMENT, .long_name = (l), .help = (h) }
95#define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) } 103#define OPT_GROUP(h) { .type = OPTION_GROUP, .help = (h) }
96#define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (b) } 104#define OPT_BIT(s, l, v, h, b) { .type = OPTION_BIT, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h), .defval = (b) }
97#define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } 105#define OPT_BOOLEAN(s, l, v, h) { .type = OPTION_BOOLEAN, .short_name = (s), .long_name = (l), .value = check_vtype(v, bool *), .help = (h) }
98#define OPT_SET_INT(s, l, v, h, i) { .type = OPTION_SET_INT, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (i) } 106#define OPT_INCR(s, l, v, h) { .type = OPTION_INCR, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h) }
107#define OPT_SET_UINT(s, l, v, h, i) { .type = OPTION_SET_UINT, .short_name = (s), .long_name = (l), .value = check_vtype(v, unsigned int *), .help = (h), .defval = (i) }
99#define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) } 108#define OPT_SET_PTR(s, l, v, h, p) { .type = OPTION_SET_PTR, .short_name = (s), .long_name = (l), .value = (v), .help = (h), .defval = (p) }
100#define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } 109#define OPT_INTEGER(s, l, v, h) { .type = OPTION_INTEGER, .short_name = (s), .long_name = (l), .value = check_vtype(v, int *), .help = (h) }
101#define OPT_LONG(s, l, v, h) { .type = OPTION_LONG, .short_name = (s), .long_name = (l), .value = (v), .help = (h) } 110#define OPT_UINTEGER(s, l, v, h) { .type = OPTION_UINTEGER, .short_name = (s), .long_name = (l), .value = check_vtype(v, unsigned int *), .help = (h) }
102#define OPT_STRING(s, l, v, a, h) { .type = OPTION_STRING, .short_name = (s), .long_name = (l), .value = (v), (a), .help = (h) } 111#define OPT_LONG(s, l, v, h) { .type = OPTION_LONG, .short_name = (s), .long_name = (l), .value = check_vtype(v, long *), .help = (h) }
112#define OPT_U64(s, l, v, h) { .type = OPTION_U64, .short_name = (s), .long_name = (l), .value = check_vtype(v, u64 *), .help = (h) }
113#define OPT_STRING(s, l, v, a, h) { .type = OPTION_STRING, .short_name = (s), .long_name = (l), .value = check_vtype(v, const char **), (a), .help = (h) }
103#define OPT_DATE(s, l, v, h) \ 114#define OPT_DATE(s, l, v, h) \
104 { .type = OPTION_CALLBACK, .short_name = (s), .long_name = (l), .value = (v), .argh = "time", .help = (h), .callback = parse_opt_approxidate_cb } 115 { .type = OPTION_CALLBACK, .short_name = (s), .long_name = (l), .value = (v), .argh = "time", .help = (h), .callback = parse_opt_approxidate_cb }
105#define OPT_CALLBACK(s, l, v, a, h, f) \ 116#define OPT_CALLBACK(s, l, v, a, h, f) \
diff --git a/tools/perf/util/path.c b/tools/perf/util/path.c
index fd1f2faaade4..58a470d036dd 100644
--- a/tools/perf/util/path.c
+++ b/tools/perf/util/path.c
@@ -54,21 +54,6 @@ static char *cleanup_path(char *path)
54 return path; 54 return path;
55} 55}
56 56
57char *mksnpath(char *buf, size_t n, const char *fmt, ...)
58{
59 va_list args;
60 unsigned len;
61
62 va_start(args, fmt);
63 len = vsnprintf(buf, n, fmt, args);
64 va_end(args);
65 if (len >= n) {
66 strlcpy(buf, bad_path, n);
67 return buf;
68 }
69 return cleanup_path(buf);
70}
71
72static char *perf_vsnpath(char *buf, size_t n, const char *fmt, va_list args) 57static char *perf_vsnpath(char *buf, size_t n, const char *fmt, va_list args)
73{ 58{
74 const char *perf_dir = get_perf_dir(); 59 const char *perf_dir = get_perf_dir();
@@ -89,15 +74,6 @@ bad:
89 return buf; 74 return buf;
90} 75}
91 76
92char *perf_snpath(char *buf, size_t n, const char *fmt, ...)
93{
94 va_list args;
95 va_start(args, fmt);
96 (void)perf_vsnpath(buf, n, fmt, args);
97 va_end(args);
98 return buf;
99}
100
101char *perf_pathdup(const char *fmt, ...) 77char *perf_pathdup(const char *fmt, ...)
102{ 78{
103 char path[PATH_MAX]; 79 char path[PATH_MAX];
@@ -143,184 +119,6 @@ char *perf_path(const char *fmt, ...)
143 return cleanup_path(pathname); 119 return cleanup_path(pathname);
144} 120}
145 121
146
147/* perf_mkstemp() - create tmp file honoring TMPDIR variable */
148int perf_mkstemp(char *path, size_t len, const char *template)
149{
150 const char *tmp;
151 size_t n;
152
153 tmp = getenv("TMPDIR");
154 if (!tmp)
155 tmp = "/tmp";
156 n = snprintf(path, len, "%s/%s", tmp, template);
157 if (len <= n) {
158 errno = ENAMETOOLONG;
159 return -1;
160 }
161 return mkstemp(path);
162}
163
164
165const char *make_relative_path(const char *abs_path, const char *base)
166{
167 static char buf[PATH_MAX + 1];
168 int baselen;
169
170 if (!base)
171 return abs_path;
172
173 baselen = strlen(base);
174 if (prefixcmp(abs_path, base))
175 return abs_path;
176 if (abs_path[baselen] == '/')
177 baselen++;
178 else if (base[baselen - 1] != '/')
179 return abs_path;
180
181 strcpy(buf, abs_path + baselen);
182
183 return buf;
184}
185
186/*
187 * It is okay if dst == src, but they should not overlap otherwise.
188 *
189 * Performs the following normalizations on src, storing the result in dst:
190 * - Ensures that components are separated by '/' (Windows only)
191 * - Squashes sequences of '/'.
192 * - Removes "." components.
193 * - Removes ".." components, and the components the precede them.
194 * Returns failure (non-zero) if a ".." component appears as first path
195 * component anytime during the normalization. Otherwise, returns success (0).
196 *
197 * Note that this function is purely textual. It does not follow symlinks,
198 * verify the existence of the path, or make any system calls.
199 */
200int normalize_path_copy(char *dst, const char *src)
201{
202 char *dst0;
203
204 if (has_dos_drive_prefix(src)) {
205 *dst++ = *src++;
206 *dst++ = *src++;
207 }
208 dst0 = dst;
209
210 if (is_dir_sep(*src)) {
211 *dst++ = '/';
212 while (is_dir_sep(*src))
213 src++;
214 }
215
216 for (;;) {
217 char c = *src;
218
219 /*
220 * A path component that begins with . could be
221 * special:
222 * (1) "." and ends -- ignore and terminate.
223 * (2) "./" -- ignore them, eat slash and continue.
224 * (3) ".." and ends -- strip one and terminate.
225 * (4) "../" -- strip one, eat slash and continue.
226 */
227 if (c == '.') {
228 if (!src[1]) {
229 /* (1) */
230 src++;
231 } else if (is_dir_sep(src[1])) {
232 /* (2) */
233 src += 2;
234 while (is_dir_sep(*src))
235 src++;
236 continue;
237 } else if (src[1] == '.') {
238 if (!src[2]) {
239 /* (3) */
240 src += 2;
241 goto up_one;
242 } else if (is_dir_sep(src[2])) {
243 /* (4) */
244 src += 3;
245 while (is_dir_sep(*src))
246 src++;
247 goto up_one;
248 }
249 }
250 }
251
252 /* copy up to the next '/', and eat all '/' */
253 while ((c = *src++) != '\0' && !is_dir_sep(c))
254 *dst++ = c;
255 if (is_dir_sep(c)) {
256 *dst++ = '/';
257 while (is_dir_sep(c))
258 c = *src++;
259 src--;
260 } else if (!c)
261 break;
262 continue;
263
264 up_one:
265 /*
266 * dst0..dst is prefix portion, and dst[-1] is '/';
267 * go up one level.
268 */
269 dst--; /* go to trailing '/' */
270 if (dst <= dst0)
271 return -1;
272 /* Windows: dst[-1] cannot be backslash anymore */
273 while (dst0 < dst && dst[-1] != '/')
274 dst--;
275 }
276 *dst = '\0';
277 return 0;
278}
279
280/*
281 * path = Canonical absolute path
282 * prefix_list = Colon-separated list of absolute paths
283 *
284 * Determines, for each path in prefix_list, whether the "prefix" really
285 * is an ancestor directory of path. Returns the length of the longest
286 * ancestor directory, excluding any trailing slashes, or -1 if no prefix
287 * is an ancestor. (Note that this means 0 is returned if prefix_list is
288 * "/".) "/foo" is not considered an ancestor of "/foobar". Directories
289 * are not considered to be their own ancestors. path must be in a
290 * canonical form: empty components, or "." or ".." components are not
291 * allowed. prefix_list may be null, which is like "".
292 */
293int longest_ancestor_length(const char *path, const char *prefix_list)
294{
295 char buf[PATH_MAX+1];
296 const char *ceil, *colon;
297 int len, max_len = -1;
298
299 if (prefix_list == NULL || !strcmp(path, "/"))
300 return -1;
301
302 for (colon = ceil = prefix_list; *colon; ceil = colon+1) {
303 for (colon = ceil; *colon && *colon != PATH_SEP; colon++);
304 len = colon - ceil;
305 if (len == 0 || len > PATH_MAX || !is_absolute_path(ceil))
306 continue;
307 strlcpy(buf, ceil, len+1);
308 if (normalize_path_copy(buf, buf) < 0)
309 continue;
310 len = strlen(buf);
311 if (len > 0 && buf[len-1] == '/')
312 buf[--len] = '\0';
313
314 if (!strncmp(path, buf, len) &&
315 path[len] == '/' &&
316 len > max_len) {
317 max_len = len;
318 }
319 }
320
321 return max_len;
322}
323
324/* strip arbitrary amount of directory separators at end of path */ 122/* strip arbitrary amount of directory separators at end of path */
325static inline int chomp_trailing_dir_sep(const char *path, int len) 123static inline int chomp_trailing_dir_sep(const char *path, int len)
326{ 124{
@@ -354,5 +152,5 @@ char *strip_path_suffix(const char *path, const char *suffix)
354 152
355 if (path_len && !is_dir_sep(path[path_len - 1])) 153 if (path_len && !is_dir_sep(path[path_len - 1]))
356 return NULL; 154 return NULL;
357 return xstrndup(path, chomp_trailing_dir_sep(path, path_len)); 155 return strndup(path, chomp_trailing_dir_sep(path, path_len));
358} 156}
diff --git a/tools/perf/util/probe-event.c b/tools/perf/util/probe-event.c
index fde17b090a47..914c67095d96 100644
--- a/tools/perf/util/probe-event.c
+++ b/tools/perf/util/probe-event.c
@@ -33,18 +33,27 @@
33#include <limits.h> 33#include <limits.h>
34 34
35#undef _GNU_SOURCE 35#undef _GNU_SOURCE
36#include "util.h"
36#include "event.h" 37#include "event.h"
37#include "string.h" 38#include "string.h"
38#include "strlist.h" 39#include "strlist.h"
39#include "debug.h" 40#include "debug.h"
40#include "parse-events.h" /* For debugfs_path */ 41#include "cache.h"
42#include "color.h"
43#include "symbol.h"
44#include "thread.h"
45#include "debugfs.h"
46#include "trace-event.h" /* For __unused */
41#include "probe-event.h" 47#include "probe-event.h"
48#include "probe-finder.h"
42 49
43#define MAX_CMDLEN 256 50#define MAX_CMDLEN 256
44#define MAX_PROBE_ARGS 128 51#define MAX_PROBE_ARGS 128
45#define PERFPROBE_GROUP "probe" 52#define PERFPROBE_GROUP "probe"
46 53
47#define semantic_error(msg ...) die("Semantic error :" msg) 54bool probe_event_dry_run; /* Dry run flag */
55
56#define semantic_error(msg ...) pr_err("Semantic error :" msg)
48 57
49/* If there is no space to write, returns -E2BIG. */ 58/* If there is no space to write, returns -E2BIG. */
50static int e_snprintf(char *str, size_t size, const char *format, ...) 59static int e_snprintf(char *str, size_t size, const char *format, ...)
@@ -62,6 +71,326 @@ static int e_snprintf(char *str, size_t size, const char *format, ...)
62 return ret; 71 return ret;
63} 72}
64 73
74static char *synthesize_perf_probe_point(struct perf_probe_point *pp);
75static struct machine machine;
76
77/* Initialize symbol maps and path of vmlinux */
78static int init_vmlinux(void)
79{
80 struct dso *kernel;
81 int ret;
82
83 symbol_conf.sort_by_name = true;
84 if (symbol_conf.vmlinux_name == NULL)
85 symbol_conf.try_vmlinux_path = true;
86 else
87 pr_debug("Use vmlinux: %s\n", symbol_conf.vmlinux_name);
88 ret = symbol__init();
89 if (ret < 0) {
90 pr_debug("Failed to init symbol map.\n");
91 goto out;
92 }
93
94 ret = machine__init(&machine, "/", 0);
95 if (ret < 0)
96 goto out;
97
98 kernel = dso__new_kernel(symbol_conf.vmlinux_name);
99 if (kernel == NULL)
100 die("Failed to create kernel dso.");
101
102 ret = __machine__create_kernel_maps(&machine, kernel);
103 if (ret < 0)
104 pr_debug("Failed to create kernel maps.\n");
105
106out:
107 if (ret < 0)
108 pr_warning("Failed to init vmlinux path.\n");
109 return ret;
110}
111
112#ifdef DWARF_SUPPORT
113static int open_vmlinux(void)
114{
115 if (map__load(machine.vmlinux_maps[MAP__FUNCTION], NULL) < 0) {
116 pr_debug("Failed to load kernel map.\n");
117 return -EINVAL;
118 }
119 pr_debug("Try to open %s\n", machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name);
120 return open(machine.vmlinux_maps[MAP__FUNCTION]->dso->long_name, O_RDONLY);
121}
122
123/* Convert trace point to probe point with debuginfo */
124static int convert_to_perf_probe_point(struct kprobe_trace_point *tp,
125 struct perf_probe_point *pp)
126{
127 struct symbol *sym;
128 int fd, ret = -ENOENT;
129
130 sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION],
131 tp->symbol, NULL);
132 if (sym) {
133 fd = open_vmlinux();
134 if (fd >= 0) {
135 ret = find_perf_probe_point(fd,
136 sym->start + tp->offset, pp);
137 close(fd);
138 }
139 }
140 if (ret <= 0) {
141 pr_debug("Failed to find corresponding probes from "
142 "debuginfo. Use kprobe event information.\n");
143 pp->function = strdup(tp->symbol);
144 if (pp->function == NULL)
145 return -ENOMEM;
146 pp->offset = tp->offset;
147 }
148 pp->retprobe = tp->retprobe;
149
150 return 0;
151}
152
153/* Try to find perf_probe_event with debuginfo */
154static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev,
155 struct kprobe_trace_event **tevs,
156 int max_tevs)
157{
158 bool need_dwarf = perf_probe_event_need_dwarf(pev);
159 int fd, ntevs;
160
161 fd = open_vmlinux();
162 if (fd < 0) {
163 if (need_dwarf) {
164 pr_warning("Failed to open debuginfo file.\n");
165 return fd;
166 }
167 pr_debug("Could not open vmlinux. Try to use symbols.\n");
168 return 0;
169 }
170
171 /* Searching trace events corresponding to probe event */
172 ntevs = find_kprobe_trace_events(fd, pev, tevs, max_tevs);
173 close(fd);
174
175 if (ntevs > 0) { /* Succeeded to find trace events */
176 pr_debug("find %d kprobe_trace_events.\n", ntevs);
177 return ntevs;
178 }
179
180 if (ntevs == 0) { /* No error but failed to find probe point. */
181 pr_warning("Probe point '%s' not found.\n",
182 synthesize_perf_probe_point(&pev->point));
183 return -ENOENT;
184 }
185 /* Error path : ntevs < 0 */
186 pr_debug("An error occurred in debuginfo analysis (%d).\n", ntevs);
187 if (ntevs == -EBADF) {
188 pr_warning("Warning: No dwarf info found in the vmlinux - "
189 "please rebuild kernel with CONFIG_DEBUG_INFO=y.\n");
190 if (!need_dwarf) {
191 pr_debug("Trying to use symbols.\nn");
192 return 0;
193 }
194 }
195 return ntevs;
196}
197
198#define LINEBUF_SIZE 256
199#define NR_ADDITIONAL_LINES 2
200
201static int show_one_line(FILE *fp, int l, bool skip, bool show_num)
202{
203 char buf[LINEBUF_SIZE];
204 const char *color = PERF_COLOR_BLUE;
205
206 if (fgets(buf, LINEBUF_SIZE, fp) == NULL)
207 goto error;
208 if (!skip) {
209 if (show_num)
210 fprintf(stdout, "%7d %s", l, buf);
211 else
212 color_fprintf(stdout, color, " %s", buf);
213 }
214
215 while (strlen(buf) == LINEBUF_SIZE - 1 &&
216 buf[LINEBUF_SIZE - 2] != '\n') {
217 if (fgets(buf, LINEBUF_SIZE, fp) == NULL)
218 goto error;
219 if (!skip) {
220 if (show_num)
221 fprintf(stdout, "%s", buf);
222 else
223 color_fprintf(stdout, color, "%s", buf);
224 }
225 }
226
227 return 0;
228error:
229 if (feof(fp))
230 pr_warning("Source file is shorter than expected.\n");
231 else
232 pr_warning("File read error: %s\n", strerror(errno));
233
234 return -1;
235}
236
237/*
238 * Show line-range always requires debuginfo to find source file and
239 * line number.
240 */
241int show_line_range(struct line_range *lr)
242{
243 int l = 1;
244 struct line_node *ln;
245 FILE *fp;
246 int fd, ret;
247
248 /* Search a line range */
249 ret = init_vmlinux();
250 if (ret < 0)
251 return ret;
252
253 fd = open_vmlinux();
254 if (fd < 0) {
255 pr_warning("Failed to open debuginfo file.\n");
256 return fd;
257 }
258
259 ret = find_line_range(fd, lr);
260 close(fd);
261 if (ret == 0) {
262 pr_warning("Specified source line is not found.\n");
263 return -ENOENT;
264 } else if (ret < 0) {
265 pr_warning("Debuginfo analysis failed. (%d)\n", ret);
266 return ret;
267 }
268
269 setup_pager();
270
271 if (lr->function)
272 fprintf(stdout, "<%s:%d>\n", lr->function,
273 lr->start - lr->offset);
274 else
275 fprintf(stdout, "<%s:%d>\n", lr->file, lr->start);
276
277 fp = fopen(lr->path, "r");
278 if (fp == NULL) {
279 pr_warning("Failed to open %s: %s\n", lr->path,
280 strerror(errno));
281 return -errno;
282 }
283 /* Skip to starting line number */
284 while (l < lr->start && ret >= 0)
285 ret = show_one_line(fp, l++, true, false);
286 if (ret < 0)
287 goto end;
288
289 list_for_each_entry(ln, &lr->line_list, list) {
290 while (ln->line > l && ret >= 0)
291 ret = show_one_line(fp, (l++) - lr->offset,
292 false, false);
293 if (ret >= 0)
294 ret = show_one_line(fp, (l++) - lr->offset,
295 false, true);
296 if (ret < 0)
297 goto end;
298 }
299
300 if (lr->end == INT_MAX)
301 lr->end = l + NR_ADDITIONAL_LINES;
302 while (l <= lr->end && !feof(fp) && ret >= 0)
303 ret = show_one_line(fp, (l++) - lr->offset, false, false);
304end:
305 fclose(fp);
306 return ret;
307}
308
309#else /* !DWARF_SUPPORT */
310
311static int convert_to_perf_probe_point(struct kprobe_trace_point *tp,
312 struct perf_probe_point *pp)
313{
314 pp->function = strdup(tp->symbol);
315 if (pp->function == NULL)
316 return -ENOMEM;
317 pp->offset = tp->offset;
318 pp->retprobe = tp->retprobe;
319
320 return 0;
321}
322
323static int try_to_find_kprobe_trace_events(struct perf_probe_event *pev,
324 struct kprobe_trace_event **tevs __unused,
325 int max_tevs __unused)
326{
327 if (perf_probe_event_need_dwarf(pev)) {
328 pr_warning("Debuginfo-analysis is not supported.\n");
329 return -ENOSYS;
330 }
331 return 0;
332}
333
334int show_line_range(struct line_range *lr __unused)
335{
336 pr_warning("Debuginfo-analysis is not supported.\n");
337 return -ENOSYS;
338}
339
340#endif
341
342int parse_line_range_desc(const char *arg, struct line_range *lr)
343{
344 const char *ptr;
345 char *tmp;
346 /*
347 * <Syntax>
348 * SRC:SLN[+NUM|-ELN]
349 * FUNC[:SLN[+NUM|-ELN]]
350 */
351 ptr = strchr(arg, ':');
352 if (ptr) {
353 lr->start = (int)strtoul(ptr + 1, &tmp, 0);
354 if (*tmp == '+') {
355 lr->end = lr->start + (int)strtoul(tmp + 1, &tmp, 0);
356 lr->end--; /*
357 * Adjust the number of lines here.
358 * If the number of lines == 1, the
359 * end of line should be equal to
360 * the start of line.
361 */
362 } else if (*tmp == '-')
363 lr->end = (int)strtoul(tmp + 1, &tmp, 0);
364 else
365 lr->end = INT_MAX;
366 pr_debug("Line range is %d to %d\n", lr->start, lr->end);
367 if (lr->start > lr->end) {
368 semantic_error("Start line must be smaller"
369 " than end line.\n");
370 return -EINVAL;
371 }
372 if (*tmp != '\0') {
373 semantic_error("Tailing with invalid character '%d'.\n",
374 *tmp);
375 return -EINVAL;
376 }
377 tmp = strndup(arg, (ptr - arg));
378 } else {
379 tmp = strdup(arg);
380 lr->end = INT_MAX;
381 }
382
383 if (tmp == NULL)
384 return -ENOMEM;
385
386 if (strchr(tmp, '.'))
387 lr->file = tmp;
388 else
389 lr->function = tmp;
390
391 return 0;
392}
393
65/* Check the name is good for event/group */ 394/* Check the name is good for event/group */
66static bool check_event_name(const char *name) 395static bool check_event_name(const char *name)
67{ 396{
@@ -75,50 +404,66 @@ static bool check_event_name(const char *name)
75} 404}
76 405
77/* Parse probepoint definition. */ 406/* Parse probepoint definition. */
78static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp) 407static int parse_perf_probe_point(char *arg, struct perf_probe_event *pev)
79{ 408{
409 struct perf_probe_point *pp = &pev->point;
80 char *ptr, *tmp; 410 char *ptr, *tmp;
81 char c, nc = 0; 411 char c, nc = 0;
82 /* 412 /*
83 * <Syntax> 413 * <Syntax>
84 * perf probe [EVENT=]SRC:LN 414 * perf probe [EVENT=]SRC[:LN|;PTN]
85 * perf probe [EVENT=]FUNC[+OFFS|%return][@SRC] 415 * perf probe [EVENT=]FUNC[@SRC][+OFFS|%return|:LN|;PAT]
86 * 416 *
87 * TODO:Group name support 417 * TODO:Group name support
88 */ 418 */
89 419
90 ptr = strchr(arg, '='); 420 ptr = strpbrk(arg, ";=@+%");
91 if (ptr) { /* Event name */ 421 if (ptr && *ptr == '=') { /* Event name */
92 *ptr = '\0'; 422 *ptr = '\0';
93 tmp = ptr + 1; 423 tmp = ptr + 1;
94 ptr = strchr(arg, ':'); 424 if (strchr(arg, ':')) {
95 if (ptr) /* Group name is not supported yet. */ 425 semantic_error("Group name is not supported yet.\n");
96 semantic_error("Group name is not supported yet."); 426 return -ENOTSUP;
97 if (!check_event_name(arg)) 427 }
428 if (!check_event_name(arg)) {
98 semantic_error("%s is bad for event name -it must " 429 semantic_error("%s is bad for event name -it must "
99 "follow C symbol-naming rule.", arg); 430 "follow C symbol-naming rule.\n", arg);
100 pp->event = strdup(arg); 431 return -EINVAL;
432 }
433 pev->event = strdup(arg);
434 if (pev->event == NULL)
435 return -ENOMEM;
436 pev->group = NULL;
101 arg = tmp; 437 arg = tmp;
102 } 438 }
103 439
104 ptr = strpbrk(arg, ":+@%"); 440 ptr = strpbrk(arg, ";:+@%");
105 if (ptr) { 441 if (ptr) {
106 nc = *ptr; 442 nc = *ptr;
107 *ptr++ = '\0'; 443 *ptr++ = '\0';
108 } 444 }
109 445
446 tmp = strdup(arg);
447 if (tmp == NULL)
448 return -ENOMEM;
449
110 /* Check arg is function or file and copy it */ 450 /* Check arg is function or file and copy it */
111 if (strchr(arg, '.')) /* File */ 451 if (strchr(tmp, '.')) /* File */
112 pp->file = strdup(arg); 452 pp->file = tmp;
113 else /* Function */ 453 else /* Function */
114 pp->function = strdup(arg); 454 pp->function = tmp;
115 DIE_IF(pp->file == NULL && pp->function == NULL);
116 455
117 /* Parse other options */ 456 /* Parse other options */
118 while (ptr) { 457 while (ptr) {
119 arg = ptr; 458 arg = ptr;
120 c = nc; 459 c = nc;
121 ptr = strpbrk(arg, ":+@%"); 460 if (c == ';') { /* Lazy pattern must be the last part */
461 pp->lazy_line = strdup(arg);
462 if (pp->lazy_line == NULL)
463 return -ENOMEM;
464 break;
465 }
466 ptr = strpbrk(arg, ";:+@%");
122 if (ptr) { 467 if (ptr) {
123 nc = *ptr; 468 nc = *ptr;
124 *ptr++ = '\0'; 469 *ptr++ = '\0';
@@ -126,260 +471,658 @@ static void parse_perf_probe_probepoint(char *arg, struct probe_point *pp)
126 switch (c) { 471 switch (c) {
127 case ':': /* Line number */ 472 case ':': /* Line number */
128 pp->line = strtoul(arg, &tmp, 0); 473 pp->line = strtoul(arg, &tmp, 0);
129 if (*tmp != '\0') 474 if (*tmp != '\0') {
130 semantic_error("There is non-digit charactor" 475 semantic_error("There is non-digit char"
131 " in line number."); 476 " in line number.\n");
477 return -EINVAL;
478 }
132 break; 479 break;
133 case '+': /* Byte offset from a symbol */ 480 case '+': /* Byte offset from a symbol */
134 pp->offset = strtoul(arg, &tmp, 0); 481 pp->offset = strtoul(arg, &tmp, 0);
135 if (*tmp != '\0') 482 if (*tmp != '\0') {
136 semantic_error("There is non-digit charactor" 483 semantic_error("There is non-digit character"
137 " in offset."); 484 " in offset.\n");
485 return -EINVAL;
486 }
138 break; 487 break;
139 case '@': /* File name */ 488 case '@': /* File name */
140 if (pp->file) 489 if (pp->file) {
141 semantic_error("SRC@SRC is not allowed."); 490 semantic_error("SRC@SRC is not allowed.\n");
491 return -EINVAL;
492 }
142 pp->file = strdup(arg); 493 pp->file = strdup(arg);
143 DIE_IF(pp->file == NULL); 494 if (pp->file == NULL)
144 if (ptr) 495 return -ENOMEM;
145 semantic_error("@SRC must be the last "
146 "option.");
147 break; 496 break;
148 case '%': /* Probe places */ 497 case '%': /* Probe places */
149 if (strcmp(arg, "return") == 0) { 498 if (strcmp(arg, "return") == 0) {
150 pp->retprobe = 1; 499 pp->retprobe = 1;
151 } else /* Others not supported yet */ 500 } else { /* Others not supported yet */
152 semantic_error("%%%s is not supported.", arg); 501 semantic_error("%%%s is not supported.\n", arg);
502 return -ENOTSUP;
503 }
153 break; 504 break;
154 default: 505 default: /* Buggy case */
155 DIE_IF("Program has a bug."); 506 pr_err("This program has a bug at %s:%d.\n",
507 __FILE__, __LINE__);
508 return -ENOTSUP;
156 break; 509 break;
157 } 510 }
158 } 511 }
159 512
160 /* Exclusion check */ 513 /* Exclusion check */
161 if (pp->line && pp->offset) 514 if (pp->lazy_line && pp->line) {
515 semantic_error("Lazy pattern can't be used with line number.");
516 return -EINVAL;
517 }
518
519 if (pp->lazy_line && pp->offset) {
520 semantic_error("Lazy pattern can't be used with offset.");
521 return -EINVAL;
522 }
523
524 if (pp->line && pp->offset) {
162 semantic_error("Offset can't be used with line number."); 525 semantic_error("Offset can't be used with line number.");
526 return -EINVAL;
527 }
163 528
164 if (!pp->line && pp->file && !pp->function) 529 if (!pp->line && !pp->lazy_line && pp->file && !pp->function) {
165 semantic_error("File always requires line number."); 530 semantic_error("File always requires line number or "
531 "lazy pattern.");
532 return -EINVAL;
533 }
166 534
167 if (pp->offset && !pp->function) 535 if (pp->offset && !pp->function) {
168 semantic_error("Offset requires an entry function."); 536 semantic_error("Offset requires an entry function.");
537 return -EINVAL;
538 }
169 539
170 if (pp->retprobe && !pp->function) 540 if (pp->retprobe && !pp->function) {
171 semantic_error("Return probe requires an entry function."); 541 semantic_error("Return probe requires an entry function.");
542 return -EINVAL;
543 }
172 544
173 if ((pp->offset || pp->line) && pp->retprobe) 545 if ((pp->offset || pp->line || pp->lazy_line) && pp->retprobe) {
174 semantic_error("Offset/Line can't be used with return probe."); 546 semantic_error("Offset/Line/Lazy pattern can't be used with "
547 "return probe.");
548 return -EINVAL;
549 }
175 550
176 pr_debug("symbol:%s file:%s line:%d offset:%d, return:%d\n", 551 pr_debug("symbol:%s file:%s line:%d offset:%lu return:%d lazy:%s\n",
177 pp->function, pp->file, pp->line, pp->offset, pp->retprobe); 552 pp->function, pp->file, pp->line, pp->offset, pp->retprobe,
553 pp->lazy_line);
554 return 0;
178} 555}
179 556
180/* Parse perf-probe event definition */ 557/* Parse perf-probe event argument */
181void parse_perf_probe_event(const char *str, struct probe_point *pp, 558static int parse_perf_probe_arg(char *str, struct perf_probe_arg *arg)
182 bool *need_dwarf)
183{ 559{
184 char **argv; 560 char *tmp;
185 int argc, i; 561 struct perf_probe_arg_field **fieldp;
562
563 pr_debug("parsing arg: %s into ", str);
564
565 tmp = strchr(str, '=');
566 if (tmp) {
567 arg->name = strndup(str, tmp - str);
568 if (arg->name == NULL)
569 return -ENOMEM;
570 pr_debug("name:%s ", arg->name);
571 str = tmp + 1;
572 }
573
574 tmp = strchr(str, ':');
575 if (tmp) { /* Type setting */
576 *tmp = '\0';
577 arg->type = strdup(tmp + 1);
578 if (arg->type == NULL)
579 return -ENOMEM;
580 pr_debug("type:%s ", arg->type);
581 }
582
583 tmp = strpbrk(str, "-.");
584 if (!is_c_varname(str) || !tmp) {
585 /* A variable, register, symbol or special value */
586 arg->var = strdup(str);
587 if (arg->var == NULL)
588 return -ENOMEM;
589 pr_debug("%s\n", arg->var);
590 return 0;
591 }
592
593 /* Structure fields */
594 arg->var = strndup(str, tmp - str);
595 if (arg->var == NULL)
596 return -ENOMEM;
597 pr_debug("%s, ", arg->var);
598 fieldp = &arg->field;
599
600 do {
601 *fieldp = zalloc(sizeof(struct perf_probe_arg_field));
602 if (*fieldp == NULL)
603 return -ENOMEM;
604 if (*tmp == '.') {
605 str = tmp + 1;
606 (*fieldp)->ref = false;
607 } else if (tmp[1] == '>') {
608 str = tmp + 2;
609 (*fieldp)->ref = true;
610 } else {
611 semantic_error("Argument parse error: %s\n", str);
612 return -EINVAL;
613 }
186 614
187 *need_dwarf = false; 615 tmp = strpbrk(str, "-.");
616 if (tmp) {
617 (*fieldp)->name = strndup(str, tmp - str);
618 if ((*fieldp)->name == NULL)
619 return -ENOMEM;
620 pr_debug("%s(%d), ", (*fieldp)->name, (*fieldp)->ref);
621 fieldp = &(*fieldp)->next;
622 }
623 } while (tmp);
624 (*fieldp)->name = strdup(str);
625 if ((*fieldp)->name == NULL)
626 return -ENOMEM;
627 pr_debug("%s(%d)\n", (*fieldp)->name, (*fieldp)->ref);
628
629 /* If no name is specified, set the last field name */
630 if (!arg->name) {
631 arg->name = strdup((*fieldp)->name);
632 if (arg->name == NULL)
633 return -ENOMEM;
634 }
635 return 0;
636}
188 637
189 argv = argv_split(str, &argc); 638/* Parse perf-probe event command */
190 if (!argv) 639int parse_perf_probe_command(const char *cmd, struct perf_probe_event *pev)
191 die("argv_split failed."); 640{
192 if (argc > MAX_PROBE_ARGS + 1) 641 char **argv;
193 semantic_error("Too many arguments"); 642 int argc, i, ret = 0;
194 643
644 argv = argv_split(cmd, &argc);
645 if (!argv) {
646 pr_debug("Failed to split arguments.\n");
647 return -ENOMEM;
648 }
649 if (argc - 1 > MAX_PROBE_ARGS) {
650 semantic_error("Too many probe arguments (%d).\n", argc - 1);
651 ret = -ERANGE;
652 goto out;
653 }
195 /* Parse probe point */ 654 /* Parse probe point */
196 parse_perf_probe_probepoint(argv[0], pp); 655 ret = parse_perf_probe_point(argv[0], pev);
197 if (pp->file || pp->line) 656 if (ret < 0)
198 *need_dwarf = true; 657 goto out;
199 658
200 /* Copy arguments and ensure return probe has no C argument */ 659 /* Copy arguments and ensure return probe has no C argument */
201 pp->nr_args = argc - 1; 660 pev->nargs = argc - 1;
202 pp->args = zalloc(sizeof(char *) * pp->nr_args); 661 pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs);
203 for (i = 0; i < pp->nr_args; i++) { 662 if (pev->args == NULL) {
204 pp->args[i] = strdup(argv[i + 1]); 663 ret = -ENOMEM;
205 if (!pp->args[i]) 664 goto out;
206 die("Failed to copy argument."); 665 }
207 if (is_c_varname(pp->args[i])) { 666 for (i = 0; i < pev->nargs && ret >= 0; i++) {
208 if (pp->retprobe) 667 ret = parse_perf_probe_arg(argv[i + 1], &pev->args[i]);
209 semantic_error("You can't specify local" 668 if (ret >= 0 &&
210 " variable for kretprobe"); 669 is_c_varname(pev->args[i].var) && pev->point.retprobe) {
211 *need_dwarf = true; 670 semantic_error("You can't specify local variable for"
671 " kretprobe.\n");
672 ret = -EINVAL;
212 } 673 }
213 } 674 }
214 675out:
215 argv_free(argv); 676 argv_free(argv);
677
678 return ret;
679}
680
681/* Return true if this perf_probe_event requires debuginfo */
682bool perf_probe_event_need_dwarf(struct perf_probe_event *pev)
683{
684 int i;
685
686 if (pev->point.file || pev->point.line || pev->point.lazy_line)
687 return true;
688
689 for (i = 0; i < pev->nargs; i++)
690 if (is_c_varname(pev->args[i].var))
691 return true;
692
693 return false;
216} 694}
217 695
218/* Parse kprobe_events event into struct probe_point */ 696/* Parse kprobe_events event into struct probe_point */
219void parse_trace_kprobe_event(const char *str, struct probe_point *pp) 697int parse_kprobe_trace_command(const char *cmd, struct kprobe_trace_event *tev)
220{ 698{
699 struct kprobe_trace_point *tp = &tev->point;
221 char pr; 700 char pr;
222 char *p; 701 char *p;
223 int ret, i, argc; 702 int ret, i, argc;
224 char **argv; 703 char **argv;
225 704
226 pr_debug("Parsing kprobe_events: %s\n", str); 705 pr_debug("Parsing kprobe_events: %s\n", cmd);
227 argv = argv_split(str, &argc); 706 argv = argv_split(cmd, &argc);
228 if (!argv) 707 if (!argv) {
229 die("argv_split failed."); 708 pr_debug("Failed to split arguments.\n");
230 if (argc < 2) 709 return -ENOMEM;
231 semantic_error("Too less arguments."); 710 }
711 if (argc < 2) {
712 semantic_error("Too few probe arguments.\n");
713 ret = -ERANGE;
714 goto out;
715 }
232 716
233 /* Scan event and group name. */ 717 /* Scan event and group name. */
234 ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]", 718 ret = sscanf(argv[0], "%c:%a[^/ \t]/%a[^ \t]",
235 &pr, (float *)(void *)&pp->group, 719 &pr, (float *)(void *)&tev->group,
236 (float *)(void *)&pp->event); 720 (float *)(void *)&tev->event);
237 if (ret != 3) 721 if (ret != 3) {
238 semantic_error("Failed to parse event name: %s", argv[0]); 722 semantic_error("Failed to parse event name: %s\n", argv[0]);
239 pr_debug("Group:%s Event:%s probe:%c\n", pp->group, pp->event, pr); 723 ret = -EINVAL;
724 goto out;
725 }
726 pr_debug("Group:%s Event:%s probe:%c\n", tev->group, tev->event, pr);
240 727
241 pp->retprobe = (pr == 'r'); 728 tp->retprobe = (pr == 'r');
242 729
243 /* Scan function name and offset */ 730 /* Scan function name and offset */
244 ret = sscanf(argv[1], "%a[^+]+%d", (float *)(void *)&pp->function, 731 ret = sscanf(argv[1], "%a[^+]+%lu", (float *)(void *)&tp->symbol,
245 &pp->offset); 732 &tp->offset);
246 if (ret == 1) 733 if (ret == 1)
247 pp->offset = 0; 734 tp->offset = 0;
248
249 /* kprobe_events doesn't have this information */
250 pp->line = 0;
251 pp->file = NULL;
252 735
253 pp->nr_args = argc - 2; 736 tev->nargs = argc - 2;
254 pp->args = zalloc(sizeof(char *) * pp->nr_args); 737 tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs);
255 for (i = 0; i < pp->nr_args; i++) { 738 if (tev->args == NULL) {
739 ret = -ENOMEM;
740 goto out;
741 }
742 for (i = 0; i < tev->nargs; i++) {
256 p = strchr(argv[i + 2], '='); 743 p = strchr(argv[i + 2], '=');
257 if (p) /* We don't need which register is assigned. */ 744 if (p) /* We don't need which register is assigned. */
258 *p = '\0'; 745 *p++ = '\0';
259 pp->args[i] = strdup(argv[i + 2]); 746 else
260 if (!pp->args[i]) 747 p = argv[i + 2];
261 die("Failed to copy argument."); 748 tev->args[i].name = strdup(argv[i + 2]);
749 /* TODO: parse regs and offset */
750 tev->args[i].value = strdup(p);
751 if (tev->args[i].name == NULL || tev->args[i].value == NULL) {
752 ret = -ENOMEM;
753 goto out;
754 }
262 } 755 }
263 756 ret = 0;
757out:
264 argv_free(argv); 758 argv_free(argv);
759 return ret;
265} 760}
266 761
267/* Synthesize only probe point (not argument) */ 762/* Compose only probe arg */
268int synthesize_perf_probe_point(struct probe_point *pp) 763int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf, size_t len)
269{ 764{
270 char *buf; 765 struct perf_probe_arg_field *field = pa->field;
271 char offs[64] = "", line[64] = "";
272 int ret; 766 int ret;
767 char *tmp = buf;
273 768
274 pp->probes[0] = buf = zalloc(MAX_CMDLEN); 769 if (pa->name && pa->var)
275 pp->found = 1; 770 ret = e_snprintf(tmp, len, "%s=%s", pa->name, pa->var);
276 if (!buf) 771 else
277 die("Failed to allocate memory by zalloc."); 772 ret = e_snprintf(tmp, len, "%s", pa->name ? pa->name : pa->var);
773 if (ret <= 0)
774 goto error;
775 tmp += ret;
776 len -= ret;
777
778 while (field) {
779 ret = e_snprintf(tmp, len, "%s%s", field->ref ? "->" : ".",
780 field->name);
781 if (ret <= 0)
782 goto error;
783 tmp += ret;
784 len -= ret;
785 field = field->next;
786 }
787
788 if (pa->type) {
789 ret = e_snprintf(tmp, len, ":%s", pa->type);
790 if (ret <= 0)
791 goto error;
792 tmp += ret;
793 len -= ret;
794 }
795
796 return tmp - buf;
797error:
798 pr_debug("Failed to synthesize perf probe argument: %s",
799 strerror(-ret));
800 return ret;
801}
802
803/* Compose only probe point (not argument) */
804static char *synthesize_perf_probe_point(struct perf_probe_point *pp)
805{
806 char *buf, *tmp;
807 char offs[32] = "", line[32] = "", file[32] = "";
808 int ret, len;
809
810 buf = zalloc(MAX_CMDLEN);
811 if (buf == NULL) {
812 ret = -ENOMEM;
813 goto error;
814 }
278 if (pp->offset) { 815 if (pp->offset) {
279 ret = e_snprintf(offs, 64, "+%d", pp->offset); 816 ret = e_snprintf(offs, 32, "+%lu", pp->offset);
280 if (ret <= 0) 817 if (ret <= 0)
281 goto error; 818 goto error;
282 } 819 }
283 if (pp->line) { 820 if (pp->line) {
284 ret = e_snprintf(line, 64, ":%d", pp->line); 821 ret = e_snprintf(line, 32, ":%d", pp->line);
822 if (ret <= 0)
823 goto error;
824 }
825 if (pp->file) {
826 len = strlen(pp->file) - 31;
827 if (len < 0)
828 len = 0;
829 tmp = strchr(pp->file + len, '/');
830 if (!tmp)
831 tmp = pp->file + len;
832 ret = e_snprintf(file, 32, "@%s", tmp + 1);
285 if (ret <= 0) 833 if (ret <= 0)
286 goto error; 834 goto error;
287 } 835 }
288 836
289 if (pp->function) 837 if (pp->function)
290 ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s", pp->function, 838 ret = e_snprintf(buf, MAX_CMDLEN, "%s%s%s%s%s", pp->function,
291 offs, pp->retprobe ? "%return" : "", line); 839 offs, pp->retprobe ? "%return" : "", line,
840 file);
292 else 841 else
293 ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", pp->file, line); 842 ret = e_snprintf(buf, MAX_CMDLEN, "%s%s", file, line);
294 if (ret <= 0) { 843 if (ret <= 0)
844 goto error;
845
846 return buf;
295error: 847error:
296 free(pp->probes[0]); 848 pr_debug("Failed to synthesize perf probe point: %s",
297 pp->probes[0] = NULL; 849 strerror(-ret));
298 pp->found = 0; 850 if (buf)
299 } 851 free(buf);
300 return ret; 852 return NULL;
301} 853}
302 854
303int synthesize_perf_probe_event(struct probe_point *pp) 855#if 0
856char *synthesize_perf_probe_command(struct perf_probe_event *pev)
304{ 857{
305 char *buf; 858 char *buf;
306 int i, len, ret; 859 int i, len, ret;
307 860
308 len = synthesize_perf_probe_point(pp); 861 buf = synthesize_perf_probe_point(&pev->point);
309 if (len < 0) 862 if (!buf)
310 return 0; 863 return NULL;
311 864
312 buf = pp->probes[0]; 865 len = strlen(buf);
313 for (i = 0; i < pp->nr_args; i++) { 866 for (i = 0; i < pev->nargs; i++) {
314 ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", 867 ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s",
315 pp->args[i]); 868 pev->args[i].name);
316 if (ret <= 0) 869 if (ret <= 0) {
317 goto error; 870 free(buf);
871 return NULL;
872 }
318 len += ret; 873 len += ret;
319 } 874 }
320 pp->found = 1;
321 875
322 return pp->found; 876 return buf;
323error: 877}
324 free(pp->probes[0]); 878#endif
325 pp->probes[0] = NULL; 879
880static int __synthesize_kprobe_trace_arg_ref(struct kprobe_trace_arg_ref *ref,
881 char **buf, size_t *buflen,
882 int depth)
883{
884 int ret;
885 if (ref->next) {
886 depth = __synthesize_kprobe_trace_arg_ref(ref->next, buf,
887 buflen, depth + 1);
888 if (depth < 0)
889 goto out;
890 }
891
892 ret = e_snprintf(*buf, *buflen, "%+ld(", ref->offset);
893 if (ret < 0)
894 depth = ret;
895 else {
896 *buf += ret;
897 *buflen -= ret;
898 }
899out:
900 return depth;
326 901
327 return ret;
328} 902}
329 903
330int synthesize_trace_kprobe_event(struct probe_point *pp) 904static int synthesize_kprobe_trace_arg(struct kprobe_trace_arg *arg,
905 char *buf, size_t buflen)
331{ 906{
907 int ret, depth = 0;
908 char *tmp = buf;
909
910 /* Argument name or separator */
911 if (arg->name)
912 ret = e_snprintf(buf, buflen, " %s=", arg->name);
913 else
914 ret = e_snprintf(buf, buflen, " ");
915 if (ret < 0)
916 return ret;
917 buf += ret;
918 buflen -= ret;
919
920 /* Dereferencing arguments */
921 if (arg->ref) {
922 depth = __synthesize_kprobe_trace_arg_ref(arg->ref, &buf,
923 &buflen, 1);
924 if (depth < 0)
925 return depth;
926 }
927
928 /* Print argument value */
929 ret = e_snprintf(buf, buflen, "%s", arg->value);
930 if (ret < 0)
931 return ret;
932 buf += ret;
933 buflen -= ret;
934
935 /* Closing */
936 while (depth--) {
937 ret = e_snprintf(buf, buflen, ")");
938 if (ret < 0)
939 return ret;
940 buf += ret;
941 buflen -= ret;
942 }
943 /* Print argument type */
944 if (arg->type) {
945 ret = e_snprintf(buf, buflen, ":%s", arg->type);
946 if (ret <= 0)
947 return ret;
948 buf += ret;
949 }
950
951 return buf - tmp;
952}
953
954char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev)
955{
956 struct kprobe_trace_point *tp = &tev->point;
332 char *buf; 957 char *buf;
333 int i, len, ret; 958 int i, len, ret;
334 959
335 pp->probes[0] = buf = zalloc(MAX_CMDLEN); 960 buf = zalloc(MAX_CMDLEN);
336 if (!buf) 961 if (buf == NULL)
337 die("Failed to allocate memory by zalloc."); 962 return NULL;
338 ret = e_snprintf(buf, MAX_CMDLEN, "%s+%d", pp->function, pp->offset); 963
339 if (ret <= 0) 964 len = e_snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s+%lu",
965 tp->retprobe ? 'r' : 'p',
966 tev->group, tev->event,
967 tp->symbol, tp->offset);
968 if (len <= 0)
340 goto error; 969 goto error;
341 len = ret;
342 970
343 for (i = 0; i < pp->nr_args; i++) { 971 for (i = 0; i < tev->nargs; i++) {
344 ret = e_snprintf(&buf[len], MAX_CMDLEN - len, " %s", 972 ret = synthesize_kprobe_trace_arg(&tev->args[i], buf + len,
345 pp->args[i]); 973 MAX_CMDLEN - len);
346 if (ret <= 0) 974 if (ret <= 0)
347 goto error; 975 goto error;
348 len += ret; 976 len += ret;
349 } 977 }
350 pp->found = 1;
351 978
352 return pp->found; 979 return buf;
353error: 980error:
354 free(pp->probes[0]); 981 free(buf);
355 pp->probes[0] = NULL; 982 return NULL;
983}
984
985int convert_to_perf_probe_event(struct kprobe_trace_event *tev,
986 struct perf_probe_event *pev)
987{
988 char buf[64] = "";
989 int i, ret;
990
991 /* Convert event/group name */
992 pev->event = strdup(tev->event);
993 pev->group = strdup(tev->group);
994 if (pev->event == NULL || pev->group == NULL)
995 return -ENOMEM;
996
997 /* Convert trace_point to probe_point */
998 ret = convert_to_perf_probe_point(&tev->point, &pev->point);
999 if (ret < 0)
1000 return ret;
1001
1002 /* Convert trace_arg to probe_arg */
1003 pev->nargs = tev->nargs;
1004 pev->args = zalloc(sizeof(struct perf_probe_arg) * pev->nargs);
1005 if (pev->args == NULL)
1006 return -ENOMEM;
1007 for (i = 0; i < tev->nargs && ret >= 0; i++) {
1008 if (tev->args[i].name)
1009 pev->args[i].name = strdup(tev->args[i].name);
1010 else {
1011 ret = synthesize_kprobe_trace_arg(&tev->args[i],
1012 buf, 64);
1013 pev->args[i].name = strdup(buf);
1014 }
1015 if (pev->args[i].name == NULL && ret >= 0)
1016 ret = -ENOMEM;
1017 }
1018
1019 if (ret < 0)
1020 clear_perf_probe_event(pev);
356 1021
357 return ret; 1022 return ret;
358} 1023}
359 1024
360static int open_kprobe_events(int flags, int mode) 1025void clear_perf_probe_event(struct perf_probe_event *pev)
1026{
1027 struct perf_probe_point *pp = &pev->point;
1028 struct perf_probe_arg_field *field, *next;
1029 int i;
1030
1031 if (pev->event)
1032 free(pev->event);
1033 if (pev->group)
1034 free(pev->group);
1035 if (pp->file)
1036 free(pp->file);
1037 if (pp->function)
1038 free(pp->function);
1039 if (pp->lazy_line)
1040 free(pp->lazy_line);
1041 for (i = 0; i < pev->nargs; i++) {
1042 if (pev->args[i].name)
1043 free(pev->args[i].name);
1044 if (pev->args[i].var)
1045 free(pev->args[i].var);
1046 if (pev->args[i].type)
1047 free(pev->args[i].type);
1048 field = pev->args[i].field;
1049 while (field) {
1050 next = field->next;
1051 if (field->name)
1052 free(field->name);
1053 free(field);
1054 field = next;
1055 }
1056 }
1057 if (pev->args)
1058 free(pev->args);
1059 memset(pev, 0, sizeof(*pev));
1060}
1061
1062void clear_kprobe_trace_event(struct kprobe_trace_event *tev)
1063{
1064 struct kprobe_trace_arg_ref *ref, *next;
1065 int i;
1066
1067 if (tev->event)
1068 free(tev->event);
1069 if (tev->group)
1070 free(tev->group);
1071 if (tev->point.symbol)
1072 free(tev->point.symbol);
1073 for (i = 0; i < tev->nargs; i++) {
1074 if (tev->args[i].name)
1075 free(tev->args[i].name);
1076 if (tev->args[i].value)
1077 free(tev->args[i].value);
1078 if (tev->args[i].type)
1079 free(tev->args[i].type);
1080 ref = tev->args[i].ref;
1081 while (ref) {
1082 next = ref->next;
1083 free(ref);
1084 ref = next;
1085 }
1086 }
1087 if (tev->args)
1088 free(tev->args);
1089 memset(tev, 0, sizeof(*tev));
1090}
1091
1092static int open_kprobe_events(bool readwrite)
361{ 1093{
362 char buf[PATH_MAX]; 1094 char buf[PATH_MAX];
1095 const char *__debugfs;
363 int ret; 1096 int ret;
364 1097
365 ret = e_snprintf(buf, PATH_MAX, "%s/../kprobe_events", debugfs_path); 1098 __debugfs = debugfs_find_mountpoint();
366 if (ret < 0) 1099 if (__debugfs == NULL) {
367 die("Failed to make kprobe_events path."); 1100 pr_warning("Debugfs is not mounted.\n");
1101 return -ENOENT;
1102 }
1103
1104 ret = e_snprintf(buf, PATH_MAX, "%stracing/kprobe_events", __debugfs);
1105 if (ret >= 0) {
1106 pr_debug("Opening %s write=%d\n", buf, readwrite);
1107 if (readwrite && !probe_event_dry_run)
1108 ret = open(buf, O_RDWR, O_APPEND);
1109 else
1110 ret = open(buf, O_RDONLY, 0);
1111 }
368 1112
369 ret = open(buf, flags, mode);
370 if (ret < 0) { 1113 if (ret < 0) {
371 if (errno == ENOENT) 1114 if (errno == ENOENT)
372 die("kprobe_events file does not exist -" 1115 pr_warning("kprobe_events file does not exist - please"
373 " please rebuild with CONFIG_KPROBE_TRACER."); 1116 " rebuild kernel with CONFIG_KPROBE_EVENT.\n");
374 else 1117 else
375 die("Could not open kprobe_events file: %s", 1118 pr_warning("Failed to open kprobe_events file: %s\n",
376 strerror(errno)); 1119 strerror(errno));
377 } 1120 }
378 return ret; 1121 return ret;
379} 1122}
380 1123
381/* Get raw string list of current kprobe_events */ 1124/* Get raw string list of current kprobe_events */
382static struct strlist *get_trace_kprobe_event_rawlist(int fd) 1125static struct strlist *get_kprobe_trace_command_rawlist(int fd)
383{ 1126{
384 int ret, idx; 1127 int ret, idx;
385 FILE *fp; 1128 FILE *fp;
@@ -399,267 +1142,486 @@ static struct strlist *get_trace_kprobe_event_rawlist(int fd)
399 if (p[idx] == '\n') 1142 if (p[idx] == '\n')
400 p[idx] = '\0'; 1143 p[idx] = '\0';
401 ret = strlist__add(sl, buf); 1144 ret = strlist__add(sl, buf);
402 if (ret < 0) 1145 if (ret < 0) {
403 die("strlist__add failed: %s", strerror(-ret)); 1146 pr_debug("strlist__add failed: %s\n", strerror(-ret));
1147 strlist__delete(sl);
1148 return NULL;
1149 }
404 } 1150 }
405 fclose(fp); 1151 fclose(fp);
406 1152
407 return sl; 1153 return sl;
408} 1154}
409 1155
410/* Free and zero clear probe_point */
411static void clear_probe_point(struct probe_point *pp)
412{
413 int i;
414
415 if (pp->event)
416 free(pp->event);
417 if (pp->group)
418 free(pp->group);
419 if (pp->function)
420 free(pp->function);
421 if (pp->file)
422 free(pp->file);
423 for (i = 0; i < pp->nr_args; i++)
424 free(pp->args[i]);
425 if (pp->args)
426 free(pp->args);
427 for (i = 0; i < pp->found; i++)
428 free(pp->probes[i]);
429 memset(pp, 0, sizeof(*pp));
430}
431
432/* Show an event */ 1156/* Show an event */
433static void show_perf_probe_event(const char *event, const char *place, 1157static int show_perf_probe_event(struct perf_probe_event *pev)
434 struct probe_point *pp)
435{ 1158{
436 int i, ret; 1159 int i, ret;
437 char buf[128]; 1160 char buf[128];
1161 char *place;
1162
1163 /* Synthesize only event probe point */
1164 place = synthesize_perf_probe_point(&pev->point);
1165 if (!place)
1166 return -EINVAL;
438 1167
439 ret = e_snprintf(buf, 128, "%s:%s", pp->group, event); 1168 ret = e_snprintf(buf, 128, "%s:%s", pev->group, pev->event);
440 if (ret < 0) 1169 if (ret < 0)
441 die("Failed to copy event: %s", strerror(-ret)); 1170 return ret;
442 printf(" %-40s (on %s", buf, place); 1171
1172 printf(" %-20s (on %s", buf, place);
443 1173
444 if (pp->nr_args > 0) { 1174 if (pev->nargs > 0) {
445 printf(" with"); 1175 printf(" with");
446 for (i = 0; i < pp->nr_args; i++) 1176 for (i = 0; i < pev->nargs; i++) {
447 printf(" %s", pp->args[i]); 1177 ret = synthesize_perf_probe_arg(&pev->args[i],
1178 buf, 128);
1179 if (ret < 0)
1180 break;
1181 printf(" %s", buf);
1182 }
448 } 1183 }
449 printf(")\n"); 1184 printf(")\n");
1185 free(place);
1186 return ret;
450} 1187}
451 1188
452/* List up current perf-probe events */ 1189/* List up current perf-probe events */
453void show_perf_probe_events(void) 1190int show_perf_probe_events(void)
454{ 1191{
455 int fd; 1192 int fd, ret;
456 struct probe_point pp; 1193 struct kprobe_trace_event tev;
1194 struct perf_probe_event pev;
457 struct strlist *rawlist; 1195 struct strlist *rawlist;
458 struct str_node *ent; 1196 struct str_node *ent;
459 1197
460 memset(&pp, 0, sizeof(pp)); 1198 setup_pager();
461 fd = open_kprobe_events(O_RDONLY, 0); 1199 ret = init_vmlinux();
462 rawlist = get_trace_kprobe_event_rawlist(fd); 1200 if (ret < 0)
1201 return ret;
1202
1203 memset(&tev, 0, sizeof(tev));
1204 memset(&pev, 0, sizeof(pev));
1205
1206 fd = open_kprobe_events(false);
1207 if (fd < 0)
1208 return fd;
1209
1210 rawlist = get_kprobe_trace_command_rawlist(fd);
463 close(fd); 1211 close(fd);
1212 if (!rawlist)
1213 return -ENOENT;
464 1214
465 strlist__for_each(ent, rawlist) { 1215 strlist__for_each(ent, rawlist) {
466 parse_trace_kprobe_event(ent->s, &pp); 1216 ret = parse_kprobe_trace_command(ent->s, &tev);
467 /* Synthesize only event probe point */ 1217 if (ret >= 0) {
468 synthesize_perf_probe_point(&pp); 1218 ret = convert_to_perf_probe_event(&tev, &pev);
469 /* Show an event */ 1219 if (ret >= 0)
470 show_perf_probe_event(pp.event, pp.probes[0], &pp); 1220 ret = show_perf_probe_event(&pev);
471 clear_probe_point(&pp); 1221 }
1222 clear_perf_probe_event(&pev);
1223 clear_kprobe_trace_event(&tev);
1224 if (ret < 0)
1225 break;
472 } 1226 }
473
474 strlist__delete(rawlist); 1227 strlist__delete(rawlist);
1228
1229 return ret;
475} 1230}
476 1231
477/* Get current perf-probe event names */ 1232/* Get current perf-probe event names */
478static struct strlist *get_perf_event_names(int fd, bool include_group) 1233static struct strlist *get_kprobe_trace_event_names(int fd, bool include_group)
479{ 1234{
480 char buf[128]; 1235 char buf[128];
481 struct strlist *sl, *rawlist; 1236 struct strlist *sl, *rawlist;
482 struct str_node *ent; 1237 struct str_node *ent;
483 struct probe_point pp; 1238 struct kprobe_trace_event tev;
1239 int ret = 0;
484 1240
485 memset(&pp, 0, sizeof(pp)); 1241 memset(&tev, 0, sizeof(tev));
486 rawlist = get_trace_kprobe_event_rawlist(fd);
487 1242
1243 rawlist = get_kprobe_trace_command_rawlist(fd);
488 sl = strlist__new(true, NULL); 1244 sl = strlist__new(true, NULL);
489 strlist__for_each(ent, rawlist) { 1245 strlist__for_each(ent, rawlist) {
490 parse_trace_kprobe_event(ent->s, &pp); 1246 ret = parse_kprobe_trace_command(ent->s, &tev);
1247 if (ret < 0)
1248 break;
491 if (include_group) { 1249 if (include_group) {
492 if (e_snprintf(buf, 128, "%s:%s", pp.group, 1250 ret = e_snprintf(buf, 128, "%s:%s", tev.group,
493 pp.event) < 0) 1251 tev.event);
494 die("Failed to copy group:event name."); 1252 if (ret >= 0)
495 strlist__add(sl, buf); 1253 ret = strlist__add(sl, buf);
496 } else 1254 } else
497 strlist__add(sl, pp.event); 1255 ret = strlist__add(sl, tev.event);
498 clear_probe_point(&pp); 1256 clear_kprobe_trace_event(&tev);
1257 if (ret < 0)
1258 break;
499 } 1259 }
500
501 strlist__delete(rawlist); 1260 strlist__delete(rawlist);
502 1261
1262 if (ret < 0) {
1263 strlist__delete(sl);
1264 return NULL;
1265 }
503 return sl; 1266 return sl;
504} 1267}
505 1268
506static void write_trace_kprobe_event(int fd, const char *buf) 1269static int write_kprobe_trace_event(int fd, struct kprobe_trace_event *tev)
507{ 1270{
508 int ret; 1271 int ret = 0;
1272 char *buf = synthesize_kprobe_trace_command(tev);
1273
1274 if (!buf) {
1275 pr_debug("Failed to synthesize kprobe trace event.\n");
1276 return -EINVAL;
1277 }
509 1278
510 pr_debug("Writing event: %s\n", buf); 1279 pr_debug("Writing event: %s\n", buf);
511 ret = write(fd, buf, strlen(buf)); 1280 if (!probe_event_dry_run) {
512 if (ret <= 0) 1281 ret = write(fd, buf, strlen(buf));
513 die("Failed to write event: %s", strerror(errno)); 1282 if (ret <= 0)
1283 pr_warning("Failed to write event: %s\n",
1284 strerror(errno));
1285 }
1286 free(buf);
1287 return ret;
514} 1288}
515 1289
516static void get_new_event_name(char *buf, size_t len, const char *base, 1290static int get_new_event_name(char *buf, size_t len, const char *base,
517 struct strlist *namelist, bool allow_suffix) 1291 struct strlist *namelist, bool allow_suffix)
518{ 1292{
519 int i, ret; 1293 int i, ret;
520 1294
521 /* Try no suffix */ 1295 /* Try no suffix */
522 ret = e_snprintf(buf, len, "%s", base); 1296 ret = e_snprintf(buf, len, "%s", base);
523 if (ret < 0) 1297 if (ret < 0) {
524 die("snprintf() failed: %s", strerror(-ret)); 1298 pr_debug("snprintf() failed: %s\n", strerror(-ret));
1299 return ret;
1300 }
525 if (!strlist__has_entry(namelist, buf)) 1301 if (!strlist__has_entry(namelist, buf))
526 return; 1302 return 0;
527 1303
528 if (!allow_suffix) { 1304 if (!allow_suffix) {
529 pr_warning("Error: event \"%s\" already exists. " 1305 pr_warning("Error: event \"%s\" already exists. "
530 "(Use -f to force duplicates.)\n", base); 1306 "(Use -f to force duplicates.)\n", base);
531 die("Can't add new event."); 1307 return -EEXIST;
532 } 1308 }
533 1309
534 /* Try to add suffix */ 1310 /* Try to add suffix */
535 for (i = 1; i < MAX_EVENT_INDEX; i++) { 1311 for (i = 1; i < MAX_EVENT_INDEX; i++) {
536 ret = e_snprintf(buf, len, "%s_%d", base, i); 1312 ret = e_snprintf(buf, len, "%s_%d", base, i);
537 if (ret < 0) 1313 if (ret < 0) {
538 die("snprintf() failed: %s", strerror(-ret)); 1314 pr_debug("snprintf() failed: %s\n", strerror(-ret));
1315 return ret;
1316 }
539 if (!strlist__has_entry(namelist, buf)) 1317 if (!strlist__has_entry(namelist, buf))
540 break; 1318 break;
541 } 1319 }
542 if (i == MAX_EVENT_INDEX) 1320 if (i == MAX_EVENT_INDEX) {
543 die("Too many events are on the same function."); 1321 pr_warning("Too many events are on the same function.\n");
1322 ret = -ERANGE;
1323 }
1324
1325 return ret;
544} 1326}
545 1327
546void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, 1328static int __add_kprobe_trace_events(struct perf_probe_event *pev,
547 bool force_add) 1329 struct kprobe_trace_event *tevs,
1330 int ntevs, bool allow_suffix)
548{ 1331{
549 int i, j, fd; 1332 int i, fd, ret;
550 struct probe_point *pp; 1333 struct kprobe_trace_event *tev = NULL;
551 char buf[MAX_CMDLEN]; 1334 char buf[64];
552 char event[64]; 1335 const char *event, *group;
553 struct strlist *namelist; 1336 struct strlist *namelist;
554 bool allow_suffix;
555 1337
556 fd = open_kprobe_events(O_RDWR, O_APPEND); 1338 fd = open_kprobe_events(true);
1339 if (fd < 0)
1340 return fd;
557 /* Get current event names */ 1341 /* Get current event names */
558 namelist = get_perf_event_names(fd, false); 1342 namelist = get_kprobe_trace_event_names(fd, false);
559 1343 if (!namelist) {
560 for (j = 0; j < nr_probes; j++) { 1344 pr_debug("Failed to get current event list.\n");
561 pp = probes + j; 1345 return -EIO;
562 if (!pp->event) 1346 }
563 pp->event = strdup(pp->function); 1347
564 if (!pp->group) 1348 ret = 0;
565 pp->group = strdup(PERFPROBE_GROUP); 1349 printf("Add new event%s\n", (ntevs > 1) ? "s:" : ":");
566 DIE_IF(!pp->event || !pp->group); 1350 for (i = 0; i < ntevs; i++) {
567 /* If force_add is true, suffix search is allowed */ 1351 tev = &tevs[i];
568 allow_suffix = force_add; 1352 if (pev->event)
569 for (i = 0; i < pp->found; i++) { 1353 event = pev->event;
570 /* Get an unused new event name */ 1354 else
571 get_new_event_name(event, 64, pp->event, namelist, 1355 if (pev->point.function)
572 allow_suffix); 1356 event = pev->point.function;
573 snprintf(buf, MAX_CMDLEN, "%c:%s/%s %s\n", 1357 else
574 pp->retprobe ? 'r' : 'p', 1358 event = tev->point.symbol;
575 pp->group, event, 1359 if (pev->group)
576 pp->probes[i]); 1360 group = pev->group;
577 write_trace_kprobe_event(fd, buf); 1361 else
578 printf("Added new event:\n"); 1362 group = PERFPROBE_GROUP;
579 /* Get the first parameter (probe-point) */ 1363
580 sscanf(pp->probes[i], "%s", buf); 1364 /* Get an unused new event name */
581 show_perf_probe_event(event, buf, pp); 1365 ret = get_new_event_name(buf, 64, event,
582 /* Add added event name to namelist */ 1366 namelist, allow_suffix);
583 strlist__add(namelist, event); 1367 if (ret < 0)
584 /* 1368 break;
585 * Probes after the first probe which comes from same 1369 event = buf;
586 * user input are always allowed to add suffix, because 1370
587 * there might be several addresses corresponding to 1371 tev->event = strdup(event);
588 * one code line. 1372 tev->group = strdup(group);
589 */ 1373 if (tev->event == NULL || tev->group == NULL) {
590 allow_suffix = true; 1374 ret = -ENOMEM;
1375 break;
591 } 1376 }
1377 ret = write_kprobe_trace_event(fd, tev);
1378 if (ret < 0)
1379 break;
1380 /* Add added event name to namelist */
1381 strlist__add(namelist, event);
1382
1383 /* Trick here - save current event/group */
1384 event = pev->event;
1385 group = pev->group;
1386 pev->event = tev->event;
1387 pev->group = tev->group;
1388 show_perf_probe_event(pev);
1389 /* Trick here - restore current event/group */
1390 pev->event = (char *)event;
1391 pev->group = (char *)group;
1392
1393 /*
1394 * Probes after the first probe which comes from same
1395 * user input are always allowed to add suffix, because
1396 * there might be several addresses corresponding to
1397 * one code line.
1398 */
1399 allow_suffix = true;
1400 }
1401
1402 if (ret >= 0) {
1403 /* Show how to use the event. */
1404 printf("\nYou can now use it on all perf tools, such as:\n\n");
1405 printf("\tperf record -e %s:%s -aR sleep 1\n\n", tev->group,
1406 tev->event);
592 } 1407 }
593 /* Show how to use the event. */
594 printf("\nYou can now use it on all perf tools, such as:\n\n");
595 printf("\tperf record -e %s:%s -a sleep 1\n\n", PERFPROBE_GROUP, event);
596 1408
597 strlist__delete(namelist); 1409 strlist__delete(namelist);
598 close(fd); 1410 close(fd);
1411 return ret;
599} 1412}
600 1413
601static void __del_trace_kprobe_event(int fd, struct str_node *ent) 1414static int convert_to_kprobe_trace_events(struct perf_probe_event *pev,
1415 struct kprobe_trace_event **tevs,
1416 int max_tevs)
1417{
1418 struct symbol *sym;
1419 int ret = 0, i;
1420 struct kprobe_trace_event *tev;
1421
1422 /* Convert perf_probe_event with debuginfo */
1423 ret = try_to_find_kprobe_trace_events(pev, tevs, max_tevs);
1424 if (ret != 0)
1425 return ret;
1426
1427 /* Allocate trace event buffer */
1428 tev = *tevs = zalloc(sizeof(struct kprobe_trace_event));
1429 if (tev == NULL)
1430 return -ENOMEM;
1431
1432 /* Copy parameters */
1433 tev->point.symbol = strdup(pev->point.function);
1434 if (tev->point.symbol == NULL) {
1435 ret = -ENOMEM;
1436 goto error;
1437 }
1438 tev->point.offset = pev->point.offset;
1439 tev->nargs = pev->nargs;
1440 if (tev->nargs) {
1441 tev->args = zalloc(sizeof(struct kprobe_trace_arg)
1442 * tev->nargs);
1443 if (tev->args == NULL) {
1444 ret = -ENOMEM;
1445 goto error;
1446 }
1447 for (i = 0; i < tev->nargs; i++) {
1448 if (pev->args[i].name) {
1449 tev->args[i].name = strdup(pev->args[i].name);
1450 if (tev->args[i].name == NULL) {
1451 ret = -ENOMEM;
1452 goto error;
1453 }
1454 }
1455 tev->args[i].value = strdup(pev->args[i].var);
1456 if (tev->args[i].value == NULL) {
1457 ret = -ENOMEM;
1458 goto error;
1459 }
1460 if (pev->args[i].type) {
1461 tev->args[i].type = strdup(pev->args[i].type);
1462 if (tev->args[i].type == NULL) {
1463 ret = -ENOMEM;
1464 goto error;
1465 }
1466 }
1467 }
1468 }
1469
1470 /* Currently just checking function name from symbol map */
1471 sym = map__find_symbol_by_name(machine.vmlinux_maps[MAP__FUNCTION],
1472 tev->point.symbol, NULL);
1473 if (!sym) {
1474 pr_warning("Kernel symbol \'%s\' not found.\n",
1475 tev->point.symbol);
1476 ret = -ENOENT;
1477 goto error;
1478 }
1479
1480 return 1;
1481error:
1482 clear_kprobe_trace_event(tev);
1483 free(tev);
1484 *tevs = NULL;
1485 return ret;
1486}
1487
1488struct __event_package {
1489 struct perf_probe_event *pev;
1490 struct kprobe_trace_event *tevs;
1491 int ntevs;
1492};
1493
1494int add_perf_probe_events(struct perf_probe_event *pevs, int npevs,
1495 bool force_add, int max_tevs)
1496{
1497 int i, j, ret;
1498 struct __event_package *pkgs;
1499
1500 pkgs = zalloc(sizeof(struct __event_package) * npevs);
1501 if (pkgs == NULL)
1502 return -ENOMEM;
1503
1504 /* Init vmlinux path */
1505 ret = init_vmlinux();
1506 if (ret < 0)
1507 return ret;
1508
1509 /* Loop 1: convert all events */
1510 for (i = 0; i < npevs; i++) {
1511 pkgs[i].pev = &pevs[i];
1512 /* Convert with or without debuginfo */
1513 ret = convert_to_kprobe_trace_events(pkgs[i].pev,
1514 &pkgs[i].tevs, max_tevs);
1515 if (ret < 0)
1516 goto end;
1517 pkgs[i].ntevs = ret;
1518 }
1519
1520 /* Loop 2: add all events */
1521 for (i = 0; i < npevs && ret >= 0; i++)
1522 ret = __add_kprobe_trace_events(pkgs[i].pev, pkgs[i].tevs,
1523 pkgs[i].ntevs, force_add);
1524end:
1525 /* Loop 3: cleanup trace events */
1526 for (i = 0; i < npevs; i++)
1527 for (j = 0; j < pkgs[i].ntevs; j++)
1528 clear_kprobe_trace_event(&pkgs[i].tevs[j]);
1529
1530 return ret;
1531}
1532
1533static int __del_trace_kprobe_event(int fd, struct str_node *ent)
602{ 1534{
603 char *p; 1535 char *p;
604 char buf[128]; 1536 char buf[128];
1537 int ret;
605 1538
606 /* Convert from perf-probe event to trace-kprobe event */ 1539 /* Convert from perf-probe event to trace-kprobe event */
607 if (e_snprintf(buf, 128, "-:%s", ent->s) < 0) 1540 ret = e_snprintf(buf, 128, "-:%s", ent->s);
608 die("Failed to copy event."); 1541 if (ret < 0)
1542 goto error;
1543
609 p = strchr(buf + 2, ':'); 1544 p = strchr(buf + 2, ':');
610 if (!p) 1545 if (!p) {
611 die("Internal error: %s should have ':' but not.", ent->s); 1546 pr_debug("Internal error: %s should have ':' but not.\n",
1547 ent->s);
1548 ret = -ENOTSUP;
1549 goto error;
1550 }
612 *p = '/'; 1551 *p = '/';
613 1552
614 write_trace_kprobe_event(fd, buf); 1553 pr_debug("Writing event: %s\n", buf);
1554 ret = write(fd, buf, strlen(buf));
1555 if (ret < 0)
1556 goto error;
1557
615 printf("Remove event: %s\n", ent->s); 1558 printf("Remove event: %s\n", ent->s);
1559 return 0;
1560error:
1561 pr_warning("Failed to delete event: %s\n", strerror(-ret));
1562 return ret;
616} 1563}
617 1564
618static void del_trace_kprobe_event(int fd, const char *group, 1565static int del_trace_kprobe_event(int fd, const char *group,
619 const char *event, struct strlist *namelist) 1566 const char *event, struct strlist *namelist)
620{ 1567{
621 char buf[128]; 1568 char buf[128];
622 struct str_node *ent, *n; 1569 struct str_node *ent, *n;
623 int found = 0; 1570 int found = 0, ret = 0;
624 1571
625 if (e_snprintf(buf, 128, "%s:%s", group, event) < 0) 1572 ret = e_snprintf(buf, 128, "%s:%s", group, event);
626 die("Failed to copy event."); 1573 if (ret < 0) {
1574 pr_err("Failed to copy event.");
1575 return ret;
1576 }
627 1577
628 if (strpbrk(buf, "*?")) { /* Glob-exp */ 1578 if (strpbrk(buf, "*?")) { /* Glob-exp */
629 strlist__for_each_safe(ent, n, namelist) 1579 strlist__for_each_safe(ent, n, namelist)
630 if (strglobmatch(ent->s, buf)) { 1580 if (strglobmatch(ent->s, buf)) {
631 found++; 1581 found++;
632 __del_trace_kprobe_event(fd, ent); 1582 ret = __del_trace_kprobe_event(fd, ent);
1583 if (ret < 0)
1584 break;
633 strlist__remove(namelist, ent); 1585 strlist__remove(namelist, ent);
634 } 1586 }
635 } else { 1587 } else {
636 ent = strlist__find(namelist, buf); 1588 ent = strlist__find(namelist, buf);
637 if (ent) { 1589 if (ent) {
638 found++; 1590 found++;
639 __del_trace_kprobe_event(fd, ent); 1591 ret = __del_trace_kprobe_event(fd, ent);
640 strlist__remove(namelist, ent); 1592 if (ret >= 0)
1593 strlist__remove(namelist, ent);
641 } 1594 }
642 } 1595 }
643 if (found == 0) 1596 if (found == 0 && ret >= 0)
644 pr_info("Info: event \"%s\" does not exist, could not remove it.\n", buf); 1597 pr_info("Info: Event \"%s\" does not exist.\n", buf);
1598
1599 return ret;
645} 1600}
646 1601
647void del_trace_kprobe_events(struct strlist *dellist) 1602int del_perf_probe_events(struct strlist *dellist)
648{ 1603{
649 int fd; 1604 int fd, ret = 0;
650 const char *group, *event; 1605 const char *group, *event;
651 char *p, *str; 1606 char *p, *str;
652 struct str_node *ent; 1607 struct str_node *ent;
653 struct strlist *namelist; 1608 struct strlist *namelist;
654 1609
655 fd = open_kprobe_events(O_RDWR, O_APPEND); 1610 fd = open_kprobe_events(true);
1611 if (fd < 0)
1612 return fd;
1613
656 /* Get current event names */ 1614 /* Get current event names */
657 namelist = get_perf_event_names(fd, true); 1615 namelist = get_kprobe_trace_event_names(fd, true);
1616 if (namelist == NULL)
1617 return -EINVAL;
658 1618
659 strlist__for_each(ent, dellist) { 1619 strlist__for_each(ent, dellist) {
660 str = strdup(ent->s); 1620 str = strdup(ent->s);
661 if (!str) 1621 if (str == NULL) {
662 die("Failed to copy event."); 1622 ret = -ENOMEM;
1623 break;
1624 }
663 pr_debug("Parsing: %s\n", str); 1625 pr_debug("Parsing: %s\n", str);
664 p = strchr(str, ':'); 1626 p = strchr(str, ':');
665 if (p) { 1627 if (p) {
@@ -671,10 +1633,14 @@ void del_trace_kprobe_events(struct strlist *dellist)
671 event = str; 1633 event = str;
672 } 1634 }
673 pr_debug("Group: %s, Event: %s\n", group, event); 1635 pr_debug("Group: %s, Event: %s\n", group, event);
674 del_trace_kprobe_event(fd, group, event, namelist); 1636 ret = del_trace_kprobe_event(fd, group, event, namelist);
675 free(str); 1637 free(str);
1638 if (ret < 0)
1639 break;
676 } 1640 }
677 strlist__delete(namelist); 1641 strlist__delete(namelist);
678 close(fd); 1642 close(fd);
1643
1644 return ret;
679} 1645}
680 1646
diff --git a/tools/perf/util/probe-event.h b/tools/perf/util/probe-event.h
index 7f1d499118c0..e9db1a214ca4 100644
--- a/tools/perf/util/probe-event.h
+++ b/tools/perf/util/probe-event.h
@@ -2,19 +2,125 @@
2#define _PROBE_EVENT_H 2#define _PROBE_EVENT_H
3 3
4#include <stdbool.h> 4#include <stdbool.h>
5#include "probe-finder.h"
6#include "strlist.h" 5#include "strlist.h"
7 6
8extern void parse_perf_probe_event(const char *str, struct probe_point *pp, 7extern bool probe_event_dry_run;
9 bool *need_dwarf); 8
10extern int synthesize_perf_probe_point(struct probe_point *pp); 9/* kprobe-tracer tracing point */
11extern int synthesize_perf_probe_event(struct probe_point *pp); 10struct kprobe_trace_point {
12extern void parse_trace_kprobe_event(const char *str, struct probe_point *pp); 11 char *symbol; /* Base symbol */
13extern int synthesize_trace_kprobe_event(struct probe_point *pp); 12 unsigned long offset; /* Offset from symbol */
14extern void add_trace_kprobe_events(struct probe_point *probes, int nr_probes, 13 bool retprobe; /* Return probe flag */
15 bool force_add); 14};
16extern void del_trace_kprobe_events(struct strlist *dellist); 15
17extern void show_perf_probe_events(void); 16/* kprobe-tracer tracing argument referencing offset */
17struct kprobe_trace_arg_ref {
18 struct kprobe_trace_arg_ref *next; /* Next reference */
19 long offset; /* Offset value */
20};
21
22/* kprobe-tracer tracing argument */
23struct kprobe_trace_arg {
24 char *name; /* Argument name */
25 char *value; /* Base value */
26 char *type; /* Type name */
27 struct kprobe_trace_arg_ref *ref; /* Referencing offset */
28};
29
30/* kprobe-tracer tracing event (point + arg) */
31struct kprobe_trace_event {
32 char *event; /* Event name */
33 char *group; /* Group name */
34 struct kprobe_trace_point point; /* Trace point */
35 int nargs; /* Number of args */
36 struct kprobe_trace_arg *args; /* Arguments */
37};
38
39/* Perf probe probing point */
40struct perf_probe_point {
41 char *file; /* File path */
42 char *function; /* Function name */
43 int line; /* Line number */
44 bool retprobe; /* Return probe flag */
45 char *lazy_line; /* Lazy matching pattern */
46 unsigned long offset; /* Offset from function entry */
47};
48
49/* Perf probe probing argument field chain */
50struct perf_probe_arg_field {
51 struct perf_probe_arg_field *next; /* Next field */
52 char *name; /* Name of the field */
53 bool ref; /* Referencing flag */
54};
55
56/* Perf probe probing argument */
57struct perf_probe_arg {
58 char *name; /* Argument name */
59 char *var; /* Variable name */
60 char *type; /* Type name */
61 struct perf_probe_arg_field *field; /* Structure fields */
62};
63
64/* Perf probe probing event (point + arg) */
65struct perf_probe_event {
66 char *event; /* Event name */
67 char *group; /* Group name */
68 struct perf_probe_point point; /* Probe point */
69 int nargs; /* Number of arguments */
70 struct perf_probe_arg *args; /* Arguments */
71};
72
73
74/* Line number container */
75struct line_node {
76 struct list_head list;
77 int line;
78};
79
80/* Line range */
81struct line_range {
82 char *file; /* File name */
83 char *function; /* Function name */
84 int start; /* Start line number */
85 int end; /* End line number */
86 int offset; /* Start line offset */
87 char *path; /* Real path name */
88 struct list_head line_list; /* Visible lines */
89};
90
91/* Command string to events */
92extern int parse_perf_probe_command(const char *cmd,
93 struct perf_probe_event *pev);
94extern int parse_kprobe_trace_command(const char *cmd,
95 struct kprobe_trace_event *tev);
96
97/* Events to command string */
98extern char *synthesize_perf_probe_command(struct perf_probe_event *pev);
99extern char *synthesize_kprobe_trace_command(struct kprobe_trace_event *tev);
100extern int synthesize_perf_probe_arg(struct perf_probe_arg *pa, char *buf,
101 size_t len);
102
103/* Check the perf_probe_event needs debuginfo */
104extern bool perf_probe_event_need_dwarf(struct perf_probe_event *pev);
105
106/* Convert from kprobe_trace_event to perf_probe_event */
107extern int convert_to_perf_probe_event(struct kprobe_trace_event *tev,
108 struct perf_probe_event *pev);
109
110/* Release event contents */
111extern void clear_perf_probe_event(struct perf_probe_event *pev);
112extern void clear_kprobe_trace_event(struct kprobe_trace_event *tev);
113
114/* Command string to line-range */
115extern int parse_line_range_desc(const char *cmd, struct line_range *lr);
116
117
118extern int add_perf_probe_events(struct perf_probe_event *pevs, int npevs,
119 bool force_add, int max_probe_points);
120extern int del_perf_probe_events(struct strlist *dellist);
121extern int show_perf_probe_events(void);
122extern int show_line_range(struct line_range *lr);
123
18 124
19/* Maximum index number of event-name postfix */ 125/* Maximum index number of event-name postfix */
20#define MAX_EVENT_INDEX 1024 126#define MAX_EVENT_INDEX 1024
diff --git a/tools/perf/util/probe-finder.c b/tools/perf/util/probe-finder.c
index 4b852c0d16a5..d964cb199c67 100644
--- a/tools/perf/util/probe-finder.c
+++ b/tools/perf/util/probe-finder.c
@@ -31,72 +31,16 @@
31#include <string.h> 31#include <string.h>
32#include <stdarg.h> 32#include <stdarg.h>
33#include <ctype.h> 33#include <ctype.h>
34#include <dwarf-regs.h>
34 35
36#include "string.h"
35#include "event.h" 37#include "event.h"
36#include "debug.h" 38#include "debug.h"
37#include "util.h" 39#include "util.h"
38#include "probe-finder.h" 40#include "probe-finder.h"
39 41
40 42/* Kprobe tracer basic type is up to u64 */
41/* Dwarf_Die Linkage to parent Die */ 43#define MAX_BASIC_TYPE_BITS 64
42struct die_link {
43 struct die_link *parent; /* Parent die */
44 Dwarf_Die die; /* Current die */
45};
46
47static Dwarf_Debug __dw_debug;
48static Dwarf_Error __dw_error;
49
50/*
51 * Generic dwarf analysis helpers
52 */
53
54#define X86_32_MAX_REGS 8
55const char *x86_32_regs_table[X86_32_MAX_REGS] = {
56 "%ax",
57 "%cx",
58 "%dx",
59 "%bx",
60 "$stack", /* Stack address instead of %sp */
61 "%bp",
62 "%si",
63 "%di",
64};
65
66#define X86_64_MAX_REGS 16
67const char *x86_64_regs_table[X86_64_MAX_REGS] = {
68 "%ax",
69 "%dx",
70 "%cx",
71 "%bx",
72 "%si",
73 "%di",
74 "%bp",
75 "%sp",
76 "%r8",
77 "%r9",
78 "%r10",
79 "%r11",
80 "%r12",
81 "%r13",
82 "%r14",
83 "%r15",
84};
85
86/* TODO: switching by dwarf address size */
87#ifdef __x86_64__
88#define ARCH_MAX_REGS X86_64_MAX_REGS
89#define arch_regs_table x86_64_regs_table
90#else
91#define ARCH_MAX_REGS X86_32_MAX_REGS
92#define arch_regs_table x86_32_regs_table
93#endif
94
95/* Return architecture dependent register string (for kprobe-tracer) */
96static const char *get_arch_regstr(unsigned int n)
97{
98 return (n <= ARCH_MAX_REGS) ? arch_regs_table[n] : NULL;
99}
100 44
101/* 45/*
102 * Compare the tail of two strings. 46 * Compare the tail of two strings.
@@ -113,256 +57,299 @@ static int strtailcmp(const char *s1, const char *s2)
113 return 0; 57 return 0;
114} 58}
115 59
116/* Find the fileno of the target file. */ 60/* Line number list operations */
117static Dwarf_Unsigned cu_find_fileno(Dwarf_Die cu_die, const char *fname) 61
62/* Add a line to line number list */
63static int line_list__add_line(struct list_head *head, int line)
64{
65 struct line_node *ln;
66 struct list_head *p;
67
68 /* Reverse search, because new line will be the last one */
69 list_for_each_entry_reverse(ln, head, list) {
70 if (ln->line < line) {
71 p = &ln->list;
72 goto found;
73 } else if (ln->line == line) /* Already exist */
74 return 1;
75 }
76 /* List is empty, or the smallest entry */
77 p = head;
78found:
79 pr_debug("line list: add a line %u\n", line);
80 ln = zalloc(sizeof(struct line_node));
81 if (ln == NULL)
82 return -ENOMEM;
83 ln->line = line;
84 INIT_LIST_HEAD(&ln->list);
85 list_add(&ln->list, p);
86 return 0;
87}
88
89/* Check if the line in line number list */
90static int line_list__has_line(struct list_head *head, int line)
91{
92 struct line_node *ln;
93
94 /* Reverse search, because new line will be the last one */
95 list_for_each_entry(ln, head, list)
96 if (ln->line == line)
97 return 1;
98
99 return 0;
100}
101
102/* Init line number list */
103static void line_list__init(struct list_head *head)
104{
105 INIT_LIST_HEAD(head);
106}
107
108/* Free line number list */
109static void line_list__free(struct list_head *head)
110{
111 struct line_node *ln;
112 while (!list_empty(head)) {
113 ln = list_first_entry(head, struct line_node, list);
114 list_del(&ln->list);
115 free(ln);
116 }
117}
118
119/* Dwarf wrappers */
120
121/* Find the realpath of the target file. */
122static const char *cu_find_realpath(Dwarf_Die *cu_die, const char *fname)
118{ 123{
119 Dwarf_Signed cnt, i; 124 Dwarf_Files *files;
120 Dwarf_Unsigned found = 0; 125 size_t nfiles, i;
121 char **srcs; 126 const char *src = NULL;
122 int ret; 127 int ret;
123 128
124 if (!fname) 129 if (!fname)
125 return 0; 130 return NULL;
126 131
127 ret = dwarf_srcfiles(cu_die, &srcs, &cnt, &__dw_error); 132 ret = dwarf_getsrcfiles(cu_die, &files, &nfiles);
128 if (ret == DW_DLV_OK) { 133 if (ret != 0)
129 for (i = 0; i < cnt && !found; i++) { 134 return NULL;
130 if (strtailcmp(srcs[i], fname) == 0) 135
131 found = i + 1; 136 for (i = 0; i < nfiles; i++) {
132 dwarf_dealloc(__dw_debug, srcs[i], DW_DLA_STRING); 137 src = dwarf_filesrc(files, i, NULL, NULL);
133 } 138 if (strtailcmp(src, fname) == 0)
134 for (; i < cnt; i++) 139 break;
135 dwarf_dealloc(__dw_debug, srcs[i], DW_DLA_STRING);
136 dwarf_dealloc(__dw_debug, srcs, DW_DLA_LIST);
137 } 140 }
138 if (found) 141 if (i == nfiles)
139 pr_debug("found fno: %d\n", (int)found); 142 return NULL;
140 return found; 143 return src;
141} 144}
142 145
143/* Compare diename and tname */ 146/* Compare diename and tname */
144static int die_compare_name(Dwarf_Die dw_die, const char *tname) 147static bool die_compare_name(Dwarf_Die *dw_die, const char *tname)
145{ 148{
146 char *name; 149 const char *name;
147 int ret; 150 name = dwarf_diename(dw_die);
148 ret = dwarf_diename(dw_die, &name, &__dw_error); 151 return name ? strcmp(tname, name) : -1;
149 DIE_IF(ret == DW_DLV_ERROR);
150 if (ret == DW_DLV_OK) {
151 ret = strcmp(tname, name);
152 dwarf_dealloc(__dw_debug, name, DW_DLA_STRING);
153 } else
154 ret = -1;
155 return ret;
156} 152}
157 153
158/* Check the address is in the subprogram(function). */ 154/* Get type die, but skip qualifiers and typedef */
159static int die_within_subprogram(Dwarf_Die sp_die, Dwarf_Addr addr, 155static Dwarf_Die *die_get_real_type(Dwarf_Die *vr_die, Dwarf_Die *die_mem)
160 Dwarf_Signed *offs)
161{ 156{
162 Dwarf_Addr lopc, hipc; 157 Dwarf_Attribute attr;
163 int ret; 158 int tag;
164 159
165 /* TODO: check ranges */ 160 do {
166 ret = dwarf_lowpc(sp_die, &lopc, &__dw_error); 161 if (dwarf_attr(vr_die, DW_AT_type, &attr) == NULL ||
167 DIE_IF(ret == DW_DLV_ERROR); 162 dwarf_formref_die(&attr, die_mem) == NULL)
168 if (ret == DW_DLV_NO_ENTRY) 163 return NULL;
169 return 0; 164
170 ret = dwarf_highpc(sp_die, &hipc, &__dw_error); 165 tag = dwarf_tag(die_mem);
171 DIE_IF(ret != DW_DLV_OK); 166 vr_die = die_mem;
172 if (lopc <= addr && addr < hipc) { 167 } while (tag == DW_TAG_const_type ||
173 *offs = addr - lopc; 168 tag == DW_TAG_restrict_type ||
174 return 1; 169 tag == DW_TAG_volatile_type ||
175 } else 170 tag == DW_TAG_shared_type ||
176 return 0; 171 tag == DW_TAG_typedef);
172
173 return die_mem;
177} 174}
178 175
179/* Check the die is inlined function */ 176static bool die_is_signed_type(Dwarf_Die *tp_die)
180static Dwarf_Bool die_inlined_subprogram(Dwarf_Die dw_die)
181{ 177{
182 /* TODO: check strictly */ 178 Dwarf_Attribute attr;
183 Dwarf_Bool inl; 179 Dwarf_Word ret;
184 int ret; 180
181 if (dwarf_attr(tp_die, DW_AT_encoding, &attr) == NULL ||
182 dwarf_formudata(&attr, &ret) != 0)
183 return false;
185 184
186 ret = dwarf_hasattr(dw_die, DW_AT_inline, &inl, &__dw_error); 185 return (ret == DW_ATE_signed_char || ret == DW_ATE_signed ||
187 DIE_IF(ret == DW_DLV_ERROR); 186 ret == DW_ATE_signed_fixed);
188 return inl;
189} 187}
190 188
191/* Get the offset of abstruct_origin */ 189static int die_get_byte_size(Dwarf_Die *tp_die)
192static Dwarf_Off die_get_abstract_origin(Dwarf_Die dw_die)
193{ 190{
194 Dwarf_Attribute attr; 191 Dwarf_Attribute attr;
195 Dwarf_Off cu_offs; 192 Dwarf_Word ret;
196 int ret; 193
194 if (dwarf_attr(tp_die, DW_AT_byte_size, &attr) == NULL ||
195 dwarf_formudata(&attr, &ret) != 0)
196 return 0;
197 197
198 ret = dwarf_attr(dw_die, DW_AT_abstract_origin, &attr, &__dw_error); 198 return (int)ret;
199 DIE_IF(ret != DW_DLV_OK);
200 ret = dwarf_formref(attr, &cu_offs, &__dw_error);
201 DIE_IF(ret != DW_DLV_OK);
202 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR);
203 return cu_offs;
204} 199}
205 200
206/* Get entry pc(or low pc, 1st entry of ranges) of the die */ 201/* Get data_member_location offset */
207static Dwarf_Addr die_get_entrypc(Dwarf_Die dw_die) 202static int die_get_data_member_location(Dwarf_Die *mb_die, Dwarf_Word *offs)
208{ 203{
209 Dwarf_Attribute attr; 204 Dwarf_Attribute attr;
210 Dwarf_Addr addr; 205 Dwarf_Op *expr;
211 Dwarf_Off offs; 206 size_t nexpr;
212 Dwarf_Ranges *ranges;
213 Dwarf_Signed cnt;
214 int ret; 207 int ret;
215 208
216 /* Try to get entry pc */ 209 if (dwarf_attr(mb_die, DW_AT_data_member_location, &attr) == NULL)
217 ret = dwarf_attr(dw_die, DW_AT_entry_pc, &attr, &__dw_error); 210 return -ENOENT;
218 DIE_IF(ret == DW_DLV_ERROR); 211
219 if (ret == DW_DLV_OK) { 212 if (dwarf_formudata(&attr, offs) != 0) {
220 ret = dwarf_formaddr(attr, &addr, &__dw_error); 213 /* DW_AT_data_member_location should be DW_OP_plus_uconst */
221 DIE_IF(ret != DW_DLV_OK); 214 ret = dwarf_getlocation(&attr, &expr, &nexpr);
222 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR); 215 if (ret < 0 || nexpr == 0)
223 return addr; 216 return -ENOENT;
224 } 217
225 218 if (expr[0].atom != DW_OP_plus_uconst || nexpr != 1) {
226 /* Try to get low pc */ 219 pr_debug("Unable to get offset:Unexpected OP %x (%zd)\n",
227 ret = dwarf_lowpc(dw_die, &addr, &__dw_error); 220 expr[0].atom, nexpr);
228 DIE_IF(ret == DW_DLV_ERROR); 221 return -ENOTSUP;
229 if (ret == DW_DLV_OK) 222 }
230 return addr; 223 *offs = (Dwarf_Word)expr[0].number;
231 224 }
232 /* Try to get ranges */ 225 return 0;
233 ret = dwarf_attr(dw_die, DW_AT_ranges, &attr, &__dw_error);
234 DIE_IF(ret != DW_DLV_OK);
235 ret = dwarf_formref(attr, &offs, &__dw_error);
236 DIE_IF(ret != DW_DLV_OK);
237 ret = dwarf_get_ranges(__dw_debug, offs, &ranges, &cnt, NULL,
238 &__dw_error);
239 DIE_IF(ret != DW_DLV_OK);
240 addr = ranges[0].dwr_addr1;
241 dwarf_ranges_dealloc(__dw_debug, ranges, cnt);
242 return addr;
243} 226}
244 227
245/* 228/* Return values for die_find callbacks */
246 * Search a Die from Die tree. 229enum {
247 * Note: cur_link->die should be deallocated in this function. 230 DIE_FIND_CB_FOUND = 0, /* End of Search */
248 */ 231 DIE_FIND_CB_CHILD = 1, /* Search only children */
249static int __search_die_tree(struct die_link *cur_link, 232 DIE_FIND_CB_SIBLING = 2, /* Search only siblings */
250 int (*die_cb)(struct die_link *, void *), 233 DIE_FIND_CB_CONTINUE = 3, /* Search children and siblings */
251 void *data) 234};
235
236/* Search a child die */
237static Dwarf_Die *die_find_child(Dwarf_Die *rt_die,
238 int (*callback)(Dwarf_Die *, void *),
239 void *data, Dwarf_Die *die_mem)
252{ 240{
253 Dwarf_Die new_die; 241 Dwarf_Die child_die;
254 struct die_link new_link;
255 int ret; 242 int ret;
256 243
257 if (!die_cb) 244 ret = dwarf_child(rt_die, die_mem);
258 return 0; 245 if (ret != 0)
246 return NULL;
247
248 do {
249 ret = callback(die_mem, data);
250 if (ret == DIE_FIND_CB_FOUND)
251 return die_mem;
259 252
260 /* Check current die */ 253 if ((ret & DIE_FIND_CB_CHILD) &&
261 while (!(ret = die_cb(cur_link, data))) { 254 die_find_child(die_mem, callback, data, &child_die)) {
262 /* Check child die */ 255 memcpy(die_mem, &child_die, sizeof(Dwarf_Die));
263 ret = dwarf_child(cur_link->die, &new_die, &__dw_error); 256 return die_mem;
264 DIE_IF(ret == DW_DLV_ERROR);
265 if (ret == DW_DLV_OK) {
266 new_link.parent = cur_link;
267 new_link.die = new_die;
268 ret = __search_die_tree(&new_link, die_cb, data);
269 if (ret)
270 break;
271 } 257 }
258 } while ((ret & DIE_FIND_CB_SIBLING) &&
259 dwarf_siblingof(die_mem, die_mem) == 0);
272 260
273 /* Move to next sibling */ 261 return NULL;
274 ret = dwarf_siblingof(__dw_debug, cur_link->die, &new_die,
275 &__dw_error);
276 DIE_IF(ret == DW_DLV_ERROR);
277 dwarf_dealloc(__dw_debug, cur_link->die, DW_DLA_DIE);
278 cur_link->die = new_die;
279 if (ret == DW_DLV_NO_ENTRY)
280 return 0;
281 }
282 dwarf_dealloc(__dw_debug, cur_link->die, DW_DLA_DIE);
283 return ret;
284} 262}
285 263
286/* Search a die in its children's die tree */ 264struct __addr_die_search_param {
287static int search_die_from_children(Dwarf_Die parent_die, 265 Dwarf_Addr addr;
288 int (*die_cb)(struct die_link *, void *), 266 Dwarf_Die *die_mem;
289 void *data) 267};
268
269static int __die_search_func_cb(Dwarf_Die *fn_die, void *data)
290{ 270{
291 struct die_link new_link; 271 struct __addr_die_search_param *ad = data;
292 int ret;
293 272
294 new_link.parent = NULL; 273 if (dwarf_tag(fn_die) == DW_TAG_subprogram &&
295 ret = dwarf_child(parent_die, &new_link.die, &__dw_error); 274 dwarf_haspc(fn_die, ad->addr)) {
296 DIE_IF(ret == DW_DLV_ERROR); 275 memcpy(ad->die_mem, fn_die, sizeof(Dwarf_Die));
297 if (ret == DW_DLV_OK) 276 return DWARF_CB_ABORT;
298 return __search_die_tree(&new_link, die_cb, data); 277 }
278 return DWARF_CB_OK;
279}
280
281/* Search a real subprogram including this line, */
282static Dwarf_Die *die_find_real_subprogram(Dwarf_Die *cu_die, Dwarf_Addr addr,
283 Dwarf_Die *die_mem)
284{
285 struct __addr_die_search_param ad;
286 ad.addr = addr;
287 ad.die_mem = die_mem;
288 /* dwarf_getscopes can't find subprogram. */
289 if (!dwarf_getfuncs(cu_die, __die_search_func_cb, &ad, 0))
290 return NULL;
299 else 291 else
300 return 0; 292 return die_mem;
301} 293}
302 294
303/* Find a locdesc corresponding to the address */ 295/* die_find callback for inline function search */
304static int attr_get_locdesc(Dwarf_Attribute attr, Dwarf_Locdesc *desc, 296static int __die_find_inline_cb(Dwarf_Die *die_mem, void *data)
305 Dwarf_Addr addr)
306{ 297{
307 Dwarf_Signed lcnt; 298 Dwarf_Addr *addr = data;
308 Dwarf_Locdesc **llbuf;
309 int ret, i;
310 299
311 ret = dwarf_loclist_n(attr, &llbuf, &lcnt, &__dw_error); 300 if (dwarf_tag(die_mem) == DW_TAG_inlined_subroutine &&
312 DIE_IF(ret != DW_DLV_OK); 301 dwarf_haspc(die_mem, *addr))
313 ret = DW_DLV_NO_ENTRY; 302 return DIE_FIND_CB_FOUND;
314 for (i = 0; i < lcnt; ++i) { 303
315 if (llbuf[i]->ld_lopc <= addr && 304 return DIE_FIND_CB_CONTINUE;
316 llbuf[i]->ld_hipc > addr) {
317 memcpy(desc, llbuf[i], sizeof(Dwarf_Locdesc));
318 desc->ld_s =
319 malloc(sizeof(Dwarf_Loc) * llbuf[i]->ld_cents);
320 DIE_IF(desc->ld_s == NULL);
321 memcpy(desc->ld_s, llbuf[i]->ld_s,
322 sizeof(Dwarf_Loc) * llbuf[i]->ld_cents);
323 ret = DW_DLV_OK;
324 break;
325 }
326 dwarf_dealloc(__dw_debug, llbuf[i]->ld_s, DW_DLA_LOC_BLOCK);
327 dwarf_dealloc(__dw_debug, llbuf[i], DW_DLA_LOCDESC);
328 }
329 /* Releasing loop */
330 for (; i < lcnt; ++i) {
331 dwarf_dealloc(__dw_debug, llbuf[i]->ld_s, DW_DLA_LOC_BLOCK);
332 dwarf_dealloc(__dw_debug, llbuf[i], DW_DLA_LOCDESC);
333 }
334 dwarf_dealloc(__dw_debug, llbuf, DW_DLA_LIST);
335 return ret;
336} 305}
337 306
338/* Get decl_file attribute value (file number) */ 307/* Similar to dwarf_getfuncs, but returns inlined_subroutine if exists. */
339static Dwarf_Unsigned die_get_decl_file(Dwarf_Die sp_die) 308static Dwarf_Die *die_find_inlinefunc(Dwarf_Die *sp_die, Dwarf_Addr addr,
309 Dwarf_Die *die_mem)
340{ 310{
341 Dwarf_Attribute attr; 311 return die_find_child(sp_die, __die_find_inline_cb, &addr, die_mem);
342 Dwarf_Unsigned fno; 312}
343 int ret;
344 313
345 ret = dwarf_attr(sp_die, DW_AT_decl_file, &attr, &__dw_error); 314static int __die_find_variable_cb(Dwarf_Die *die_mem, void *data)
346 DIE_IF(ret != DW_DLV_OK); 315{
347 dwarf_formudata(attr, &fno, &__dw_error); 316 const char *name = data;
348 DIE_IF(ret != DW_DLV_OK); 317 int tag;
349 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR); 318
350 return fno; 319 tag = dwarf_tag(die_mem);
320 if ((tag == DW_TAG_formal_parameter ||
321 tag == DW_TAG_variable) &&
322 (die_compare_name(die_mem, name) == 0))
323 return DIE_FIND_CB_FOUND;
324
325 return DIE_FIND_CB_CONTINUE;
351} 326}
352 327
353/* Get decl_line attribute value (line number) */ 328/* Find a variable called 'name' */
354static Dwarf_Unsigned die_get_decl_line(Dwarf_Die sp_die) 329static Dwarf_Die *die_find_variable(Dwarf_Die *sp_die, const char *name,
330 Dwarf_Die *die_mem)
355{ 331{
356 Dwarf_Attribute attr; 332 return die_find_child(sp_die, __die_find_variable_cb, (void *)name,
357 Dwarf_Unsigned lno; 333 die_mem);
358 int ret; 334}
335
336static int __die_find_member_cb(Dwarf_Die *die_mem, void *data)
337{
338 const char *name = data;
359 339
360 ret = dwarf_attr(sp_die, DW_AT_decl_line, &attr, &__dw_error); 340 if ((dwarf_tag(die_mem) == DW_TAG_member) &&
361 DIE_IF(ret != DW_DLV_OK); 341 (die_compare_name(die_mem, name) == 0))
362 dwarf_formudata(attr, &lno, &__dw_error); 342 return DIE_FIND_CB_FOUND;
363 DIE_IF(ret != DW_DLV_OK); 343
364 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR); 344 return DIE_FIND_CB_SIBLING;
365 return lno; 345}
346
347/* Find a member called 'name' */
348static Dwarf_Die *die_find_member(Dwarf_Die *st_die, const char *name,
349 Dwarf_Die *die_mem)
350{
351 return die_find_child(st_die, __die_find_member_cb, (void *)name,
352 die_mem);
366} 353}
367 354
368/* 355/*
@@ -370,361 +357,950 @@ static Dwarf_Unsigned die_get_decl_line(Dwarf_Die sp_die)
370 */ 357 */
371 358
372/* Show a location */ 359/* Show a location */
373static void show_location(Dwarf_Loc *loc, struct probe_finder *pf) 360static int convert_location(Dwarf_Op *op, struct probe_finder *pf)
374{ 361{
375 Dwarf_Small op; 362 unsigned int regn;
376 Dwarf_Unsigned regn; 363 Dwarf_Word offs = 0;
377 Dwarf_Signed offs; 364 bool ref = false;
378 int deref = 0, ret;
379 const char *regs; 365 const char *regs;
380 366 struct kprobe_trace_arg *tvar = pf->tvar;
381 op = loc->lr_atom;
382 367
383 /* If this is based on frame buffer, set the offset */ 368 /* If this is based on frame buffer, set the offset */
384 if (op == DW_OP_fbreg) { 369 if (op->atom == DW_OP_fbreg) {
385 deref = 1; 370 if (pf->fb_ops == NULL) {
386 offs = (Dwarf_Signed)loc->lr_number; 371 pr_warning("The attribute of frame base is not "
387 op = pf->fbloc.ld_s[0].lr_atom; 372 "supported.\n");
388 loc = &pf->fbloc.ld_s[0]; 373 return -ENOTSUP;
389 } else 374 }
390 offs = 0; 375 ref = true;
391 376 offs = op->number;
392 if (op >= DW_OP_breg0 && op <= DW_OP_breg31) { 377 op = &pf->fb_ops[0];
393 regn = op - DW_OP_breg0; 378 }
394 offs += (Dwarf_Signed)loc->lr_number; 379
395 deref = 1; 380 if (op->atom >= DW_OP_breg0 && op->atom <= DW_OP_breg31) {
396 } else if (op >= DW_OP_reg0 && op <= DW_OP_reg31) { 381 regn = op->atom - DW_OP_breg0;
397 regn = op - DW_OP_reg0; 382 offs += op->number;
398 } else if (op == DW_OP_bregx) { 383 ref = true;
399 regn = loc->lr_number; 384 } else if (op->atom >= DW_OP_reg0 && op->atom <= DW_OP_reg31) {
400 offs += (Dwarf_Signed)loc->lr_number2; 385 regn = op->atom - DW_OP_reg0;
401 deref = 1; 386 } else if (op->atom == DW_OP_bregx) {
402 } else if (op == DW_OP_regx) { 387 regn = op->number;
403 regn = loc->lr_number; 388 offs += op->number2;
404 } else 389 ref = true;
405 die("Dwarf_OP %d is not supported.\n", op); 390 } else if (op->atom == DW_OP_regx) {
391 regn = op->number;
392 } else {
393 pr_warning("DW_OP %x is not supported.\n", op->atom);
394 return -ENOTSUP;
395 }
406 396
407 regs = get_arch_regstr(regn); 397 regs = get_arch_regstr(regn);
408 if (!regs) 398 if (!regs) {
409 die("%lld exceeds max register number.\n", regn); 399 pr_warning("Mapping for DWARF register number %u missing on this architecture.", regn);
400 return -ERANGE;
401 }
410 402
411 if (deref) 403 tvar->value = strdup(regs);
412 ret = snprintf(pf->buf, pf->len, 404 if (tvar->value == NULL)
413 " %s=%+lld(%s)", pf->var, offs, regs); 405 return -ENOMEM;
414 else 406
415 ret = snprintf(pf->buf, pf->len, " %s=%s", pf->var, regs); 407 if (ref) {
416 DIE_IF(ret < 0); 408 tvar->ref = zalloc(sizeof(struct kprobe_trace_arg_ref));
417 DIE_IF(ret >= pf->len); 409 if (tvar->ref == NULL)
410 return -ENOMEM;
411 tvar->ref->offset = (long)offs;
412 }
413 return 0;
418} 414}
419 415
420/* Show a variables in kprobe event format */ 416static int convert_variable_type(Dwarf_Die *vr_die,
421static void show_variable(Dwarf_Die vr_die, struct probe_finder *pf) 417 struct kprobe_trace_arg *targ)
422{ 418{
423 Dwarf_Attribute attr; 419 Dwarf_Die type;
424 Dwarf_Locdesc ld; 420 char buf[16];
425 int ret; 421 int ret;
426 422
427 ret = dwarf_attr(vr_die, DW_AT_location, &attr, &__dw_error); 423 if (die_get_real_type(vr_die, &type) == NULL) {
428 if (ret != DW_DLV_OK) 424 pr_warning("Failed to get a type information of %s.\n",
429 goto error; 425 dwarf_diename(vr_die));
430 ret = attr_get_locdesc(attr, &ld, (pf->addr - pf->cu_base)); 426 return -ENOENT;
431 if (ret != DW_DLV_OK) 427 }
432 goto error;
433 /* TODO? */
434 DIE_IF(ld.ld_cents != 1);
435 show_location(&ld.ld_s[0], pf);
436 free(ld.ld_s);
437 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR);
438 return ;
439error:
440 die("Failed to find the location of %s at this address.\n"
441 " Perhaps, it has been optimized out.\n", pf->var);
442}
443 428
444static int variable_callback(struct die_link *dlink, void *data) 429 ret = die_get_byte_size(&type) * 8;
445{ 430 if (ret) {
446 struct probe_finder *pf = (struct probe_finder *)data; 431 /* Check the bitwidth */
447 Dwarf_Half tag; 432 if (ret > MAX_BASIC_TYPE_BITS) {
448 int ret; 433 pr_info("%s exceeds max-bitwidth."
434 " Cut down to %d bits.\n",
435 dwarf_diename(&type), MAX_BASIC_TYPE_BITS);
436 ret = MAX_BASIC_TYPE_BITS;
437 }
449 438
450 ret = dwarf_tag(dlink->die, &tag, &__dw_error); 439 ret = snprintf(buf, 16, "%c%d",
451 DIE_IF(ret == DW_DLV_ERROR); 440 die_is_signed_type(&type) ? 's' : 'u', ret);
452 if ((tag == DW_TAG_formal_parameter || 441 if (ret < 0 || ret >= 16) {
453 tag == DW_TAG_variable) && 442 if (ret >= 16)
454 (die_compare_name(dlink->die, pf->var) == 0)) { 443 ret = -E2BIG;
455 show_variable(dlink->die, pf); 444 pr_warning("Failed to convert variable type: %s\n",
456 return 1; 445 strerror(-ret));
446 return ret;
447 }
448 targ->type = strdup(buf);
449 if (targ->type == NULL)
450 return -ENOMEM;
457 } 451 }
458 /* TODO: Support struct members and arrays */
459 return 0; 452 return 0;
460} 453}
461 454
462/* Find a variable in a subprogram die */ 455static int convert_variable_fields(Dwarf_Die *vr_die, const char *varname,
463static void find_variable(Dwarf_Die sp_die, struct probe_finder *pf) 456 struct perf_probe_arg_field *field,
457 struct kprobe_trace_arg_ref **ref_ptr,
458 Dwarf_Die *die_mem)
464{ 459{
460 struct kprobe_trace_arg_ref *ref = *ref_ptr;
461 Dwarf_Die type;
462 Dwarf_Word offs;
465 int ret; 463 int ret;
466 464
467 if (!is_c_varname(pf->var)) { 465 pr_debug("converting %s in %s\n", field->name, varname);
468 /* Output raw parameters */ 466 if (die_get_real_type(vr_die, &type) == NULL) {
469 ret = snprintf(pf->buf, pf->len, " %s", pf->var); 467 pr_warning("Failed to get the type of %s.\n", varname);
470 DIE_IF(ret < 0); 468 return -ENOENT;
471 DIE_IF(ret >= pf->len);
472 return ;
473 } 469 }
474 470
475 pr_debug("Searching '%s' variable in context.\n", pf->var); 471 /* Check the pointer and dereference */
476 /* Search child die for local variables and parameters. */ 472 if (dwarf_tag(&type) == DW_TAG_pointer_type) {
477 ret = search_die_from_children(sp_die, variable_callback, pf); 473 if (!field->ref) {
478 if (!ret) 474 pr_err("Semantic error: %s must be referred by '->'\n",
479 die("Failed to find '%s' in this function.\n", pf->var); 475 field->name);
476 return -EINVAL;
477 }
478 /* Get the type pointed by this pointer */
479 if (die_get_real_type(&type, &type) == NULL) {
480 pr_warning("Failed to get the type of %s.\n", varname);
481 return -ENOENT;
482 }
483 /* Verify it is a data structure */
484 if (dwarf_tag(&type) != DW_TAG_structure_type) {
485 pr_warning("%s is not a data structure.\n", varname);
486 return -EINVAL;
487 }
488
489 ref = zalloc(sizeof(struct kprobe_trace_arg_ref));
490 if (ref == NULL)
491 return -ENOMEM;
492 if (*ref_ptr)
493 (*ref_ptr)->next = ref;
494 else
495 *ref_ptr = ref;
496 } else {
497 /* Verify it is a data structure */
498 if (dwarf_tag(&type) != DW_TAG_structure_type) {
499 pr_warning("%s is not a data structure.\n", varname);
500 return -EINVAL;
501 }
502 if (field->ref) {
503 pr_err("Semantic error: %s must be referred by '.'\n",
504 field->name);
505 return -EINVAL;
506 }
507 if (!ref) {
508 pr_warning("Structure on a register is not "
509 "supported yet.\n");
510 return -ENOTSUP;
511 }
512 }
513
514 if (die_find_member(&type, field->name, die_mem) == NULL) {
515 pr_warning("%s(tyep:%s) has no member %s.\n", varname,
516 dwarf_diename(&type), field->name);
517 return -EINVAL;
518 }
519
520 /* Get the offset of the field */
521 ret = die_get_data_member_location(die_mem, &offs);
522 if (ret < 0) {
523 pr_warning("Failed to get the offset of %s.\n", field->name);
524 return ret;
525 }
526 ref->offset += (long)offs;
527
528 /* Converting next field */
529 if (field->next)
530 return convert_variable_fields(die_mem, field->name,
531 field->next, &ref, die_mem);
532 else
533 return 0;
480} 534}
481 535
482/* Get a frame base on the address */ 536/* Show a variables in kprobe event format */
483static void get_current_frame_base(Dwarf_Die sp_die, struct probe_finder *pf) 537static int convert_variable(Dwarf_Die *vr_die, struct probe_finder *pf)
484{ 538{
485 Dwarf_Attribute attr; 539 Dwarf_Attribute attr;
540 Dwarf_Die die_mem;
541 Dwarf_Op *expr;
542 size_t nexpr;
486 int ret; 543 int ret;
487 544
488 ret = dwarf_attr(sp_die, DW_AT_frame_base, &attr, &__dw_error); 545 if (dwarf_attr(vr_die, DW_AT_location, &attr) == NULL)
489 DIE_IF(ret != DW_DLV_OK); 546 goto error;
490 ret = attr_get_locdesc(attr, &pf->fbloc, (pf->addr - pf->cu_base)); 547 /* TODO: handle more than 1 exprs */
491 DIE_IF(ret != DW_DLV_OK); 548 ret = dwarf_getlocation_addr(&attr, pf->addr, &expr, &nexpr, 1);
492 dwarf_dealloc(__dw_debug, attr, DW_DLA_ATTR); 549 if (ret <= 0 || nexpr == 0)
550 goto error;
551
552 ret = convert_location(expr, pf);
553 if (ret == 0 && pf->pvar->field) {
554 ret = convert_variable_fields(vr_die, pf->pvar->var,
555 pf->pvar->field, &pf->tvar->ref,
556 &die_mem);
557 vr_die = &die_mem;
558 }
559 if (ret == 0) {
560 if (pf->pvar->type) {
561 pf->tvar->type = strdup(pf->pvar->type);
562 if (pf->tvar->type == NULL)
563 ret = -ENOMEM;
564 } else
565 ret = convert_variable_type(vr_die, pf->tvar);
566 }
567 /* *expr will be cached in libdw. Don't free it. */
568 return ret;
569error:
570 /* TODO: Support const_value */
571 pr_err("Failed to find the location of %s at this address.\n"
572 " Perhaps, it has been optimized out.\n", pf->pvar->var);
573 return -ENOENT;
493} 574}
494 575
495static void free_current_frame_base(struct probe_finder *pf) 576/* Find a variable in a subprogram die */
577static int find_variable(Dwarf_Die *sp_die, struct probe_finder *pf)
496{ 578{
497 free(pf->fbloc.ld_s); 579 Dwarf_Die vr_die;
498 memset(&pf->fbloc, 0, sizeof(Dwarf_Locdesc)); 580 char buf[32], *ptr;
581 int ret;
582
583 /* TODO: Support arrays */
584 if (pf->pvar->name)
585 pf->tvar->name = strdup(pf->pvar->name);
586 else {
587 ret = synthesize_perf_probe_arg(pf->pvar, buf, 32);
588 if (ret < 0)
589 return ret;
590 ptr = strchr(buf, ':'); /* Change type separator to _ */
591 if (ptr)
592 *ptr = '_';
593 pf->tvar->name = strdup(buf);
594 }
595 if (pf->tvar->name == NULL)
596 return -ENOMEM;
597
598 if (!is_c_varname(pf->pvar->var)) {
599 /* Copy raw parameters */
600 pf->tvar->value = strdup(pf->pvar->var);
601 if (pf->tvar->value == NULL)
602 return -ENOMEM;
603 else
604 return 0;
605 }
606
607 pr_debug("Searching '%s' variable in context.\n",
608 pf->pvar->var);
609 /* Search child die for local variables and parameters. */
610 if (!die_find_variable(sp_die, pf->pvar->var, &vr_die)) {
611 pr_warning("Failed to find '%s' in this function.\n",
612 pf->pvar->var);
613 return -ENOENT;
614 }
615 return convert_variable(&vr_die, pf);
499} 616}
500 617
501/* Show a probe point to output buffer */ 618/* Show a probe point to output buffer */
502static void show_probepoint(Dwarf_Die sp_die, Dwarf_Signed offs, 619static int convert_probe_point(Dwarf_Die *sp_die, struct probe_finder *pf)
503 struct probe_finder *pf) 620{
504{ 621 struct kprobe_trace_event *tev;
505 struct probe_point *pp = pf->pp; 622 Dwarf_Addr eaddr;
506 char *name; 623 Dwarf_Die die_mem;
507 char tmp[MAX_PROBE_BUFFER]; 624 const char *name;
508 int ret, i, len; 625 int ret, i;
509 626 Dwarf_Attribute fb_attr;
510 /* Output name of probe point */ 627 size_t nops;
511 ret = dwarf_diename(sp_die, &name, &__dw_error); 628
512 DIE_IF(ret == DW_DLV_ERROR); 629 if (pf->ntevs == pf->max_tevs) {
513 if (ret == DW_DLV_OK) { 630 pr_warning("Too many( > %d) probe point found.\n",
514 ret = snprintf(tmp, MAX_PROBE_BUFFER, "%s+%u", name, 631 pf->max_tevs);
515 (unsigned int)offs); 632 return -ERANGE;
516 /* Copy the function name if possible */ 633 }
517 if (!pp->function) { 634 tev = &pf->tevs[pf->ntevs++];
518 pp->function = strdup(name); 635
519 pp->offset = offs; 636 /* If no real subprogram, find a real one */
637 if (!sp_die || dwarf_tag(sp_die) != DW_TAG_subprogram) {
638 sp_die = die_find_real_subprogram(&pf->cu_die,
639 pf->addr, &die_mem);
640 if (!sp_die) {
641 pr_warning("Failed to find probe point in any "
642 "functions.\n");
643 return -ENOENT;
520 } 644 }
521 dwarf_dealloc(__dw_debug, name, DW_DLA_STRING); 645 }
522 } else { 646
647 /* Copy the name of probe point */
648 name = dwarf_diename(sp_die);
649 if (name) {
650 if (dwarf_entrypc(sp_die, &eaddr) != 0) {
651 pr_warning("Failed to get entry pc of %s\n",
652 dwarf_diename(sp_die));
653 return -ENOENT;
654 }
655 tev->point.symbol = strdup(name);
656 if (tev->point.symbol == NULL)
657 return -ENOMEM;
658 tev->point.offset = (unsigned long)(pf->addr - eaddr);
659 } else
523 /* This function has no name. */ 660 /* This function has no name. */
524 ret = snprintf(tmp, MAX_PROBE_BUFFER, "0x%llx", pf->addr); 661 tev->point.offset = (unsigned long)pf->addr;
525 if (!pp->function) { 662
526 /* TODO: Use _stext */ 663 pr_debug("Probe point found: %s+%lu\n", tev->point.symbol,
527 pp->function = strdup(""); 664 tev->point.offset);
528 pp->offset = (int)pf->addr; 665
666 /* Get the frame base attribute/ops */
667 dwarf_attr(sp_die, DW_AT_frame_base, &fb_attr);
668 ret = dwarf_getlocation_addr(&fb_attr, pf->addr, &pf->fb_ops, &nops, 1);
669 if (ret <= 0 || nops == 0) {
670 pf->fb_ops = NULL;
671#if _ELFUTILS_PREREQ(0, 142)
672 } else if (nops == 1 && pf->fb_ops[0].atom == DW_OP_call_frame_cfa &&
673 pf->cfi != NULL) {
674 Dwarf_Frame *frame;
675 if (dwarf_cfi_addrframe(pf->cfi, pf->addr, &frame) != 0 ||
676 dwarf_frame_cfa(frame, &pf->fb_ops, &nops) != 0) {
677 pr_warning("Failed to get CFA on 0x%jx\n",
678 (uintmax_t)pf->addr);
679 return -ENOENT;
529 } 680 }
681#endif
530 } 682 }
531 DIE_IF(ret < 0);
532 DIE_IF(ret >= MAX_PROBE_BUFFER);
533 len = ret;
534 pr_debug("Probe point found: %s\n", tmp);
535 683
536 /* Find each argument */ 684 /* Find each argument */
537 get_current_frame_base(sp_die, pf); 685 tev->nargs = pf->pev->nargs;
538 for (i = 0; i < pp->nr_args; i++) { 686 tev->args = zalloc(sizeof(struct kprobe_trace_arg) * tev->nargs);
539 pf->var = pp->args[i]; 687 if (tev->args == NULL)
540 pf->buf = &tmp[len]; 688 return -ENOMEM;
541 pf->len = MAX_PROBE_BUFFER - len; 689 for (i = 0; i < pf->pev->nargs; i++) {
542 find_variable(sp_die, pf); 690 pf->pvar = &pf->pev->args[i];
543 len += strlen(pf->buf); 691 pf->tvar = &tev->args[i];
692 ret = find_variable(sp_die, pf);
693 if (ret != 0)
694 return ret;
544 } 695 }
545 free_current_frame_base(pf);
546 696
547 pp->probes[pp->found] = strdup(tmp); 697 /* *pf->fb_ops will be cached in libdw. Don't free it. */
548 pp->found++; 698 pf->fb_ops = NULL;
699 return 0;
549} 700}
550 701
551static int probeaddr_callback(struct die_link *dlink, void *data) 702/* Find probe point from its line number */
703static int find_probe_point_by_line(struct probe_finder *pf)
552{ 704{
553 struct probe_finder *pf = (struct probe_finder *)data; 705 Dwarf_Lines *lines;
554 Dwarf_Half tag; 706 Dwarf_Line *line;
555 Dwarf_Signed offs; 707 size_t nlines, i;
556 int ret; 708 Dwarf_Addr addr;
709 int lineno;
710 int ret = 0;
557 711
558 ret = dwarf_tag(dlink->die, &tag, &__dw_error); 712 if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) {
559 DIE_IF(ret == DW_DLV_ERROR); 713 pr_warning("No source lines found in this CU.\n");
560 /* Check the address is in this subprogram */ 714 return -ENOENT;
561 if (tag == DW_TAG_subprogram &&
562 die_within_subprogram(dlink->die, pf->addr, &offs)) {
563 show_probepoint(dlink->die, offs, pf);
564 return 1;
565 } 715 }
566 return 0; 716
717 for (i = 0; i < nlines && ret == 0; i++) {
718 line = dwarf_onesrcline(lines, i);
719 if (dwarf_lineno(line, &lineno) != 0 ||
720 lineno != pf->lno)
721 continue;
722
723 /* TODO: Get fileno from line, but how? */
724 if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0)
725 continue;
726
727 if (dwarf_lineaddr(line, &addr) != 0) {
728 pr_warning("Failed to get the address of the line.\n");
729 return -ENOENT;
730 }
731 pr_debug("Probe line found: line[%d]:%d addr:0x%jx\n",
732 (int)i, lineno, (uintmax_t)addr);
733 pf->addr = addr;
734
735 ret = convert_probe_point(NULL, pf);
736 /* Continuing, because target line might be inlined. */
737 }
738 return ret;
567} 739}
568 740
569/* Find probe point from its line number */ 741/* Find lines which match lazy pattern */
570static void find_by_line(struct probe_finder *pf) 742static int find_lazy_match_lines(struct list_head *head,
743 const char *fname, const char *pat)
571{ 744{
572 Dwarf_Signed cnt, i, clm; 745 char *fbuf, *p1, *p2;
573 Dwarf_Line *lines; 746 int fd, line, nlines = -1;
574 Dwarf_Unsigned lineno = 0; 747 struct stat st;
748
749 fd = open(fname, O_RDONLY);
750 if (fd < 0) {
751 pr_warning("Failed to open %s: %s\n", fname, strerror(-fd));
752 return -errno;
753 }
754
755 if (fstat(fd, &st) < 0) {
756 pr_warning("Failed to get the size of %s: %s\n",
757 fname, strerror(errno));
758 nlines = -errno;
759 goto out_close;
760 }
761
762 nlines = -ENOMEM;
763 fbuf = malloc(st.st_size + 2);
764 if (fbuf == NULL)
765 goto out_close;
766 if (read(fd, fbuf, st.st_size) < 0) {
767 pr_warning("Failed to read %s: %s\n", fname, strerror(errno));
768 nlines = -errno;
769 goto out_free_fbuf;
770 }
771 fbuf[st.st_size] = '\n'; /* Dummy line */
772 fbuf[st.st_size + 1] = '\0';
773 p1 = fbuf;
774 line = 1;
775 nlines = 0;
776 while ((p2 = strchr(p1, '\n')) != NULL) {
777 *p2 = '\0';
778 if (strlazymatch(p1, pat)) {
779 line_list__add_line(head, line);
780 nlines++;
781 }
782 line++;
783 p1 = p2 + 1;
784 }
785out_free_fbuf:
786 free(fbuf);
787out_close:
788 close(fd);
789 return nlines;
790}
791
792/* Find probe points from lazy pattern */
793static int find_probe_point_lazy(Dwarf_Die *sp_die, struct probe_finder *pf)
794{
795 Dwarf_Lines *lines;
796 Dwarf_Line *line;
797 size_t nlines, i;
575 Dwarf_Addr addr; 798 Dwarf_Addr addr;
576 Dwarf_Unsigned fno; 799 Dwarf_Die die_mem;
577 int ret; 800 int lineno;
801 int ret = 0;
802
803 if (list_empty(&pf->lcache)) {
804 /* Matching lazy line pattern */
805 ret = find_lazy_match_lines(&pf->lcache, pf->fname,
806 pf->pev->point.lazy_line);
807 if (ret == 0) {
808 pr_debug("No matched lines found in %s.\n", pf->fname);
809 return 0;
810 } else if (ret < 0)
811 return ret;
812 }
578 813
579 ret = dwarf_srclines(pf->cu_die, &lines, &cnt, &__dw_error); 814 if (dwarf_getsrclines(&pf->cu_die, &lines, &nlines) != 0) {
580 DIE_IF(ret != DW_DLV_OK); 815 pr_warning("No source lines found in this CU.\n");
816 return -ENOENT;
817 }
581 818
582 for (i = 0; i < cnt; i++) { 819 for (i = 0; i < nlines && ret >= 0; i++) {
583 ret = dwarf_line_srcfileno(lines[i], &fno, &__dw_error); 820 line = dwarf_onesrcline(lines, i);
584 DIE_IF(ret != DW_DLV_OK); 821
585 if (fno != pf->fno) 822 if (dwarf_lineno(line, &lineno) != 0 ||
823 !line_list__has_line(&pf->lcache, lineno))
586 continue; 824 continue;
587 825
588 ret = dwarf_lineno(lines[i], &lineno, &__dw_error); 826 /* TODO: Get fileno from line, but how? */
589 DIE_IF(ret != DW_DLV_OK); 827 if (strtailcmp(dwarf_linesrc(line, NULL, NULL), pf->fname) != 0)
590 if (lineno != pf->lno)
591 continue; 828 continue;
592 829
593 ret = dwarf_lineoff(lines[i], &clm, &__dw_error); 830 if (dwarf_lineaddr(line, &addr) != 0) {
594 DIE_IF(ret != DW_DLV_OK); 831 pr_debug("Failed to get the address of line %d.\n",
832 lineno);
833 continue;
834 }
835 if (sp_die) {
836 /* Address filtering 1: does sp_die include addr? */
837 if (!dwarf_haspc(sp_die, addr))
838 continue;
839 /* Address filtering 2: No child include addr? */
840 if (die_find_inlinefunc(sp_die, addr, &die_mem))
841 continue;
842 }
595 843
596 ret = dwarf_lineaddr(lines[i], &addr, &__dw_error); 844 pr_debug("Probe line found: line[%d]:%d addr:0x%llx\n",
597 DIE_IF(ret != DW_DLV_OK); 845 (int)i, lineno, (unsigned long long)addr);
598 pr_debug("Probe line found: line[%d]:%u,%d addr:0x%llx\n",
599 (int)i, (unsigned)lineno, (int)clm, addr);
600 pf->addr = addr; 846 pf->addr = addr;
601 /* Search a real subprogram including this line, */ 847
602 ret = search_die_from_children(pf->cu_die, 848 ret = convert_probe_point(sp_die, pf);
603 probeaddr_callback, pf);
604 if (ret == 0)
605 die("Probe point is not found in subprograms.\n");
606 /* Continuing, because target line might be inlined. */ 849 /* Continuing, because target line might be inlined. */
607 } 850 }
608 dwarf_srclines_dealloc(__dw_debug, lines, cnt); 851 /* TODO: deallocate lines, but how? */
852 return ret;
609} 853}
610 854
611/* Search function from function name */ 855/* Callback parameter with return value */
612static int probefunc_callback(struct die_link *dlink, void *data) 856struct dwarf_callback_param {
857 void *data;
858 int retval;
859};
860
861static int probe_point_inline_cb(Dwarf_Die *in_die, void *data)
613{ 862{
614 struct probe_finder *pf = (struct probe_finder *)data; 863 struct dwarf_callback_param *param = data;
615 struct probe_point *pp = pf->pp; 864 struct probe_finder *pf = param->data;
616 struct die_link *lk; 865 struct perf_probe_point *pp = &pf->pev->point;
617 Dwarf_Signed offs; 866 Dwarf_Addr addr;
618 Dwarf_Half tag;
619 int ret;
620 867
621 ret = dwarf_tag(dlink->die, &tag, &__dw_error); 868 if (pp->lazy_line)
622 DIE_IF(ret == DW_DLV_ERROR); 869 param->retval = find_probe_point_lazy(in_die, pf);
623 if (tag == DW_TAG_subprogram) { 870 else {
624 if (die_compare_name(dlink->die, pp->function) == 0) { 871 /* Get probe address */
625 if (pp->line) { /* Function relative line */ 872 if (dwarf_entrypc(in_die, &addr) != 0) {
626 pf->fno = die_get_decl_file(dlink->die); 873 pr_warning("Failed to get entry pc of %s.\n",
627 pf->lno = die_get_decl_line(dlink->die) 874 dwarf_diename(in_die));
628 + pp->line; 875 param->retval = -ENOENT;
629 find_by_line(pf); 876 return DWARF_CB_ABORT;
630 return 1; 877 }
631 } 878 pf->addr = addr;
632 if (die_inlined_subprogram(dlink->die)) { 879 pf->addr += pp->offset;
633 /* Inlined function, save it. */ 880 pr_debug("found inline addr: 0x%jx\n",
634 ret = dwarf_die_CU_offset(dlink->die, 881 (uintmax_t)pf->addr);
635 &pf->inl_offs, 882
636 &__dw_error); 883 param->retval = convert_probe_point(in_die, pf);
637 DIE_IF(ret != DW_DLV_OK); 884 if (param->retval < 0)
638 pr_debug("inline definition offset %lld\n", 885 return DWARF_CB_ABORT;
639 pf->inl_offs); 886 }
640 return 0; /* Continue to search */ 887
888 return DWARF_CB_OK;
889}
890
891/* Search function from function name */
892static int probe_point_search_cb(Dwarf_Die *sp_die, void *data)
893{
894 struct dwarf_callback_param *param = data;
895 struct probe_finder *pf = param->data;
896 struct perf_probe_point *pp = &pf->pev->point;
897
898 /* Check tag and diename */
899 if (dwarf_tag(sp_die) != DW_TAG_subprogram ||
900 die_compare_name(sp_die, pp->function) != 0)
901 return DWARF_CB_OK;
902
903 pf->fname = dwarf_decl_file(sp_die);
904 if (pp->line) { /* Function relative line */
905 dwarf_decl_line(sp_die, &pf->lno);
906 pf->lno += pp->line;
907 param->retval = find_probe_point_by_line(pf);
908 } else if (!dwarf_func_inline(sp_die)) {
909 /* Real function */
910 if (pp->lazy_line)
911 param->retval = find_probe_point_lazy(sp_die, pf);
912 else {
913 if (dwarf_entrypc(sp_die, &pf->addr) != 0) {
914 pr_warning("Failed to get entry pc of %s.\n",
915 dwarf_diename(sp_die));
916 param->retval = -ENOENT;
917 return DWARF_CB_ABORT;
641 } 918 }
642 /* Get probe address */
643 pf->addr = die_get_entrypc(dlink->die);
644 pf->addr += pp->offset; 919 pf->addr += pp->offset;
645 /* TODO: Check the address in this function */ 920 /* TODO: Check the address in this function */
646 show_probepoint(dlink->die, pp->offset, pf); 921 param->retval = convert_probe_point(sp_die, pf);
647 return 1; /* Exit; no same symbol in this CU. */
648 } 922 }
649 } else if (tag == DW_TAG_inlined_subroutine && pf->inl_offs) { 923 } else {
650 if (die_get_abstract_origin(dlink->die) == pf->inl_offs) { 924 struct dwarf_callback_param _param = {.data = (void *)pf,
651 /* Get probe address */ 925 .retval = 0};
652 pf->addr = die_get_entrypc(dlink->die); 926 /* Inlined function: search instances */
653 pf->addr += pp->offset; 927 dwarf_func_inline_instances(sp_die, probe_point_inline_cb,
654 pr_debug("found inline addr: 0x%llx\n", pf->addr); 928 &_param);
655 /* Inlined function. Get a real subprogram */ 929 param->retval = _param.retval;
656 for (lk = dlink->parent; lk != NULL; lk = lk->parent) { 930 }
657 tag = 0; 931
658 dwarf_tag(lk->die, &tag, &__dw_error); 932 return DWARF_CB_ABORT; /* Exit; no same symbol in this CU. */
659 DIE_IF(ret == DW_DLV_ERROR); 933}
660 if (tag == DW_TAG_subprogram && 934
661 !die_inlined_subprogram(lk->die)) 935static int find_probe_point_by_func(struct probe_finder *pf)
662 goto found; 936{
937 struct dwarf_callback_param _param = {.data = (void *)pf,
938 .retval = 0};
939 dwarf_getfuncs(&pf->cu_die, probe_point_search_cb, &_param, 0);
940 return _param.retval;
941}
942
943/* Find kprobe_trace_events specified by perf_probe_event from debuginfo */
944int find_kprobe_trace_events(int fd, struct perf_probe_event *pev,
945 struct kprobe_trace_event **tevs, int max_tevs)
946{
947 struct probe_finder pf = {.pev = pev, .max_tevs = max_tevs};
948 struct perf_probe_point *pp = &pev->point;
949 Dwarf_Off off, noff;
950 size_t cuhl;
951 Dwarf_Die *diep;
952 Dwarf *dbg;
953 int ret = 0;
954
955 pf.tevs = zalloc(sizeof(struct kprobe_trace_event) * max_tevs);
956 if (pf.tevs == NULL)
957 return -ENOMEM;
958 *tevs = pf.tevs;
959 pf.ntevs = 0;
960
961 dbg = dwarf_begin(fd, DWARF_C_READ);
962 if (!dbg) {
963 pr_warning("No dwarf info found in the vmlinux - "
964 "please rebuild with CONFIG_DEBUG_INFO=y.\n");
965 free(pf.tevs);
966 *tevs = NULL;
967 return -EBADF;
968 }
969
970#if _ELFUTILS_PREREQ(0, 142)
971 /* Get the call frame information from this dwarf */
972 pf.cfi = dwarf_getcfi(dbg);
973#endif
974
975 off = 0;
976 line_list__init(&pf.lcache);
977 /* Loop on CUs (Compilation Unit) */
978 while (!dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) &&
979 ret >= 0) {
980 /* Get the DIE(Debugging Information Entry) of this CU */
981 diep = dwarf_offdie(dbg, off + cuhl, &pf.cu_die);
982 if (!diep)
983 continue;
984
985 /* Check if target file is included. */
986 if (pp->file)
987 pf.fname = cu_find_realpath(&pf.cu_die, pp->file);
988 else
989 pf.fname = NULL;
990
991 if (!pp->file || pf.fname) {
992 if (pp->function)
993 ret = find_probe_point_by_func(&pf);
994 else if (pp->lazy_line)
995 ret = find_probe_point_lazy(NULL, &pf);
996 else {
997 pf.lno = pp->line;
998 ret = find_probe_point_by_line(&pf);
663 } 999 }
664 die("Failed to find real subprogram.\n"); 1000 }
1001 off = noff;
1002 }
1003 line_list__free(&pf.lcache);
1004 dwarf_end(dbg);
1005
1006 return (ret < 0) ? ret : pf.ntevs;
1007}
1008
1009/* Reverse search */
1010int find_perf_probe_point(int fd, unsigned long addr,
1011 struct perf_probe_point *ppt)
1012{
1013 Dwarf_Die cudie, spdie, indie;
1014 Dwarf *dbg;
1015 Dwarf_Line *line;
1016 Dwarf_Addr laddr, eaddr;
1017 const char *tmp;
1018 int lineno, ret = 0;
1019 bool found = false;
1020
1021 dbg = dwarf_begin(fd, DWARF_C_READ);
1022 if (!dbg)
1023 return -EBADF;
1024
1025 /* Find cu die */
1026 if (!dwarf_addrdie(dbg, (Dwarf_Addr)addr, &cudie)) {
1027 ret = -EINVAL;
1028 goto end;
1029 }
1030
1031 /* Find a corresponding line */
1032 line = dwarf_getsrc_die(&cudie, (Dwarf_Addr)addr);
1033 if (line) {
1034 if (dwarf_lineaddr(line, &laddr) == 0 &&
1035 (Dwarf_Addr)addr == laddr &&
1036 dwarf_lineno(line, &lineno) == 0) {
1037 tmp = dwarf_linesrc(line, NULL, NULL);
1038 if (tmp) {
1039 ppt->line = lineno;
1040 ppt->file = strdup(tmp);
1041 if (ppt->file == NULL) {
1042 ret = -ENOMEM;
1043 goto end;
1044 }
1045 found = true;
1046 }
1047 }
1048 }
1049
1050 /* Find a corresponding function */
1051 if (die_find_real_subprogram(&cudie, (Dwarf_Addr)addr, &spdie)) {
1052 tmp = dwarf_diename(&spdie);
1053 if (!tmp || dwarf_entrypc(&spdie, &eaddr) != 0)
1054 goto end;
1055
1056 if (ppt->line) {
1057 if (die_find_inlinefunc(&spdie, (Dwarf_Addr)addr,
1058 &indie)) {
1059 /* addr in an inline function */
1060 tmp = dwarf_diename(&indie);
1061 if (!tmp)
1062 goto end;
1063 ret = dwarf_decl_line(&indie, &lineno);
1064 } else {
1065 if (eaddr == addr) { /* Function entry */
1066 lineno = ppt->line;
1067 ret = 0;
1068 } else
1069 ret = dwarf_decl_line(&spdie, &lineno);
1070 }
1071 if (ret == 0) {
1072 /* Make a relative line number */
1073 ppt->line -= lineno;
1074 goto found;
1075 }
1076 }
1077 /* We don't have a line number, let's use offset */
1078 ppt->offset = addr - (unsigned long)eaddr;
665found: 1079found:
666 /* Get offset from subprogram */ 1080 ppt->function = strdup(tmp);
667 ret = die_within_subprogram(lk->die, pf->addr, &offs); 1081 if (ppt->function == NULL) {
668 DIE_IF(!ret); 1082 ret = -ENOMEM;
669 show_probepoint(lk->die, offs, pf); 1083 goto end;
670 /* Continue to search */
671 } 1084 }
1085 found = true;
672 } 1086 }
673 return 0; 1087
1088end:
1089 dwarf_end(dbg);
1090 if (ret >= 0)
1091 ret = found ? 1 : 0;
1092 return ret;
1093}
1094
1095/* Add a line and store the src path */
1096static int line_range_add_line(const char *src, unsigned int lineno,
1097 struct line_range *lr)
1098{
1099 /* Copy real path */
1100 if (!lr->path) {
1101 lr->path = strdup(src);
1102 if (lr->path == NULL)
1103 return -ENOMEM;
1104 }
1105 return line_list__add_line(&lr->line_list, lineno);
674} 1106}
675 1107
676static void find_by_func(struct probe_finder *pf) 1108/* Search function declaration lines */
1109static int line_range_funcdecl_cb(Dwarf_Die *sp_die, void *data)
677{ 1110{
678 search_die_from_children(pf->cu_die, probefunc_callback, pf); 1111 struct dwarf_callback_param *param = data;
1112 struct line_finder *lf = param->data;
1113 const char *src;
1114 int lineno;
1115
1116 src = dwarf_decl_file(sp_die);
1117 if (src && strtailcmp(src, lf->fname) != 0)
1118 return DWARF_CB_OK;
1119
1120 if (dwarf_decl_line(sp_die, &lineno) != 0 ||
1121 (lf->lno_s > lineno || lf->lno_e < lineno))
1122 return DWARF_CB_OK;
1123
1124 param->retval = line_range_add_line(src, lineno, lf->lr);
1125 if (param->retval < 0)
1126 return DWARF_CB_ABORT;
1127 return DWARF_CB_OK;
679} 1128}
680 1129
681/* Find a probe point */ 1130static int find_line_range_func_decl_lines(struct line_finder *lf)
682int find_probepoint(int fd, struct probe_point *pp)
683{ 1131{
684 Dwarf_Half addr_size = 0; 1132 struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0};
685 Dwarf_Unsigned next_cuh = 0; 1133 dwarf_getfuncs(&lf->cu_die, line_range_funcdecl_cb, &param, 0);
686 int cu_number = 0, ret; 1134 return param.retval;
687 struct probe_finder pf = {.pp = pp}; 1135}
1136
1137/* Find line range from its line number */
1138static int find_line_range_by_line(Dwarf_Die *sp_die, struct line_finder *lf)
1139{
1140 Dwarf_Lines *lines;
1141 Dwarf_Line *line;
1142 size_t nlines, i;
1143 Dwarf_Addr addr;
1144 int lineno, ret = 0;
1145 const char *src;
1146 Dwarf_Die die_mem;
688 1147
689 ret = dwarf_init(fd, DW_DLC_READ, 0, 0, &__dw_debug, &__dw_error); 1148 line_list__init(&lf->lr->line_list);
690 if (ret != DW_DLV_OK) 1149 if (dwarf_getsrclines(&lf->cu_die, &lines, &nlines) != 0) {
1150 pr_warning("No source lines found in this CU.\n");
691 return -ENOENT; 1151 return -ENOENT;
1152 }
1153
1154 /* Search probable lines on lines list */
1155 for (i = 0; i < nlines; i++) {
1156 line = dwarf_onesrcline(lines, i);
1157 if (dwarf_lineno(line, &lineno) != 0 ||
1158 (lf->lno_s > lineno || lf->lno_e < lineno))
1159 continue;
1160
1161 if (sp_die) {
1162 /* Address filtering 1: does sp_die include addr? */
1163 if (dwarf_lineaddr(line, &addr) != 0 ||
1164 !dwarf_haspc(sp_die, addr))
1165 continue;
1166
1167 /* Address filtering 2: No child include addr? */
1168 if (die_find_inlinefunc(sp_die, addr, &die_mem))
1169 continue;
1170 }
1171
1172 /* TODO: Get fileno from line, but how? */
1173 src = dwarf_linesrc(line, NULL, NULL);
1174 if (strtailcmp(src, lf->fname) != 0)
1175 continue;
1176
1177 ret = line_range_add_line(src, lineno, lf->lr);
1178 if (ret < 0)
1179 return ret;
1180 }
1181
1182 /*
1183 * Dwarf lines doesn't include function declarations. We have to
1184 * check functions list or given function.
1185 */
1186 if (sp_die) {
1187 src = dwarf_decl_file(sp_die);
1188 if (src && dwarf_decl_line(sp_die, &lineno) == 0 &&
1189 (lf->lno_s <= lineno && lf->lno_e >= lineno))
1190 ret = line_range_add_line(src, lineno, lf->lr);
1191 } else
1192 ret = find_line_range_func_decl_lines(lf);
1193
1194 /* Update status */
1195 if (ret >= 0)
1196 if (!list_empty(&lf->lr->line_list))
1197 ret = lf->found = 1;
1198 else
1199 ret = 0; /* Lines are not found */
1200 else {
1201 free(lf->lr->path);
1202 lf->lr->path = NULL;
1203 }
1204 return ret;
1205}
692 1206
693 pp->found = 0; 1207static int line_range_inline_cb(Dwarf_Die *in_die, void *data)
694 while (++cu_number) { 1208{
695 /* Search CU (Compilation Unit) */ 1209 struct dwarf_callback_param *param = data;
696 ret = dwarf_next_cu_header(__dw_debug, NULL, NULL, NULL, 1210
697 &addr_size, &next_cuh, &__dw_error); 1211 param->retval = find_line_range_by_line(in_die, param->data);
698 DIE_IF(ret == DW_DLV_ERROR); 1212 return DWARF_CB_ABORT; /* No need to find other instances */
699 if (ret == DW_DLV_NO_ENTRY) 1213}
1214
1215/* Search function from function name */
1216static int line_range_search_cb(Dwarf_Die *sp_die, void *data)
1217{
1218 struct dwarf_callback_param *param = data;
1219 struct line_finder *lf = param->data;
1220 struct line_range *lr = lf->lr;
1221
1222 if (dwarf_tag(sp_die) == DW_TAG_subprogram &&
1223 die_compare_name(sp_die, lr->function) == 0) {
1224 lf->fname = dwarf_decl_file(sp_die);
1225 dwarf_decl_line(sp_die, &lr->offset);
1226 pr_debug("fname: %s, lineno:%d\n", lf->fname, lr->offset);
1227 lf->lno_s = lr->offset + lr->start;
1228 if (lf->lno_s < 0) /* Overflow */
1229 lf->lno_s = INT_MAX;
1230 lf->lno_e = lr->offset + lr->end;
1231 if (lf->lno_e < 0) /* Overflow */
1232 lf->lno_e = INT_MAX;
1233 pr_debug("New line range: %d to %d\n", lf->lno_s, lf->lno_e);
1234 lr->start = lf->lno_s;
1235 lr->end = lf->lno_e;
1236 if (dwarf_func_inline(sp_die)) {
1237 struct dwarf_callback_param _param;
1238 _param.data = (void *)lf;
1239 _param.retval = 0;
1240 dwarf_func_inline_instances(sp_die,
1241 line_range_inline_cb,
1242 &_param);
1243 param->retval = _param.retval;
1244 } else
1245 param->retval = find_line_range_by_line(sp_die, lf);
1246 return DWARF_CB_ABORT;
1247 }
1248 return DWARF_CB_OK;
1249}
1250
1251static int find_line_range_by_func(struct line_finder *lf)
1252{
1253 struct dwarf_callback_param param = {.data = (void *)lf, .retval = 0};
1254 dwarf_getfuncs(&lf->cu_die, line_range_search_cb, &param, 0);
1255 return param.retval;
1256}
1257
1258int find_line_range(int fd, struct line_range *lr)
1259{
1260 struct line_finder lf = {.lr = lr, .found = 0};
1261 int ret = 0;
1262 Dwarf_Off off = 0, noff;
1263 size_t cuhl;
1264 Dwarf_Die *diep;
1265 Dwarf *dbg;
1266
1267 dbg = dwarf_begin(fd, DWARF_C_READ);
1268 if (!dbg) {
1269 pr_warning("No dwarf info found in the vmlinux - "
1270 "please rebuild with CONFIG_DEBUG_INFO=y.\n");
1271 return -EBADF;
1272 }
1273
1274 /* Loop on CUs (Compilation Unit) */
1275 while (!lf.found && ret >= 0) {
1276 if (dwarf_nextcu(dbg, off, &noff, &cuhl, NULL, NULL, NULL) != 0)
700 break; 1277 break;
701 1278
702 /* Get the DIE(Debugging Information Entry) of this CU */ 1279 /* Get the DIE(Debugging Information Entry) of this CU */
703 ret = dwarf_siblingof(__dw_debug, 0, &pf.cu_die, &__dw_error); 1280 diep = dwarf_offdie(dbg, off + cuhl, &lf.cu_die);
704 DIE_IF(ret != DW_DLV_OK); 1281 if (!diep)
1282 continue;
705 1283
706 /* Check if target file is included. */ 1284 /* Check if target file is included. */
707 if (pp->file) 1285 if (lr->file)
708 pf.fno = cu_find_fileno(pf.cu_die, pp->file); 1286 lf.fname = cu_find_realpath(&lf.cu_die, lr->file);
709 1287 else
710 if (!pp->file || pf.fno) { 1288 lf.fname = 0;
711 /* Save CU base address (for frame_base) */ 1289
712 ret = dwarf_lowpc(pf.cu_die, &pf.cu_base, &__dw_error); 1290 if (!lr->file || lf.fname) {
713 DIE_IF(ret == DW_DLV_ERROR); 1291 if (lr->function)
714 if (ret == DW_DLV_NO_ENTRY) 1292 ret = find_line_range_by_func(&lf);
715 pf.cu_base = 0;
716 if (pp->function)
717 find_by_func(&pf);
718 else { 1293 else {
719 pf.lno = pp->line; 1294 lf.lno_s = lr->start;
720 find_by_line(&pf); 1295 lf.lno_e = lr->end;
1296 ret = find_line_range_by_line(NULL, &lf);
721 } 1297 }
722 } 1298 }
723 dwarf_dealloc(__dw_debug, pf.cu_die, DW_DLA_DIE); 1299 off = noff;
724 } 1300 }
725 ret = dwarf_finish(__dw_debug, &__dw_error); 1301 pr_debug("path: %lx\n", (unsigned long)lr->path);
726 DIE_IF(ret != DW_DLV_OK); 1302 dwarf_end(dbg);
727 1303
728 return pp->found; 1304 return (ret < 0) ? ret : lf.found;
729} 1305}
730 1306
diff --git a/tools/perf/util/probe-finder.h b/tools/perf/util/probe-finder.h
index a4086aaddb73..e1f61dcd18ff 100644
--- a/tools/perf/util/probe-finder.h
+++ b/tools/perf/util/probe-finder.h
@@ -1,6 +1,10 @@
1#ifndef _PROBE_FINDER_H 1#ifndef _PROBE_FINDER_H
2#define _PROBE_FINDER_H 2#define _PROBE_FINDER_H
3 3
4#include <stdbool.h>
5#include "util.h"
6#include "probe-event.h"
7
4#define MAX_PATH_LEN 256 8#define MAX_PATH_LEN 256
5#define MAX_PROBE_BUFFER 1024 9#define MAX_PROBE_BUFFER 1024
6#define MAX_PROBES 128 10#define MAX_PROBES 128
@@ -11,55 +15,54 @@ static inline int is_c_varname(const char *name)
11 return isalpha(name[0]) || name[0] == '_'; 15 return isalpha(name[0]) || name[0] == '_';
12} 16}
13 17
14struct probe_point { 18#ifdef DWARF_SUPPORT
15 char *event; /* Event name */ 19/* Find kprobe_trace_events specified by perf_probe_event from debuginfo */
16 char *group; /* Event group */ 20extern int find_kprobe_trace_events(int fd, struct perf_probe_event *pev,
17 21 struct kprobe_trace_event **tevs,
18 /* Inputs */ 22 int max_tevs);
19 char *file; /* File name */
20 int line; /* Line number */
21 23
22 char *function; /* Function name */ 24/* Find a perf_probe_point from debuginfo */
23 int offset; /* Offset bytes */ 25extern int find_perf_probe_point(int fd, unsigned long addr,
26 struct perf_probe_point *ppt);
24 27
25 int nr_args; /* Number of arguments */ 28extern int find_line_range(int fd, struct line_range *lr);
26 char **args; /* Arguments */
27
28 int retprobe; /* Return probe */
29
30 /* Output */
31 int found; /* Number of found probe points */
32 char *probes[MAX_PROBES]; /* Output buffers (will be allocated)*/
33};
34
35#ifndef NO_LIBDWARF
36extern int find_probepoint(int fd, struct probe_point *pp);
37
38/* Workaround for undefined _MIPS_SZLONG bug in libdwarf.h: */
39#ifndef _MIPS_SZLONG
40# define _MIPS_SZLONG 0
41#endif
42 29
43#include <dwarf.h> 30#include <dwarf.h>
44#include <libdwarf.h> 31#include <libdw.h>
32#include <version.h>
45 33
46struct probe_finder { 34struct probe_finder {
47 struct probe_point *pp; /* Target probe point */ 35 struct perf_probe_event *pev; /* Target probe event */
36 struct kprobe_trace_event *tevs; /* Result trace events */
37 int ntevs; /* Number of trace events */
38 int max_tevs; /* Max number of trace events */
48 39
49 /* For function searching */ 40 /* For function searching */
50 Dwarf_Addr addr; /* Address */ 41 int lno; /* Line number */
51 Dwarf_Unsigned fno; /* File number */ 42 Dwarf_Addr addr; /* Address */
52 Dwarf_Unsigned lno; /* Line number */ 43 const char *fname; /* Real file name */
53 Dwarf_Off inl_offs; /* Inline offset */ 44 Dwarf_Die cu_die; /* Current CU */
54 Dwarf_Die cu_die; /* Current CU */ 45 struct list_head lcache; /* Line cache for lazy match */
55 46
56 /* For variable searching */ 47 /* For variable searching */
57 Dwarf_Addr cu_base; /* Current CU base address */ 48#if _ELFUTILS_PREREQ(0, 142)
58 Dwarf_Locdesc fbloc; /* Location of Current Frame Base */ 49 Dwarf_CFI *cfi; /* Call Frame Information */
59 const char *var; /* Current variable name */ 50#endif
60 char *buf; /* Current output buffer */ 51 Dwarf_Op *fb_ops; /* Frame base attribute */
61 int len; /* Length of output buffer */ 52 struct perf_probe_arg *pvar; /* Current target variable */
53 struct kprobe_trace_arg *tvar; /* Current result variable */
54};
55
56struct line_finder {
57 struct line_range *lr; /* Target line range */
58
59 const char *fname; /* File name */
60 int lno_s; /* Start line number */
61 int lno_e; /* End line number */
62 Dwarf_Die cu_die; /* Current CU */
63 int found;
62}; 64};
63#endif /* NO_LIBDWARF */ 65
66#endif /* DWARF_SUPPORT */
64 67
65#endif /*_PROBE_FINDER_H */ 68#endif /*_PROBE_FINDER_H */
diff --git a/tools/perf/util/pstack.c b/tools/perf/util/pstack.c
new file mode 100644
index 000000000000..13d36faf64eb
--- /dev/null
+++ b/tools/perf/util/pstack.c
@@ -0,0 +1,75 @@
1/*
2 * Simple pointer stack
3 *
4 * (c) 2010 Arnaldo Carvalho de Melo <acme@redhat.com>
5 */
6
7#include "util.h"
8#include "pstack.h"
9#include <linux/kernel.h>
10#include <stdlib.h>
11
12struct pstack {
13 unsigned short top;
14 unsigned short max_nr_entries;
15 void *entries[0];
16};
17
18struct pstack *pstack__new(unsigned short max_nr_entries)
19{
20 struct pstack *self = zalloc((sizeof(*self) +
21 max_nr_entries * sizeof(void *)));
22 if (self != NULL)
23 self->max_nr_entries = max_nr_entries;
24 return self;
25}
26
27void pstack__delete(struct pstack *self)
28{
29 free(self);
30}
31
32bool pstack__empty(const struct pstack *self)
33{
34 return self->top == 0;
35}
36
37void pstack__remove(struct pstack *self, void *key)
38{
39 unsigned short i = self->top, last_index = self->top - 1;
40
41 while (i-- != 0) {
42 if (self->entries[i] == key) {
43 if (i < last_index)
44 memmove(self->entries + i,
45 self->entries + i + 1,
46 (last_index - i) * sizeof(void *));
47 --self->top;
48 return;
49 }
50 }
51 pr_err("%s: %p not on the pstack!\n", __func__, key);
52}
53
54void pstack__push(struct pstack *self, void *key)
55{
56 if (self->top == self->max_nr_entries) {
57 pr_err("%s: top=%d, overflow!\n", __func__, self->top);
58 return;
59 }
60 self->entries[self->top++] = key;
61}
62
63void *pstack__pop(struct pstack *self)
64{
65 void *ret;
66
67 if (self->top == 0) {
68 pr_err("%s: underflow!\n", __func__);
69 return NULL;
70 }
71
72 ret = self->entries[--self->top];
73 self->entries[self->top] = NULL;
74 return ret;
75}
diff --git a/tools/perf/util/pstack.h b/tools/perf/util/pstack.h
new file mode 100644
index 000000000000..5ad07023504b
--- /dev/null
+++ b/tools/perf/util/pstack.h
@@ -0,0 +1,12 @@
1#ifndef _PERF_PSTACK_
2#define _PERF_PSTACK_
3
4struct pstack;
5struct pstack *pstack__new(unsigned short max_nr_entries);
6void pstack__delete(struct pstack *self);
7bool pstack__empty(const struct pstack *self);
8void pstack__remove(struct pstack *self, void *key);
9void pstack__push(struct pstack *self, void *key);
10void *pstack__pop(struct pstack *self);
11
12#endif /* _PERF_PSTACK_ */
diff --git a/tools/perf/util/quote.c b/tools/perf/util/quote.c
index 2726fe40eb5d..01f03242b86a 100644
--- a/tools/perf/util/quote.c
+++ b/tools/perf/util/quote.c
@@ -1,8 +1,6 @@
1#include "cache.h" 1#include "cache.h"
2#include "quote.h" 2#include "quote.h"
3 3
4int quote_path_fully = 1;
5
6/* Help to copy the thing properly quoted for the shell safety. 4/* Help to copy the thing properly quoted for the shell safety.
7 * any single quote is replaced with '\'', any exclamation point 5 * any single quote is replaced with '\'', any exclamation point
8 * is replaced with '\!', and the whole thing is enclosed in a 6 * is replaced with '\!', and the whole thing is enclosed in a
@@ -19,7 +17,7 @@ static inline int need_bs_quote(char c)
19 return (c == '\'' || c == '!'); 17 return (c == '\'' || c == '!');
20} 18}
21 19
22void sq_quote_buf(struct strbuf *dst, const char *src) 20static void sq_quote_buf(struct strbuf *dst, const char *src)
23{ 21{
24 char *to_free = NULL; 22 char *to_free = NULL;
25 23
@@ -41,23 +39,6 @@ void sq_quote_buf(struct strbuf *dst, const char *src)
41 free(to_free); 39 free(to_free);
42} 40}
43 41
44void sq_quote_print(FILE *stream, const char *src)
45{
46 char c;
47
48 fputc('\'', stream);
49 while ((c = *src++)) {
50 if (need_bs_quote(c)) {
51 fputs("'\\", stream);
52 fputc(c, stream);
53 fputc('\'', stream);
54 } else {
55 fputc(c, stream);
56 }
57 }
58 fputc('\'', stream);
59}
60
61void sq_quote_argv(struct strbuf *dst, const char** argv, size_t maxlen) 42void sq_quote_argv(struct strbuf *dst, const char** argv, size_t maxlen)
62{ 43{
63 int i; 44 int i;
@@ -71,415 +52,3 @@ void sq_quote_argv(struct strbuf *dst, const char** argv, size_t maxlen)
71 die("Too many or long arguments"); 52 die("Too many or long arguments");
72 } 53 }
73} 54}
74
75char *sq_dequote_step(char *arg, char **next)
76{
77 char *dst = arg;
78 char *src = arg;
79 char c;
80
81 if (*src != '\'')
82 return NULL;
83 for (;;) {
84 c = *++src;
85 if (!c)
86 return NULL;
87 if (c != '\'') {
88 *dst++ = c;
89 continue;
90 }
91 /* We stepped out of sq */
92 switch (*++src) {
93 case '\0':
94 *dst = 0;
95 if (next)
96 *next = NULL;
97 return arg;
98 case '\\':
99 c = *++src;
100 if (need_bs_quote(c) && *++src == '\'') {
101 *dst++ = c;
102 continue;
103 }
104 /* Fallthrough */
105 default:
106 if (!next || !isspace(*src))
107 return NULL;
108 do {
109 c = *++src;
110 } while (isspace(c));
111 *dst = 0;
112 *next = src;
113 return arg;
114 }
115 }
116}
117
118char *sq_dequote(char *arg)
119{
120 return sq_dequote_step(arg, NULL);
121}
122
123int sq_dequote_to_argv(char *arg, const char ***argv, int *nr, int *alloc)
124{
125 char *next = arg;
126
127 if (!*arg)
128 return 0;
129 do {
130 char *dequoted = sq_dequote_step(next, &next);
131 if (!dequoted)
132 return -1;
133 ALLOC_GROW(*argv, *nr + 1, *alloc);
134 (*argv)[(*nr)++] = dequoted;
135 } while (next);
136
137 return 0;
138}
139
140/* 1 means: quote as octal
141 * 0 means: quote as octal if (quote_path_fully)
142 * -1 means: never quote
143 * c: quote as "\\c"
144 */
145#define X8(x) x, x, x, x, x, x, x, x
146#define X16(x) X8(x), X8(x)
147static signed char const sq_lookup[256] = {
148 /* 0 1 2 3 4 5 6 7 */
149 /* 0x00 */ 1, 1, 1, 1, 1, 1, 1, 'a',
150 /* 0x08 */ 'b', 't', 'n', 'v', 'f', 'r', 1, 1,
151 /* 0x10 */ X16(1),
152 /* 0x20 */ -1, -1, '"', -1, -1, -1, -1, -1,
153 /* 0x28 */ X16(-1), X16(-1), X16(-1),
154 /* 0x58 */ -1, -1, -1, -1,'\\', -1, -1, -1,
155 /* 0x60 */ X16(-1), X8(-1),
156 /* 0x78 */ -1, -1, -1, -1, -1, -1, -1, 1,
157 /* 0x80 */ /* set to 0 */
158};
159
160static inline int sq_must_quote(char c)
161{
162 return sq_lookup[(unsigned char)c] + quote_path_fully > 0;
163}
164
165/*
166 * Returns the longest prefix not needing a quote up to maxlen if
167 * positive.
168 * This stops at the first \0 because it's marked as a character
169 * needing an escape.
170 */
171static ssize_t next_quote_pos(const char *s, ssize_t maxlen)
172{
173 ssize_t len;
174
175 if (maxlen < 0) {
176 for (len = 0; !sq_must_quote(s[len]); len++);
177 } else {
178 for (len = 0; len < maxlen && !sq_must_quote(s[len]); len++);
179 }
180 return len;
181}
182
183/*
184 * C-style name quoting.
185 *
186 * (1) if sb and fp are both NULL, inspect the input name and counts the
187 * number of bytes that are needed to hold c_style quoted version of name,
188 * counting the double quotes around it but not terminating NUL, and
189 * returns it.
190 * However, if name does not need c_style quoting, it returns 0.
191 *
192 * (2) if sb or fp are not NULL, it emits the c_style quoted version
193 * of name, enclosed with double quotes if asked and needed only.
194 * Return value is the same as in (1).
195 */
196static size_t quote_c_style_counted(const char *name, ssize_t maxlen,
197 struct strbuf *sb, FILE *fp, int no_dq)
198{
199#define EMIT(c) \
200 do { \
201 if (sb) strbuf_addch(sb, (c)); \
202 if (fp) fputc((c), fp); \
203 count++; \
204 } while (0)
205
206#define EMITBUF(s, l) \
207 do { \
208 int __ret; \
209 if (sb) strbuf_add(sb, (s), (l)); \
210 if (fp) __ret = fwrite((s), (l), 1, fp); \
211 count += (l); \
212 } while (0)
213
214 ssize_t len, count = 0;
215 const char *p = name;
216
217 for (;;) {
218 int ch;
219
220 len = next_quote_pos(p, maxlen);
221 if (len == maxlen || !p[len])
222 break;
223
224 if (!no_dq && p == name)
225 EMIT('"');
226
227 EMITBUF(p, len);
228 EMIT('\\');
229 p += len;
230 ch = (unsigned char)*p++;
231 if (sq_lookup[ch] >= ' ') {
232 EMIT(sq_lookup[ch]);
233 } else {
234 EMIT(((ch >> 6) & 03) + '0');
235 EMIT(((ch >> 3) & 07) + '0');
236 EMIT(((ch >> 0) & 07) + '0');
237 }
238 }
239
240 EMITBUF(p, len);
241 if (p == name) /* no ending quote needed */
242 return 0;
243
244 if (!no_dq)
245 EMIT('"');
246 return count;
247}
248
249size_t quote_c_style(const char *name, struct strbuf *sb, FILE *fp, int nodq)
250{
251 return quote_c_style_counted(name, -1, sb, fp, nodq);
252}
253
254void quote_two_c_style(struct strbuf *sb, const char *prefix, const char *path, int nodq)
255{
256 if (quote_c_style(prefix, NULL, NULL, 0) ||
257 quote_c_style(path, NULL, NULL, 0)) {
258 if (!nodq)
259 strbuf_addch(sb, '"');
260 quote_c_style(prefix, sb, NULL, 1);
261 quote_c_style(path, sb, NULL, 1);
262 if (!nodq)
263 strbuf_addch(sb, '"');
264 } else {
265 strbuf_addstr(sb, prefix);
266 strbuf_addstr(sb, path);
267 }
268}
269
270void write_name_quoted(const char *name, FILE *fp, int terminator)
271{
272 if (terminator) {
273 quote_c_style(name, NULL, fp, 0);
274 } else {
275 fputs(name, fp);
276 }
277 fputc(terminator, fp);
278}
279
280void write_name_quotedpfx(const char *pfx, ssize_t pfxlen,
281 const char *name, FILE *fp, int terminator)
282{
283 int needquote = 0;
284
285 if (terminator) {
286 needquote = next_quote_pos(pfx, pfxlen) < pfxlen
287 || name[next_quote_pos(name, -1)];
288 }
289 if (needquote) {
290 fputc('"', fp);
291 quote_c_style_counted(pfx, pfxlen, NULL, fp, 1);
292 quote_c_style(name, NULL, fp, 1);
293 fputc('"', fp);
294 } else {
295 int ret;
296
297 ret = fwrite(pfx, pfxlen, 1, fp);
298 fputs(name, fp);
299 }
300 fputc(terminator, fp);
301}
302
303/* quote path as relative to the given prefix */
304char *quote_path_relative(const char *in, int len,
305 struct strbuf *out, const char *prefix)
306{
307 int needquote;
308
309 if (len < 0)
310 len = strlen(in);
311
312 /* "../" prefix itself does not need quoting, but "in" might. */
313 needquote = (next_quote_pos(in, len) < len);
314 strbuf_setlen(out, 0);
315 strbuf_grow(out, len);
316
317 if (needquote)
318 strbuf_addch(out, '"');
319 if (prefix) {
320 int off = 0;
321 while (off < len && prefix[off] && prefix[off] == in[off])
322 if (prefix[off] == '/') {
323 prefix += off + 1;
324 in += off + 1;
325 len -= off + 1;
326 off = 0;
327 } else
328 off++;
329
330 for (; *prefix; prefix++)
331 if (*prefix == '/')
332 strbuf_addstr(out, "../");
333 }
334
335 quote_c_style_counted (in, len, out, NULL, 1);
336
337 if (needquote)
338 strbuf_addch(out, '"');
339 if (!out->len)
340 strbuf_addstr(out, "./");
341
342 return out->buf;
343}
344
345/*
346 * C-style name unquoting.
347 *
348 * Quoted should point at the opening double quote.
349 * + Returns 0 if it was able to unquote the string properly, and appends the
350 * result in the strbuf `sb'.
351 * + Returns -1 in case of error, and doesn't touch the strbuf. Though note
352 * that this function will allocate memory in the strbuf, so calling
353 * strbuf_release is mandatory whichever result unquote_c_style returns.
354 *
355 * Updates endp pointer to point at one past the ending double quote if given.
356 */
357int unquote_c_style(struct strbuf *sb, const char *quoted, const char **endp)
358{
359 size_t oldlen = sb->len, len;
360 int ch, ac;
361
362 if (*quoted++ != '"')
363 return -1;
364
365 for (;;) {
366 len = strcspn(quoted, "\"\\");
367 strbuf_add(sb, quoted, len);
368 quoted += len;
369
370 switch (*quoted++) {
371 case '"':
372 if (endp)
373 *endp = quoted;
374 return 0;
375 case '\\':
376 break;
377 default:
378 goto error;
379 }
380
381 switch ((ch = *quoted++)) {
382 case 'a': ch = '\a'; break;
383 case 'b': ch = '\b'; break;
384 case 'f': ch = '\f'; break;
385 case 'n': ch = '\n'; break;
386 case 'r': ch = '\r'; break;
387 case 't': ch = '\t'; break;
388 case 'v': ch = '\v'; break;
389
390 case '\\': case '"':
391 break; /* verbatim */
392
393 /* octal values with first digit over 4 overflow */
394 case '0': case '1': case '2': case '3':
395 ac = ((ch - '0') << 6);
396 if ((ch = *quoted++) < '0' || '7' < ch)
397 goto error;
398 ac |= ((ch - '0') << 3);
399 if ((ch = *quoted++) < '0' || '7' < ch)
400 goto error;
401 ac |= (ch - '0');
402 ch = ac;
403 break;
404 default:
405 goto error;
406 }
407 strbuf_addch(sb, ch);
408 }
409
410 error:
411 strbuf_setlen(sb, oldlen);
412 return -1;
413}
414
415/* quoting as a string literal for other languages */
416
417void perl_quote_print(FILE *stream, const char *src)
418{
419 const char sq = '\'';
420 const char bq = '\\';
421 char c;
422
423 fputc(sq, stream);
424 while ((c = *src++)) {
425 if (c == sq || c == bq)
426 fputc(bq, stream);
427 fputc(c, stream);
428 }
429 fputc(sq, stream);
430}
431
432void python_quote_print(FILE *stream, const char *src)
433{
434 const char sq = '\'';
435 const char bq = '\\';
436 const char nl = '\n';
437 char c;
438
439 fputc(sq, stream);
440 while ((c = *src++)) {
441 if (c == nl) {
442 fputc(bq, stream);
443 fputc('n', stream);
444 continue;
445 }
446 if (c == sq || c == bq)
447 fputc(bq, stream);
448 fputc(c, stream);
449 }
450 fputc(sq, stream);
451}
452
453void tcl_quote_print(FILE *stream, const char *src)
454{
455 char c;
456
457 fputc('"', stream);
458 while ((c = *src++)) {
459 switch (c) {
460 case '[': case ']':
461 case '{': case '}':
462 case '$': case '\\': case '"':
463 fputc('\\', stream);
464 default:
465 fputc(c, stream);
466 break;
467 case '\f':
468 fputs("\\f", stream);
469 break;
470 case '\r':
471 fputs("\\r", stream);
472 break;
473 case '\n':
474 fputs("\\n", stream);
475 break;
476 case '\t':
477 fputs("\\t", stream);
478 break;
479 case '\v':
480 fputs("\\v", stream);
481 break;
482 }
483 }
484 fputc('"', stream);
485}
diff --git a/tools/perf/util/quote.h b/tools/perf/util/quote.h
index b6a019733919..172889ea234f 100644
--- a/tools/perf/util/quote.h
+++ b/tools/perf/util/quote.h
@@ -22,47 +22,8 @@
22 * 22 *
23 * Note that the above examples leak memory! Remember to free result from 23 * Note that the above examples leak memory! Remember to free result from
24 * sq_quote() in a real application. 24 * sq_quote() in a real application.
25 *
26 * sq_quote_buf() writes to an existing buffer of specified size; it
27 * will return the number of characters that would have been written
28 * excluding the final null regardless of the buffer size.
29 */ 25 */
30 26
31extern void sq_quote_print(FILE *stream, const char *src);
32
33extern void sq_quote_buf(struct strbuf *, const char *src);
34extern void sq_quote_argv(struct strbuf *, const char **argv, size_t maxlen); 27extern void sq_quote_argv(struct strbuf *, const char **argv, size_t maxlen);
35 28
36/* This unwraps what sq_quote() produces in place, but returns
37 * NULL if the input does not look like what sq_quote would have
38 * produced.
39 */
40extern char *sq_dequote(char *);
41
42/*
43 * Same as the above, but can be used to unwrap many arguments in the
44 * same string separated by space. "next" is changed to point to the
45 * next argument that should be passed as first parameter. When there
46 * is no more argument to be dequoted, "next" is updated to point to NULL.
47 */
48extern char *sq_dequote_step(char *arg, char **next);
49extern int sq_dequote_to_argv(char *arg, const char ***argv, int *nr, int *alloc);
50
51extern int unquote_c_style(struct strbuf *, const char *quoted, const char **endp);
52extern size_t quote_c_style(const char *name, struct strbuf *, FILE *, int no_dq);
53extern void quote_two_c_style(struct strbuf *, const char *, const char *, int);
54
55extern void write_name_quoted(const char *name, FILE *, int terminator);
56extern void write_name_quotedpfx(const char *pfx, ssize_t pfxlen,
57 const char *name, FILE *, int terminator);
58
59/* quote path as relative to the given prefix */
60char *quote_path_relative(const char *in, int len,
61 struct strbuf *out, const char *prefix);
62
63/* quoting as a string literal for other languages */
64extern void perl_quote_print(FILE *stream, const char *src);
65extern void python_quote_print(FILE *stream, const char *src);
66extern void tcl_quote_print(FILE *stream, const char *src);
67
68#endif /* __PERF_QUOTE_H */ 29#endif /* __PERF_QUOTE_H */
diff --git a/tools/perf/util/run-command.c b/tools/perf/util/run-command.c
index 2b615acf94d7..da8e9b285f51 100644
--- a/tools/perf/util/run-command.c
+++ b/tools/perf/util/run-command.c
@@ -212,93 +212,3 @@ int run_command_v_opt(const char **argv, int opt)
212 prepare_run_command_v_opt(&cmd, argv, opt); 212 prepare_run_command_v_opt(&cmd, argv, opt);
213 return run_command(&cmd); 213 return run_command(&cmd);
214} 214}
215
216int run_command_v_opt_cd_env(const char **argv, int opt, const char *dir, const char *const *env)
217{
218 struct child_process cmd;
219 prepare_run_command_v_opt(&cmd, argv, opt);
220 cmd.dir = dir;
221 cmd.env = env;
222 return run_command(&cmd);
223}
224
225int start_async(struct async *async)
226{
227 int pipe_out[2];
228
229 if (pipe(pipe_out) < 0)
230 return error("cannot create pipe: %s", strerror(errno));
231 async->out = pipe_out[0];
232
233 /* Flush stdio before fork() to avoid cloning buffers */
234 fflush(NULL);
235
236 async->pid = fork();
237 if (async->pid < 0) {
238 error("fork (async) failed: %s", strerror(errno));
239 close_pair(pipe_out);
240 return -1;
241 }
242 if (!async->pid) {
243 close(pipe_out[0]);
244 exit(!!async->proc(pipe_out[1], async->data));
245 }
246 close(pipe_out[1]);
247
248 return 0;
249}
250
251int finish_async(struct async *async)
252{
253 int ret = 0;
254
255 if (wait_or_whine(async->pid))
256 ret = error("waitpid (async) failed");
257
258 return ret;
259}
260
261int run_hook(const char *index_file, const char *name, ...)
262{
263 struct child_process hook;
264 const char **argv = NULL, *env[2];
265 char idx[PATH_MAX];
266 va_list args;
267 int ret;
268 size_t i = 0, alloc = 0;
269
270 if (access(perf_path("hooks/%s", name), X_OK) < 0)
271 return 0;
272
273 va_start(args, name);
274 ALLOC_GROW(argv, i + 1, alloc);
275 argv[i++] = perf_path("hooks/%s", name);
276 while (argv[i-1]) {
277 ALLOC_GROW(argv, i + 1, alloc);
278 argv[i++] = va_arg(args, const char *);
279 }
280 va_end(args);
281
282 memset(&hook, 0, sizeof(hook));
283 hook.argv = argv;
284 hook.no_stdin = 1;
285 hook.stdout_to_stderr = 1;
286 if (index_file) {
287 snprintf(idx, sizeof(idx), "PERF_INDEX_FILE=%s", index_file);
288 env[0] = idx;
289 env[1] = NULL;
290 hook.env = env;
291 }
292
293 ret = start_command(&hook);
294 free(argv);
295 if (ret) {
296 warning("Could not spawn %s", argv[0]);
297 return ret;
298 }
299 ret = finish_command(&hook);
300 if (ret == -ERR_RUN_COMMAND_WAITPID_SIGNAL)
301 warning("%s exited due to uncaught signal", argv[0]);
302
303 return ret;
304}
diff --git a/tools/perf/util/run-command.h b/tools/perf/util/run-command.h
index d79028727ce2..1ef264d5069c 100644
--- a/tools/perf/util/run-command.h
+++ b/tools/perf/util/run-command.h
@@ -50,39 +50,9 @@ int start_command(struct child_process *);
50int finish_command(struct child_process *); 50int finish_command(struct child_process *);
51int run_command(struct child_process *); 51int run_command(struct child_process *);
52 52
53extern int run_hook(const char *index_file, const char *name, ...);
54
55#define RUN_COMMAND_NO_STDIN 1 53#define RUN_COMMAND_NO_STDIN 1
56#define RUN_PERF_CMD 2 /*If this is to be perf sub-command */ 54#define RUN_PERF_CMD 2 /*If this is to be perf sub-command */
57#define RUN_COMMAND_STDOUT_TO_STDERR 4 55#define RUN_COMMAND_STDOUT_TO_STDERR 4
58int run_command_v_opt(const char **argv, int opt); 56int run_command_v_opt(const char **argv, int opt);
59 57
60/*
61 * env (the environment) is to be formatted like environ: "VAR=VALUE".
62 * To unset an environment variable use just "VAR".
63 */
64int run_command_v_opt_cd_env(const char **argv, int opt, const char *dir, const char *const *env);
65
66/*
67 * The purpose of the following functions is to feed a pipe by running
68 * a function asynchronously and providing output that the caller reads.
69 *
70 * It is expected that no synchronization and mutual exclusion between
71 * the caller and the feed function is necessary so that the function
72 * can run in a thread without interfering with the caller.
73 */
74struct async {
75 /*
76 * proc writes to fd and closes it;
77 * returns 0 on success, non-zero on failure
78 */
79 int (*proc)(int fd, void *data);
80 void *data;
81 int out; /* caller reads from here and closes it */
82 pid_t pid;
83};
84
85int start_async(struct async *async);
86int finish_async(struct async *async);
87
88#endif /* __PERF_RUN_COMMAND_H */ 58#endif /* __PERF_RUN_COMMAND_H */
diff --git a/tools/perf/util/trace-event-perl.c b/tools/perf/util/scripting-engines/trace-event-perl.c
index 6d6d76b8a21e..b059dc50cc2d 100644
--- a/tools/perf/util/trace-event-perl.c
+++ b/tools/perf/util/scripting-engines/trace-event-perl.c
@@ -25,10 +25,16 @@
25#include <ctype.h> 25#include <ctype.h>
26#include <errno.h> 26#include <errno.h>
27 27
28#include "../perf.h" 28#include "../../perf.h"
29#include "util.h" 29#include "../util.h"
30#include "trace-event.h" 30#include "../trace-event.h"
31#include "trace-event-perl.h" 31
32#include <EXTERN.h>
33#include <perl.h>
34
35void boot_Perf__Trace__Context(pTHX_ CV *cv);
36void boot_DynaLoader(pTHX_ CV *cv);
37typedef PerlInterpreter * INTERP;
32 38
33void xs_init(pTHX); 39void xs_init(pTHX);
34 40
@@ -49,7 +55,7 @@ INTERP my_perl;
49 55
50struct event *events[FTRACE_MAX_EVENT]; 56struct event *events[FTRACE_MAX_EVENT];
51 57
52static struct scripting_context *scripting_context; 58extern struct scripting_context *scripting_context;
53 59
54static char *cur_field_name; 60static char *cur_field_name;
55static int zero_flag_atom; 61static int zero_flag_atom;
@@ -239,33 +245,6 @@ static inline struct event *find_cache_event(int type)
239 return event; 245 return event;
240} 246}
241 247
242int common_pc(struct scripting_context *context)
243{
244 int pc;
245
246 pc = parse_common_pc(context->event_data);
247
248 return pc;
249}
250
251int common_flags(struct scripting_context *context)
252{
253 int flags;
254
255 flags = parse_common_flags(context->event_data);
256
257 return flags;
258}
259
260int common_lock_depth(struct scripting_context *context)
261{
262 int lock_depth;
263
264 lock_depth = parse_common_lock_depth(context->event_data);
265
266 return lock_depth;
267}
268
269static void perl_process_event(int cpu, void *data, 248static void perl_process_event(int cpu, void *data,
270 int size __unused, 249 int size __unused,
271 unsigned long long nsecs, char *comm) 250 unsigned long long nsecs, char *comm)
@@ -392,7 +371,6 @@ static int perl_start_script(const char *script, int argc, const char **argv)
392 run_start_sub(); 371 run_start_sub();
393 372
394 free(command_line); 373 free(command_line);
395 fprintf(stderr, "perf trace started with Perl script %s\n\n", script);
396 return 0; 374 return 0;
397error: 375error:
398 perl_free(my_perl); 376 perl_free(my_perl);
@@ -415,8 +393,6 @@ static int perl_stop_script(void)
415 perl_destruct(my_perl); 393 perl_destruct(my_perl);
416 perl_free(my_perl); 394 perl_free(my_perl);
417 395
418 fprintf(stderr, "\nperf trace Perl script stopped\n");
419
420 return 0; 396 return 0;
421} 397}
422 398
@@ -587,75 +563,3 @@ struct scripting_ops perl_scripting_ops = {
587 .process_event = perl_process_event, 563 .process_event = perl_process_event,
588 .generate_script = perl_generate_script, 564 .generate_script = perl_generate_script,
589}; 565};
590
591static void print_unsupported_msg(void)
592{
593 fprintf(stderr, "Perl scripting not supported."
594 " Install libperl and rebuild perf to enable it.\n"
595 "For example:\n # apt-get install libperl-dev (ubuntu)"
596 "\n # yum install perl-ExtUtils-Embed (Fedora)"
597 "\n etc.\n");
598}
599
600static int perl_start_script_unsupported(const char *script __unused,
601 int argc __unused,
602 const char **argv __unused)
603{
604 print_unsupported_msg();
605
606 return -1;
607}
608
609static int perl_stop_script_unsupported(void)
610{
611 return 0;
612}
613
614static void perl_process_event_unsupported(int cpu __unused,
615 void *data __unused,
616 int size __unused,
617 unsigned long long nsecs __unused,
618 char *comm __unused)
619{
620}
621
622static int perl_generate_script_unsupported(const char *outfile __unused)
623{
624 print_unsupported_msg();
625
626 return -1;
627}
628
629struct scripting_ops perl_scripting_unsupported_ops = {
630 .name = "Perl",
631 .start_script = perl_start_script_unsupported,
632 .stop_script = perl_stop_script_unsupported,
633 .process_event = perl_process_event_unsupported,
634 .generate_script = perl_generate_script_unsupported,
635};
636
637static void register_perl_scripting(struct scripting_ops *scripting_ops)
638{
639 int err;
640 err = script_spec_register("Perl", scripting_ops);
641 if (err)
642 die("error registering Perl script extension");
643
644 err = script_spec_register("pl", scripting_ops);
645 if (err)
646 die("error registering pl script extension");
647
648 scripting_context = malloc(sizeof(struct scripting_context));
649}
650
651#ifdef NO_LIBPERL
652void setup_perl_scripting(void)
653{
654 register_perl_scripting(&perl_scripting_unsupported_ops);
655}
656#else
657void setup_perl_scripting(void)
658{
659 register_perl_scripting(&perl_scripting_ops);
660}
661#endif
diff --git a/tools/perf/util/scripting-engines/trace-event-python.c b/tools/perf/util/scripting-engines/trace-event-python.c
new file mode 100644
index 000000000000..33a632523743
--- /dev/null
+++ b/tools/perf/util/scripting-engines/trace-event-python.c
@@ -0,0 +1,594 @@
1/*
2 * trace-event-python. Feed trace events to an embedded Python interpreter.
3 *
4 * Copyright (C) 2010 Tom Zanussi <tzanussi@gmail.com>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 *
20 */
21
22#include <Python.h>
23
24#include <stdio.h>
25#include <stdlib.h>
26#include <string.h>
27#include <ctype.h>
28#include <errno.h>
29
30#include "../../perf.h"
31#include "../util.h"
32#include "../trace-event.h"
33
34PyMODINIT_FUNC initperf_trace_context(void);
35
36#define FTRACE_MAX_EVENT \
37 ((1 << (sizeof(unsigned short) * 8)) - 1)
38
39struct event *events[FTRACE_MAX_EVENT];
40
41#define MAX_FIELDS 64
42#define N_COMMON_FIELDS 7
43
44extern struct scripting_context *scripting_context;
45
46static char *cur_field_name;
47static int zero_flag_atom;
48
49static PyObject *main_module, *main_dict;
50
/*
 * Abort after a Python handler call failed.
 *
 * Prints the pending Python exception, then raises a fatal interpreter
 * error.  @handler_name is accepted from callers but is not used here.
 */
static void handler_call_die(const char *handler_name)
{
	PyErr_Print();
	Py_FatalError("problem in Python trace event handler");
}
56
57static void define_value(enum print_arg_type field_type,
58 const char *ev_name,
59 const char *field_name,
60 const char *field_value,
61 const char *field_str)
62{
63 const char *handler_name = "define_flag_value";
64 PyObject *handler, *t, *retval;
65 unsigned long long value;
66 unsigned n = 0;
67
68 if (field_type == PRINT_SYMBOL)
69 handler_name = "define_symbolic_value";
70
71 t = PyTuple_New(4);
72 if (!t)
73 Py_FatalError("couldn't create Python tuple");
74
75 value = eval_flag(field_value);
76
77 PyTuple_SetItem(t, n++, PyString_FromString(ev_name));
78 PyTuple_SetItem(t, n++, PyString_FromString(field_name));
79 PyTuple_SetItem(t, n++, PyInt_FromLong(value));
80 PyTuple_SetItem(t, n++, PyString_FromString(field_str));
81
82 handler = PyDict_GetItemString(main_dict, handler_name);
83 if (handler && PyCallable_Check(handler)) {
84 retval = PyObject_CallObject(handler, t);
85 if (retval == NULL)
86 handler_call_die(handler_name);
87 }
88
89 Py_DECREF(t);
90}
91
92static void define_values(enum print_arg_type field_type,
93 struct print_flag_sym *field,
94 const char *ev_name,
95 const char *field_name)
96{
97 define_value(field_type, ev_name, field_name, field->value,
98 field->str);
99
100 if (field->next)
101 define_values(field_type, field->next, ev_name, field_name);
102}
103
104static void define_field(enum print_arg_type field_type,
105 const char *ev_name,
106 const char *field_name,
107 const char *delim)
108{
109 const char *handler_name = "define_flag_field";
110 PyObject *handler, *t, *retval;
111 unsigned n = 0;
112
113 if (field_type == PRINT_SYMBOL)
114 handler_name = "define_symbolic_field";
115
116 if (field_type == PRINT_FLAGS)
117 t = PyTuple_New(3);
118 else
119 t = PyTuple_New(2);
120 if (!t)
121 Py_FatalError("couldn't create Python tuple");
122
123 PyTuple_SetItem(t, n++, PyString_FromString(ev_name));
124 PyTuple_SetItem(t, n++, PyString_FromString(field_name));
125 if (field_type == PRINT_FLAGS)
126 PyTuple_SetItem(t, n++, PyString_FromString(delim));
127
128 handler = PyDict_GetItemString(main_dict, handler_name);
129 if (handler && PyCallable_Check(handler)) {
130 retval = PyObject_CallObject(handler, t);
131 if (retval == NULL)
132 handler_call_die(handler_name);
133 }
134
135 Py_DECREF(t);
136}
137
138static void define_event_symbols(struct event *event,
139 const char *ev_name,
140 struct print_arg *args)
141{
142 switch (args->type) {
143 case PRINT_NULL:
144 break;
145 case PRINT_ATOM:
146 define_value(PRINT_FLAGS, ev_name, cur_field_name, "0",
147 args->atom.atom);
148 zero_flag_atom = 0;
149 break;
150 case PRINT_FIELD:
151 if (cur_field_name)
152 free(cur_field_name);
153 cur_field_name = strdup(args->field.name);
154 break;
155 case PRINT_FLAGS:
156 define_event_symbols(event, ev_name, args->flags.field);
157 define_field(PRINT_FLAGS, ev_name, cur_field_name,
158 args->flags.delim);
159 define_values(PRINT_FLAGS, args->flags.flags, ev_name,
160 cur_field_name);
161 break;
162 case PRINT_SYMBOL:
163 define_event_symbols(event, ev_name, args->symbol.field);
164 define_field(PRINT_SYMBOL, ev_name, cur_field_name, NULL);
165 define_values(PRINT_SYMBOL, args->symbol.symbols, ev_name,
166 cur_field_name);
167 break;
168 case PRINT_STRING:
169 break;
170 case PRINT_TYPE:
171 define_event_symbols(event, ev_name, args->typecast.item);
172 break;
173 case PRINT_OP:
174 if (strcmp(args->op.op, ":") == 0)
175 zero_flag_atom = 1;
176 define_event_symbols(event, ev_name, args->op.left);
177 define_event_symbols(event, ev_name, args->op.right);
178 break;
179 default:
180 /* we should warn... */
181 return;
182 }
183
184 if (args->next)
185 define_event_symbols(event, ev_name, args->next);
186}
187
188static inline struct event *find_cache_event(int type)
189{
190 static char ev_name[256];
191 struct event *event;
192
193 if (events[type])
194 return events[type];
195
196 events[type] = event = trace_find_event(type);
197 if (!event)
198 return NULL;
199
200 sprintf(ev_name, "%s__%s", event->system, event->name);
201
202 define_event_symbols(event, ev_name, event->print_fmt.args);
203
204 return event;
205}
206
207static void python_process_event(int cpu, void *data,
208 int size __unused,
209 unsigned long long nsecs, char *comm)
210{
211 PyObject *handler, *retval, *context, *t, *obj, *dict = NULL;
212 static char handler_name[256];
213 struct format_field *field;
214 unsigned long long val;
215 unsigned long s, ns;
216 struct event *event;
217 unsigned n = 0;
218 int type;
219 int pid;
220
221 t = PyTuple_New(MAX_FIELDS);
222 if (!t)
223 Py_FatalError("couldn't create Python tuple");
224
225 type = trace_parse_common_type(data);
226
227 event = find_cache_event(type);
228 if (!event)
229 die("ug! no event found for type %d", type);
230
231 pid = trace_parse_common_pid(data);
232
233 sprintf(handler_name, "%s__%s", event->system, event->name);
234
235 handler = PyDict_GetItemString(main_dict, handler_name);
236 if (handler && !PyCallable_Check(handler))
237 handler = NULL;
238 if (!handler) {
239 dict = PyDict_New();
240 if (!dict)
241 Py_FatalError("couldn't create Python dict");
242 }
243 s = nsecs / NSECS_PER_SEC;
244 ns = nsecs - s * NSECS_PER_SEC;
245
246 scripting_context->event_data = data;
247
248 context = PyCObject_FromVoidPtr(scripting_context, NULL);
249
250 PyTuple_SetItem(t, n++, PyString_FromString(handler_name));
251 PyTuple_SetItem(t, n++,
252 PyCObject_FromVoidPtr(scripting_context, NULL));
253
254 if (handler) {
255 PyTuple_SetItem(t, n++, PyInt_FromLong(cpu));
256 PyTuple_SetItem(t, n++, PyInt_FromLong(s));
257 PyTuple_SetItem(t, n++, PyInt_FromLong(ns));
258 PyTuple_SetItem(t, n++, PyInt_FromLong(pid));
259 PyTuple_SetItem(t, n++, PyString_FromString(comm));
260 } else {
261 PyDict_SetItemString(dict, "common_cpu", PyInt_FromLong(cpu));
262 PyDict_SetItemString(dict, "common_s", PyInt_FromLong(s));
263 PyDict_SetItemString(dict, "common_ns", PyInt_FromLong(ns));
264 PyDict_SetItemString(dict, "common_pid", PyInt_FromLong(pid));
265 PyDict_SetItemString(dict, "common_comm", PyString_FromString(comm));
266 }
267 for (field = event->format.fields; field; field = field->next) {
268 if (field->flags & FIELD_IS_STRING) {
269 int offset;
270 if (field->flags & FIELD_IS_DYNAMIC) {
271 offset = *(int *)(data + field->offset);
272 offset &= 0xffff;
273 } else
274 offset = field->offset;
275 obj = PyString_FromString((char *)data + offset);
276 } else { /* FIELD_IS_NUMERIC */
277 val = read_size(data + field->offset, field->size);
278 if (field->flags & FIELD_IS_SIGNED) {
279 if ((long long)val >= LONG_MIN &&
280 (long long)val <= LONG_MAX)
281 obj = PyInt_FromLong(val);
282 else
283 obj = PyLong_FromLongLong(val);
284 } else {
285 if (val <= LONG_MAX)
286 obj = PyInt_FromLong(val);
287 else
288 obj = PyLong_FromUnsignedLongLong(val);
289 }
290 }
291 if (handler)
292 PyTuple_SetItem(t, n++, obj);
293 else
294 PyDict_SetItemString(dict, field->name, obj);
295
296 }
297 if (!handler)
298 PyTuple_SetItem(t, n++, dict);
299
300 if (_PyTuple_Resize(&t, n) == -1)
301 Py_FatalError("error resizing Python tuple");
302
303 if (handler) {
304 retval = PyObject_CallObject(handler, t);
305 if (retval == NULL)
306 handler_call_die(handler_name);
307 } else {
308 handler = PyDict_GetItemString(main_dict, "trace_unhandled");
309 if (handler && PyCallable_Check(handler)) {
310
311 retval = PyObject_CallObject(handler, t);
312 if (retval == NULL)
313 handler_call_die("trace_unhandled");
314 }
315 Py_DECREF(dict);
316 }
317
318 Py_DECREF(t);
319}
320
321static int run_start_sub(void)
322{
323 PyObject *handler, *retval;
324 int err = 0;
325
326 main_module = PyImport_AddModule("__main__");
327 if (main_module == NULL)
328 return -1;
329 Py_INCREF(main_module);
330
331 main_dict = PyModule_GetDict(main_module);
332 if (main_dict == NULL) {
333 err = -1;
334 goto error;
335 }
336 Py_INCREF(main_dict);
337
338 handler = PyDict_GetItemString(main_dict, "trace_begin");
339 if (handler == NULL || !PyCallable_Check(handler))
340 goto out;
341
342 retval = PyObject_CallObject(handler, NULL);
343 if (retval == NULL)
344 handler_call_die("trace_begin");
345
346 Py_DECREF(retval);
347 return err;
348error:
349 Py_XDECREF(main_dict);
350 Py_XDECREF(main_module);
351out:
352 return err;
353}
354
355/*
356 * Start trace script
357 */
358static int python_start_script(const char *script, int argc, const char **argv)
359{
360 const char **command_line;
361 char buf[PATH_MAX];
362 int i, err = 0;
363 FILE *fp;
364
365 command_line = malloc((argc + 1) * sizeof(const char *));
366 command_line[0] = script;
367 for (i = 1; i < argc + 1; i++)
368 command_line[i] = argv[i - 1];
369
370 Py_Initialize();
371
372 initperf_trace_context();
373
374 PySys_SetArgv(argc + 1, (char **)command_line);
375
376 fp = fopen(script, "r");
377 if (!fp) {
378 sprintf(buf, "Can't open python script \"%s\"", script);
379 perror(buf);
380 err = -1;
381 goto error;
382 }
383
384 err = PyRun_SimpleFile(fp, script);
385 if (err) {
386 fprintf(stderr, "Error running python script %s\n", script);
387 goto error;
388 }
389
390 err = run_start_sub();
391 if (err) {
392 fprintf(stderr, "Error starting python script %s\n", script);
393 goto error;
394 }
395
396 free(command_line);
397
398 return err;
399error:
400 Py_Finalize();
401 free(command_line);
402
403 return err;
404}
405
406/*
407 * Stop trace script
408 */
409static int python_stop_script(void)
410{
411 PyObject *handler, *retval;
412 int err = 0;
413
414 handler = PyDict_GetItemString(main_dict, "trace_end");
415 if (handler == NULL || !PyCallable_Check(handler))
416 goto out;
417
418 retval = PyObject_CallObject(handler, NULL);
419 if (retval == NULL)
420 handler_call_die("trace_end");
421 else
422 Py_DECREF(retval);
423out:
424 Py_XDECREF(main_dict);
425 Py_XDECREF(main_module);
426 Py_Finalize();
427
428 return err;
429}
430
431static int python_generate_script(const char *outfile)
432{
433 struct event *event = NULL;
434 struct format_field *f;
435 char fname[PATH_MAX];
436 int not_first, count;
437 FILE *ofp;
438
439 sprintf(fname, "%s.py", outfile);
440 ofp = fopen(fname, "w");
441 if (ofp == NULL) {
442 fprintf(stderr, "couldn't open %s\n", fname);
443 return -1;
444 }
445 fprintf(ofp, "# perf trace event handlers, "
446 "generated by perf trace -g python\n");
447
448 fprintf(ofp, "# Licensed under the terms of the GNU GPL"
449 " License version 2\n\n");
450
451 fprintf(ofp, "# The common_* event handler fields are the most useful "
452 "fields common to\n");
453
454 fprintf(ofp, "# all events. They don't necessarily correspond to "
455 "the 'common_*' fields\n");
456
457 fprintf(ofp, "# in the format files. Those fields not available as "
458 "handler params can\n");
459
460 fprintf(ofp, "# be retrieved using Python functions of the form "
461 "common_*(context).\n");
462
463 fprintf(ofp, "# See the perf-trace-python Documentation for the list "
464 "of available functions.\n\n");
465
466 fprintf(ofp, "import os\n");
467 fprintf(ofp, "import sys\n\n");
468
469 fprintf(ofp, "sys.path.append(os.environ['PERF_EXEC_PATH'] + \\\n");
470 fprintf(ofp, "\t'/scripts/python/Perf-Trace-Util/lib/Perf/Trace')\n");
471 fprintf(ofp, "\nfrom perf_trace_context import *\n");
472 fprintf(ofp, "from Core import *\n\n\n");
473
474 fprintf(ofp, "def trace_begin():\n");
475 fprintf(ofp, "\tprint \"in trace_begin\"\n\n");
476
477 fprintf(ofp, "def trace_end():\n");
478 fprintf(ofp, "\tprint \"in trace_end\"\n\n");
479
480 while ((event = trace_find_next_event(event))) {
481 fprintf(ofp, "def %s__%s(", event->system, event->name);
482 fprintf(ofp, "event_name, ");
483 fprintf(ofp, "context, ");
484 fprintf(ofp, "common_cpu,\n");
485 fprintf(ofp, "\tcommon_secs, ");
486 fprintf(ofp, "common_nsecs, ");
487 fprintf(ofp, "common_pid, ");
488 fprintf(ofp, "common_comm,\n\t");
489
490 not_first = 0;
491 count = 0;
492
493 for (f = event->format.fields; f; f = f->next) {
494 if (not_first++)
495 fprintf(ofp, ", ");
496 if (++count % 5 == 0)
497 fprintf(ofp, "\n\t");
498
499 fprintf(ofp, "%s", f->name);
500 }
501 fprintf(ofp, "):\n");
502
503 fprintf(ofp, "\t\tprint_header(event_name, common_cpu, "
504 "common_secs, common_nsecs,\n\t\t\t"
505 "common_pid, common_comm)\n\n");
506
507 fprintf(ofp, "\t\tprint \"");
508
509 not_first = 0;
510 count = 0;
511
512 for (f = event->format.fields; f; f = f->next) {
513 if (not_first++)
514 fprintf(ofp, ", ");
515 if (count && count % 3 == 0) {
516 fprintf(ofp, "\" \\\n\t\t\"");
517 }
518 count++;
519
520 fprintf(ofp, "%s=", f->name);
521 if (f->flags & FIELD_IS_STRING ||
522 f->flags & FIELD_IS_FLAG ||
523 f->flags & FIELD_IS_SYMBOLIC)
524 fprintf(ofp, "%%s");
525 else if (f->flags & FIELD_IS_SIGNED)
526 fprintf(ofp, "%%d");
527 else
528 fprintf(ofp, "%%u");
529 }
530
531 fprintf(ofp, "\\n\" %% \\\n\t\t(");
532
533 not_first = 0;
534 count = 0;
535
536 for (f = event->format.fields; f; f = f->next) {
537 if (not_first++)
538 fprintf(ofp, ", ");
539
540 if (++count % 5 == 0)
541 fprintf(ofp, "\n\t\t");
542
543 if (f->flags & FIELD_IS_FLAG) {
544 if ((count - 1) % 5 != 0) {
545 fprintf(ofp, "\n\t\t");
546 count = 4;
547 }
548 fprintf(ofp, "flag_str(\"");
549 fprintf(ofp, "%s__%s\", ", event->system,
550 event->name);
551 fprintf(ofp, "\"%s\", %s)", f->name,
552 f->name);
553 } else if (f->flags & FIELD_IS_SYMBOLIC) {
554 if ((count - 1) % 5 != 0) {
555 fprintf(ofp, "\n\t\t");
556 count = 4;
557 }
558 fprintf(ofp, "symbol_str(\"");
559 fprintf(ofp, "%s__%s\", ", event->system,
560 event->name);
561 fprintf(ofp, "\"%s\", %s)", f->name,
562 f->name);
563 } else
564 fprintf(ofp, "%s", f->name);
565 }
566
567 fprintf(ofp, "),\n\n");
568 }
569
570 fprintf(ofp, "def trace_unhandled(event_name, context, "
571 "event_fields_dict):\n");
572
573 fprintf(ofp, "\t\tprint ' '.join(['%%s=%%s'%%(k,str(v))"
574 "for k,v in sorted(event_fields_dict.items())])\n\n");
575
576 fprintf(ofp, "def print_header("
577 "event_name, cpu, secs, nsecs, pid, comm):\n"
578 "\tprint \"%%-20s %%5u %%05u.%%09u %%8u %%-20s \" %% \\\n\t"
579 "(event_name, cpu, secs, nsecs, pid, comm),\n");
580
581 fclose(ofp);
582
583 fprintf(stderr, "generated Python script: %s\n", fname);
584
585 return 0;
586}
587
588struct scripting_ops python_scripting_ops = {
589 .name = "Python",
590 .start_script = python_start_script,
591 .stop_script = python_stop_script,
592 .process_event = python_process_event,
593 .generate_script = python_generate_script,
594};
diff --git a/tools/perf/util/session.c b/tools/perf/util/session.c
index ce3a6c8abe76..c422cd676313 100644
--- a/tools/perf/util/session.c
+++ b/tools/perf/util/session.c
@@ -1,7 +1,11 @@
1#define _FILE_OFFSET_BITS 64
2
1#include <linux/kernel.h> 3#include <linux/kernel.h>
2 4
5#include <byteswap.h>
3#include <unistd.h> 6#include <unistd.h>
4#include <sys/types.h> 7#include <sys/types.h>
8#include <sys/mman.h>
5 9
6#include "session.h" 10#include "session.h"
7#include "sort.h" 11#include "sort.h"
@@ -11,6 +15,16 @@ static int perf_session__open(struct perf_session *self, bool force)
11{ 15{
12 struct stat input_stat; 16 struct stat input_stat;
13 17
18 if (!strcmp(self->filename, "-")) {
19 self->fd_pipe = true;
20 self->fd = STDIN_FILENO;
21
22 if (perf_header__read(self, self->fd) < 0)
23 pr_err("incompatible file format");
24
25 return 0;
26 }
27
14 self->fd = open(self->filename, O_RDONLY); 28 self->fd = open(self->filename, O_RDONLY);
15 if (self->fd < 0) { 29 if (self->fd < 0) {
16 pr_err("failed to open file: %s", self->filename); 30 pr_err("failed to open file: %s", self->filename);
@@ -35,7 +49,7 @@ static int perf_session__open(struct perf_session *self, bool force)
35 goto out_close; 49 goto out_close;
36 } 50 }
37 51
38 if (perf_header__read(&self->header, self->fd) < 0) { 52 if (perf_header__read(self, self->fd) < 0) {
39 pr_err("incompatible file format"); 53 pr_err("incompatible file format");
40 goto out_close; 54 goto out_close;
41 } 55 }
@@ -49,7 +63,21 @@ out_close:
49 return -1; 63 return -1;
50} 64}
51 65
52struct perf_session *perf_session__new(const char *filename, int mode, bool force) 66void perf_session__update_sample_type(struct perf_session *self)
67{
68 self->sample_type = perf_header__sample_type(&self->header);
69}
70
71int perf_session__create_kernel_maps(struct perf_session *self)
72{
73 int ret = machine__create_kernel_maps(&self->host_machine);
74
75 if (ret >= 0)
76 ret = machines__create_guest_kernel_maps(&self->machines);
77 return ret;
78}
79
80struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe)
53{ 81{
54 size_t len = filename ? strlen(filename) + 1 : 0; 82 size_t len = filename ? strlen(filename) + 1 : 0;
55 struct perf_session *self = zalloc(sizeof(*self) + len); 83 struct perf_session *self = zalloc(sizeof(*self) + len);
@@ -62,17 +90,30 @@ struct perf_session *perf_session__new(const char *filename, int mode, bool forc
62 90
63 memcpy(self->filename, filename, len); 91 memcpy(self->filename, filename, len);
64 self->threads = RB_ROOT; 92 self->threads = RB_ROOT;
93 INIT_LIST_HEAD(&self->dead_threads);
94 self->hists_tree = RB_ROOT;
65 self->last_match = NULL; 95 self->last_match = NULL;
66 self->mmap_window = 32; 96 self->mmap_window = 32;
67 self->cwd = NULL; 97 self->cwd = NULL;
68 self->cwdlen = 0; 98 self->cwdlen = 0;
69 map_groups__init(&self->kmaps); 99 self->machines = RB_ROOT;
100 self->repipe = repipe;
101 INIT_LIST_HEAD(&self->ordered_samples.samples_head);
102 machine__init(&self->host_machine, "", HOST_KERNEL_ID);
70 103
71 if (perf_session__create_kernel_maps(self) < 0) 104 if (mode == O_RDONLY) {
72 goto out_delete; 105 if (perf_session__open(self, force) < 0)
106 goto out_delete;
107 } else if (mode == O_WRONLY) {
108 /*
109 * In O_RDONLY mode this will be performed when reading the
110 * kernel MMAP event, in event__process_mmap().
111 */
112 if (perf_session__create_kernel_maps(self) < 0)
113 goto out_delete;
114 }
73 115
74 if (mode == O_RDONLY && perf_session__open(self, force) < 0) 116 perf_session__update_sample_type(self);
75 goto out_delete;
76out: 117out:
77 return self; 118 return self;
78out_free: 119out_free:
@@ -91,6 +132,16 @@ void perf_session__delete(struct perf_session *self)
91 free(self); 132 free(self);
92} 133}
93 134
135void perf_session__remove_thread(struct perf_session *self, struct thread *th)
136{
137 rb_erase(&th->rb_node, &self->threads);
138 /*
139 * We may have references to this thread, for instance in some hist_entry
140 * instances, so just move them to a separate list.
141 */
142 list_add_tail(&th->node, &self->dead_threads);
143}
144
94static bool symbol__match_parent_regex(struct symbol *sym) 145static bool symbol__match_parent_regex(struct symbol *sym)
95{ 146{
96 if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0)) 147 if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
@@ -99,22 +150,17 @@ static bool symbol__match_parent_regex(struct symbol *sym)
99 return 0; 150 return 0;
100} 151}
101 152
102struct symbol **perf_session__resolve_callchain(struct perf_session *self, 153struct map_symbol *perf_session__resolve_callchain(struct perf_session *self,
103 struct thread *thread, 154 struct thread *thread,
104 struct ip_callchain *chain, 155 struct ip_callchain *chain,
105 struct symbol **parent) 156 struct symbol **parent)
106{ 157{
107 u8 cpumode = PERF_RECORD_MISC_USER; 158 u8 cpumode = PERF_RECORD_MISC_USER;
108 struct symbol **syms = NULL;
109 unsigned int i; 159 unsigned int i;
160 struct map_symbol *syms = calloc(chain->nr, sizeof(*syms));
110 161
111 if (symbol_conf.use_callchain) { 162 if (!syms)
112 syms = calloc(chain->nr, sizeof(*syms)); 163 return NULL;
113 if (!syms) {
114 fprintf(stderr, "Can't allocate memory for symbols\n");
115 exit(-1);
116 }
117 }
118 164
119 for (i = 0; i < chain->nr; i++) { 165 for (i = 0; i < chain->nr; i++) {
120 u64 ip = chain->ips[i]; 166 u64 ip = chain->ips[i];
@@ -134,17 +180,736 @@ struct symbol **perf_session__resolve_callchain(struct perf_session *self,
134 continue; 180 continue;
135 } 181 }
136 182
183 al.filtered = false;
137 thread__find_addr_location(thread, self, cpumode, 184 thread__find_addr_location(thread, self, cpumode,
138 MAP__FUNCTION, ip, &al, NULL); 185 MAP__FUNCTION, thread->pid, ip, &al, NULL);
139 if (al.sym != NULL) { 186 if (al.sym != NULL) {
140 if (sort__has_parent && !*parent && 187 if (sort__has_parent && !*parent &&
141 symbol__match_parent_regex(al.sym)) 188 symbol__match_parent_regex(al.sym))
142 *parent = al.sym; 189 *parent = al.sym;
143 if (!symbol_conf.use_callchain) 190 if (!symbol_conf.use_callchain)
144 break; 191 break;
145 syms[i] = al.sym; 192 syms[i].map = al.map;
193 syms[i].sym = al.sym;
146 } 194 }
147 } 195 }
148 196
149 return syms; 197 return syms;
150} 198}
199
200static int process_event_stub(event_t *event __used,
201 struct perf_session *session __used)
202{
203 dump_printf(": unhandled!\n");
204 return 0;
205}
206
207static int process_finished_round_stub(event_t *event __used,
208 struct perf_session *session __used,
209 struct perf_event_ops *ops __used)
210{
211 dump_printf(": unhandled!\n");
212 return 0;
213}
214
215static int process_finished_round(event_t *event,
216 struct perf_session *session,
217 struct perf_event_ops *ops);
218
219static void perf_event_ops__fill_defaults(struct perf_event_ops *handler)
220{
221 if (handler->sample == NULL)
222 handler->sample = process_event_stub;
223 if (handler->mmap == NULL)
224 handler->mmap = process_event_stub;
225 if (handler->comm == NULL)
226 handler->comm = process_event_stub;
227 if (handler->fork == NULL)
228 handler->fork = process_event_stub;
229 if (handler->exit == NULL)
230 handler->exit = process_event_stub;
231 if (handler->lost == NULL)
232 handler->lost = process_event_stub;
233 if (handler->read == NULL)
234 handler->read = process_event_stub;
235 if (handler->throttle == NULL)
236 handler->throttle = process_event_stub;
237 if (handler->unthrottle == NULL)
238 handler->unthrottle = process_event_stub;
239 if (handler->attr == NULL)
240 handler->attr = process_event_stub;
241 if (handler->event_type == NULL)
242 handler->event_type = process_event_stub;
243 if (handler->tracing_data == NULL)
244 handler->tracing_data = process_event_stub;
245 if (handler->build_id == NULL)
246 handler->build_id = process_event_stub;
247 if (handler->finished_round == NULL) {
248 if (handler->ordered_samples)
249 handler->finished_round = process_finished_round;
250 else
251 handler->finished_round = process_finished_round_stub;
252 }
253}
254
255void mem_bswap_64(void *src, int byte_size)
256{
257 u64 *m = src;
258
259 while (byte_size > 0) {
260 *m = bswap_64(*m);
261 byte_size -= sizeof(u64);
262 ++m;
263 }
264}
265
266static void event__all64_swap(event_t *self)
267{
268 struct perf_event_header *hdr = &self->header;
269 mem_bswap_64(hdr + 1, self->header.size - sizeof(*hdr));
270}
271
272static void event__comm_swap(event_t *self)
273{
274 self->comm.pid = bswap_32(self->comm.pid);
275 self->comm.tid = bswap_32(self->comm.tid);
276}
277
278static void event__mmap_swap(event_t *self)
279{
280 self->mmap.pid = bswap_32(self->mmap.pid);
281 self->mmap.tid = bswap_32(self->mmap.tid);
282 self->mmap.start = bswap_64(self->mmap.start);
283 self->mmap.len = bswap_64(self->mmap.len);
284 self->mmap.pgoff = bswap_64(self->mmap.pgoff);
285}
286
287static void event__task_swap(event_t *self)
288{
289 self->fork.pid = bswap_32(self->fork.pid);
290 self->fork.tid = bswap_32(self->fork.tid);
291 self->fork.ppid = bswap_32(self->fork.ppid);
292 self->fork.ptid = bswap_32(self->fork.ptid);
293 self->fork.time = bswap_64(self->fork.time);
294}
295
296static void event__read_swap(event_t *self)
297{
298 self->read.pid = bswap_32(self->read.pid);
299 self->read.tid = bswap_32(self->read.tid);
300 self->read.value = bswap_64(self->read.value);
301 self->read.time_enabled = bswap_64(self->read.time_enabled);
302 self->read.time_running = bswap_64(self->read.time_running);
303 self->read.id = bswap_64(self->read.id);
304}
305
306static void event__attr_swap(event_t *self)
307{
308 size_t size;
309
310 self->attr.attr.type = bswap_32(self->attr.attr.type);
311 self->attr.attr.size = bswap_32(self->attr.attr.size);
312 self->attr.attr.config = bswap_64(self->attr.attr.config);
313 self->attr.attr.sample_period = bswap_64(self->attr.attr.sample_period);
314 self->attr.attr.sample_type = bswap_64(self->attr.attr.sample_type);
315 self->attr.attr.read_format = bswap_64(self->attr.attr.read_format);
316 self->attr.attr.wakeup_events = bswap_32(self->attr.attr.wakeup_events);
317 self->attr.attr.bp_type = bswap_32(self->attr.attr.bp_type);
318 self->attr.attr.bp_addr = bswap_64(self->attr.attr.bp_addr);
319 self->attr.attr.bp_len = bswap_64(self->attr.attr.bp_len);
320
321 size = self->header.size;
322 size -= (void *)&self->attr.id - (void *)self;
323 mem_bswap_64(self->attr.id, size);
324}
325
326static void event__event_type_swap(event_t *self)
327{
328 self->event_type.event_type.event_id =
329 bswap_64(self->event_type.event_type.event_id);
330}
331
332static void event__tracing_data_swap(event_t *self)
333{
334 self->tracing_data.size = bswap_32(self->tracing_data.size);
335}
336
337typedef void (*event__swap_op)(event_t *self);
338
339static event__swap_op event__swap_ops[] = {
340 [PERF_RECORD_MMAP] = event__mmap_swap,
341 [PERF_RECORD_COMM] = event__comm_swap,
342 [PERF_RECORD_FORK] = event__task_swap,
343 [PERF_RECORD_EXIT] = event__task_swap,
344 [PERF_RECORD_LOST] = event__all64_swap,
345 [PERF_RECORD_READ] = event__read_swap,
346 [PERF_RECORD_SAMPLE] = event__all64_swap,
347 [PERF_RECORD_HEADER_ATTR] = event__attr_swap,
348 [PERF_RECORD_HEADER_EVENT_TYPE] = event__event_type_swap,
349 [PERF_RECORD_HEADER_TRACING_DATA] = event__tracing_data_swap,
350 [PERF_RECORD_HEADER_BUILD_ID] = NULL,
351 [PERF_RECORD_HEADER_MAX] = NULL,
352};
353
354struct sample_queue {
355 u64 timestamp;
356 struct sample_event *event;
357 struct list_head list;
358};
359
360static void flush_sample_queue(struct perf_session *s,
361 struct perf_event_ops *ops)
362{
363 struct list_head *head = &s->ordered_samples.samples_head;
364 u64 limit = s->ordered_samples.next_flush;
365 struct sample_queue *tmp, *iter;
366
367 if (!ops->ordered_samples || !limit)
368 return;
369
370 list_for_each_entry_safe(iter, tmp, head, list) {
371 if (iter->timestamp > limit)
372 return;
373
374 if (iter == s->ordered_samples.last_inserted)
375 s->ordered_samples.last_inserted = NULL;
376
377 ops->sample((event_t *)iter->event, s);
378
379 s->ordered_samples.last_flush = iter->timestamp;
380 list_del(&iter->list);
381 free(iter->event);
382 free(iter);
383 }
384}
385
386/*
387 * When perf record finishes a pass on every buffers, it records this pseudo
388 * event.
389 * We record the max timestamp t found in the pass n.
390 * Assuming these timestamps are monotonic across cpus, we know that if
391 * a buffer still has events with timestamps below t, they will be all
392 * available and then read in the pass n + 1.
393 * Hence when we start to read the pass n + 2, we can safely flush every
394 * events with timestamps below t.
395 *
396 * ============ PASS n =================
397 * CPU 0 | CPU 1
398 * |
399 * cnt1 timestamps | cnt2 timestamps
400 * 1 | 2
401 * 2 | 3
402 * - | 4 <--- max recorded
403 *
404 * ============ PASS n + 1 ==============
405 * CPU 0 | CPU 1
406 * |
407 * cnt1 timestamps | cnt2 timestamps
408 * 3 | 5
409 * 4 | 6
410 * 5 | 7 <---- max recorded
411 *
412 * Flush every events below timestamp 4
413 *
414 * ============ PASS n + 2 ==============
415 * CPU 0 | CPU 1
416 * |
417 * cnt1 timestamps | cnt2 timestamps
418 * 6 | 8
419 * 7 | 9
420 * - | 10
421 *
422 * Flush every events below timestamp 7
423 * etc...
424 */
425static int process_finished_round(event_t *event __used,
426 struct perf_session *session,
427 struct perf_event_ops *ops)
428{
429 flush_sample_queue(session, ops);
430 session->ordered_samples.next_flush = session->ordered_samples.max_timestamp;
431
432 return 0;
433}
434
435static void __queue_sample_end(struct sample_queue *new, struct list_head *head)
436{
437 struct sample_queue *iter;
438
439 list_for_each_entry_reverse(iter, head, list) {
440 if (iter->timestamp < new->timestamp) {
441 list_add(&new->list, &iter->list);
442 return;
443 }
444 }
445
446 list_add(&new->list, head);
447}
448
449static void __queue_sample_before(struct sample_queue *new,
450 struct sample_queue *iter,
451 struct list_head *head)
452{
453 list_for_each_entry_continue_reverse(iter, head, list) {
454 if (iter->timestamp < new->timestamp) {
455 list_add(&new->list, &iter->list);
456 return;
457 }
458 }
459
460 list_add(&new->list, head);
461}
462
463static void __queue_sample_after(struct sample_queue *new,
464 struct sample_queue *iter,
465 struct list_head *head)
466{
467 list_for_each_entry_continue(iter, head, list) {
468 if (iter->timestamp > new->timestamp) {
469 list_add_tail(&new->list, &iter->list);
470 return;
471 }
472 }
473 list_add_tail(&new->list, head);
474}
475
476/* The queue is ordered by time */
477static void __queue_sample_event(struct sample_queue *new,
478 struct perf_session *s)
479{
480 struct sample_queue *last_inserted = s->ordered_samples.last_inserted;
481 struct list_head *head = &s->ordered_samples.samples_head;
482
483
484 if (!last_inserted) {
485 __queue_sample_end(new, head);
486 return;
487 }
488
489 /*
490 * Most of the time the current event has a timestamp
491 * very close to the last event inserted, unless we just switched
492 * to another event buffer. Having a sorting based on a list and
493 * on the last inserted event that is close to the current one is
494 * probably more efficient than an rbtree based sorting.
495 */
496 if (last_inserted->timestamp >= new->timestamp)
497 __queue_sample_before(new, last_inserted, head);
498 else
499 __queue_sample_after(new, last_inserted, head);
500}
501
502static int queue_sample_event(event_t *event, struct sample_data *data,
503 struct perf_session *s)
504{
505 u64 timestamp = data->time;
506 struct sample_queue *new;
507
508
509 if (timestamp < s->ordered_samples.last_flush) {
510 printf("Warning: Timestamp below last timeslice flush\n");
511 return -EINVAL;
512 }
513
514 new = malloc(sizeof(*new));
515 if (!new)
516 return -ENOMEM;
517
518 new->timestamp = timestamp;
519
520 new->event = malloc(event->header.size);
521 if (!new->event) {
522 free(new);
523 return -ENOMEM;
524 }
525
526 memcpy(new->event, event, event->header.size);
527
528 __queue_sample_event(new, s);
529 s->ordered_samples.last_inserted = new;
530
531 if (new->timestamp > s->ordered_samples.max_timestamp)
532 s->ordered_samples.max_timestamp = new->timestamp;
533
534 return 0;
535}
536
537static int perf_session__process_sample(event_t *event, struct perf_session *s,
538 struct perf_event_ops *ops)
539{
540 struct sample_data data;
541
542 if (!ops->ordered_samples)
543 return ops->sample(event, s);
544
545 bzero(&data, sizeof(struct sample_data));
546 event__parse_sample(event, s->sample_type, &data);
547
548 queue_sample_event(event, &data, s);
549
550 return 0;
551}
552
553static int perf_session__process_event(struct perf_session *self,
554 event_t *event,
555 struct perf_event_ops *ops,
556 u64 offset, u64 head)
557{
558 trace_event(event);
559
560 if (event->header.type < PERF_RECORD_HEADER_MAX) {
561 dump_printf("%#Lx [%#x]: PERF_RECORD_%s",
562 offset + head, event->header.size,
563 event__name[event->header.type]);
564 hists__inc_nr_events(&self->hists, event->header.type);
565 }
566
567 if (self->header.needs_swap && event__swap_ops[event->header.type])
568 event__swap_ops[event->header.type](event);
569
570 switch (event->header.type) {
571 case PERF_RECORD_SAMPLE:
572 return perf_session__process_sample(event, self, ops);
573 case PERF_RECORD_MMAP:
574 return ops->mmap(event, self);
575 case PERF_RECORD_COMM:
576 return ops->comm(event, self);
577 case PERF_RECORD_FORK:
578 return ops->fork(event, self);
579 case PERF_RECORD_EXIT:
580 return ops->exit(event, self);
581 case PERF_RECORD_LOST:
582 return ops->lost(event, self);
583 case PERF_RECORD_READ:
584 return ops->read(event, self);
585 case PERF_RECORD_THROTTLE:
586 return ops->throttle(event, self);
587 case PERF_RECORD_UNTHROTTLE:
588 return ops->unthrottle(event, self);
589 case PERF_RECORD_HEADER_ATTR:
590 return ops->attr(event, self);
591 case PERF_RECORD_HEADER_EVENT_TYPE:
592 return ops->event_type(event, self);
593 case PERF_RECORD_HEADER_TRACING_DATA:
594 /* setup for reading amidst mmap */
595 lseek(self->fd, offset + head, SEEK_SET);
596 return ops->tracing_data(event, self);
597 case PERF_RECORD_HEADER_BUILD_ID:
598 return ops->build_id(event, self);
599 case PERF_RECORD_FINISHED_ROUND:
600 return ops->finished_round(event, self, ops);
601 default:
602 ++self->hists.stats.nr_unknown_events;
603 return -1;
604 }
605}
606
607void perf_event_header__bswap(struct perf_event_header *self)
608{
609 self->type = bswap_32(self->type);
610 self->misc = bswap_16(self->misc);
611 self->size = bswap_16(self->size);
612}
613
/*
 * Look up (or create) the thread with pid 0 and name it "swapper".
 *
 * Returns the thread, or NULL (after logging) if it could not be obtained
 * or its comm could not be set.
 */
static struct thread *perf_session__register_idle_thread(struct perf_session *self)
{
	struct thread *idle = perf_session__findnew(self, 0);

	if (idle != NULL && !thread__set_comm(idle, "swapper"))
		return idle;

	pr_err("problem inserting idle task.\n");
	return NULL;
}
625
/*
 * Read exactly @size bytes from @fd into @buf, looping over short reads.
 *
 * Returns the number of bytes read (i.e. @size) on success. If read()
 * reports end-of-file or an error before @size bytes have arrived, that
 * read() result (0 or negative) is returned instead, and whatever was
 * already stored in @buf must be treated as incomplete.
 */
int do_read(int fd, void *buf, size_t size)
{
	/* Byte cursor: arithmetic on void * is a GNU extension, not ISO C. */
	char *cursor = buf;

	while (size) {
		/* read() returns ssize_t; don't narrow it before testing it. */
		ssize_t ret = read(fd, cursor, size);

		if (ret <= 0)
			return ret;

		size -= ret;
		cursor += ret;
	}

	return cursor - (char *)buf;
}
642
/*
 * Stop flag polled by the pipe event loop after each record; a non-zero
 * value ends the loop. The accessor macro forces a volatile read on every
 * use.
 * NOTE(review): nothing in this part of the file sets the flag; presumably
 * a tool's signal handler does - confirm against the users of this symbol.
 */
#define session_done() (*(volatile int *)(&session_done))
volatile int session_done;
645
646static int __perf_session__process_pipe_events(struct perf_session *self,
647 struct perf_event_ops *ops)
648{
649 event_t event;
650 uint32_t size;
651 int skip = 0;
652 u64 head;
653 int err;
654 void *p;
655
656 perf_event_ops__fill_defaults(ops);
657
658 head = 0;
659more:
660 err = do_read(self->fd, &event, sizeof(struct perf_event_header));
661 if (err <= 0) {
662 if (err == 0)
663 goto done;
664
665 pr_err("failed to read event header\n");
666 goto out_err;
667 }
668
669 if (self->header.needs_swap)
670 perf_event_header__bswap(&event.header);
671
672 size = event.header.size;
673 if (size == 0)
674 size = 8;
675
676 p = &event;
677 p += sizeof(struct perf_event_header);
678
679 if (size - sizeof(struct perf_event_header)) {
680 err = do_read(self->fd, p,
681 size - sizeof(struct perf_event_header));
682 if (err <= 0) {
683 if (err == 0) {
684 pr_err("unexpected end of event stream\n");
685 goto done;
686 }
687
688 pr_err("failed to read event data\n");
689 goto out_err;
690 }
691 }
692
693 if (size == 0 ||
694 (skip = perf_session__process_event(self, &event, ops,
695 0, head)) < 0) {
696 dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
697 head, event.header.size, event.header.type);
698 /*
699 * assume we lost track of the stream, check alignment, and
700 * increment a single u64 in the hope to catch on again 'soon'.
701 */
702 if (unlikely(head & 7))
703 head &= ~7ULL;
704
705 size = 8;
706 }
707
708 head += size;
709
710 dump_printf("\n%#Lx [%#x]: event: %d\n",
711 head, event.header.size, event.header.type);
712
713 if (skip > 0)
714 head += skip;
715
716 if (!session_done())
717 goto more;
718done:
719 err = 0;
720out_err:
721 return err;
722}
723
724int __perf_session__process_events(struct perf_session *self,
725 u64 data_offset, u64 data_size,
726 u64 file_size, struct perf_event_ops *ops)
727{
728 int err, mmap_prot, mmap_flags;
729 u64 head, shift;
730 u64 offset = 0;
731 size_t page_size;
732 event_t *event;
733 uint32_t size;
734 char *buf;
735 struct ui_progress *progress = ui_progress__new("Processing events...",
736 self->size);
737 if (progress == NULL)
738 return -1;
739
740 perf_event_ops__fill_defaults(ops);
741
742 page_size = sysconf(_SC_PAGESIZE);
743
744 head = data_offset;
745 shift = page_size * (head / page_size);
746 offset += shift;
747 head -= shift;
748
749 mmap_prot = PROT_READ;
750 mmap_flags = MAP_SHARED;
751
752 if (self->header.needs_swap) {
753 mmap_prot |= PROT_WRITE;
754 mmap_flags = MAP_PRIVATE;
755 }
756remap:
757 buf = mmap(NULL, page_size * self->mmap_window, mmap_prot,
758 mmap_flags, self->fd, offset);
759 if (buf == MAP_FAILED) {
760 pr_err("failed to mmap file\n");
761 err = -errno;
762 goto out_err;
763 }
764
765more:
766 event = (event_t *)(buf + head);
767 ui_progress__update(progress, offset);
768
769 if (self->header.needs_swap)
770 perf_event_header__bswap(&event->header);
771 size = event->header.size;
772 if (size == 0)
773 size = 8;
774
775 if (head + event->header.size >= page_size * self->mmap_window) {
776 int munmap_ret;
777
778 shift = page_size * (head / page_size);
779
780 munmap_ret = munmap(buf, page_size * self->mmap_window);
781 assert(munmap_ret == 0);
782
783 offset += shift;
784 head -= shift;
785 goto remap;
786 }
787
788 size = event->header.size;
789
790 dump_printf("\n%#Lx [%#x]: event: %d\n",
791 offset + head, event->header.size, event->header.type);
792
793 if (size == 0 ||
794 perf_session__process_event(self, event, ops, offset, head) < 0) {
795 dump_printf("%#Lx [%#x]: skipping unknown header type: %d\n",
796 offset + head, event->header.size,
797 event->header.type);
798 /*
799 * assume we lost track of the stream, check alignment, and
800 * increment a single u64 in the hope to catch on again 'soon'.
801 */
802 if (unlikely(head & 7))
803 head &= ~7ULL;
804
805 size = 8;
806 }
807
808 head += size;
809
810 if (offset + head >= data_offset + data_size)
811 goto done;
812
813 if (offset + head < file_size)
814 goto more;
815done:
816 err = 0;
817 /* do the final flush for ordered samples */
818 self->ordered_samples.next_flush = ULLONG_MAX;
819 flush_sample_queue(self, ops);
820out_err:
821 ui_progress__delete(progress);
822 return err;
823}
824
825int perf_session__process_events(struct perf_session *self,
826 struct perf_event_ops *ops)
827{
828 int err;
829
830 if (perf_session__register_idle_thread(self) == NULL)
831 return -ENOMEM;
832
833 if (!symbol_conf.full_paths) {
834 char bf[PATH_MAX];
835
836 if (getcwd(bf, sizeof(bf)) == NULL) {
837 err = -errno;
838out_getcwd_err:
839 pr_err("failed to get the current directory\n");
840 goto out_err;
841 }
842 self->cwd = strdup(bf);
843 if (self->cwd == NULL) {
844 err = -ENOMEM;
845 goto out_getcwd_err;
846 }
847 self->cwdlen = strlen(self->cwd);
848 }
849
850 if (!self->fd_pipe)
851 err = __perf_session__process_events(self,
852 self->header.data_offset,
853 self->header.data_size,
854 self->size, ops);
855 else
856 err = __perf_session__process_pipe_events(self, ops);
857out_err:
858 return err;
859}
860
861bool perf_session__has_traces(struct perf_session *self, const char *msg)
862{
863 if (!(self->sample_type & PERF_SAMPLE_RAW)) {
864 pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
865 return false;
866 }
867
868 return true;
869}
870
871int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps,
872 const char *symbol_name,
873 u64 addr)
874{
875 char *bracket;
876 enum map_type i;
877 struct ref_reloc_sym *ref;
878
879 ref = zalloc(sizeof(struct ref_reloc_sym));
880 if (ref == NULL)
881 return -ENOMEM;
882
883 ref->name = strdup(symbol_name);
884 if (ref->name == NULL) {
885 free(ref);
886 return -ENOMEM;
887 }
888
889 bracket = strchr(ref->name, ']');
890 if (bracket)
891 *bracket = '\0';
892
893 ref->addr = addr;
894
895 for (i = 0; i < MAP__NR_TYPES; ++i) {
896 struct kmap *kmap = map__kmap(maps[i]);
897 kmap->ref_reloc_sym = ref;
898 }
899
900 return 0;
901}
902
903size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp)
904{
905 return __dsos__fprintf(&self->host_machine.kernel_dsos, fp) +
906 __dsos__fprintf(&self->host_machine.user_dsos, fp) +
907 machines__fprintf_dsos(&self->machines, fp);
908}
909
910size_t perf_session__fprintf_dsos_buildid(struct perf_session *self, FILE *fp,
911 bool with_hits)
912{
913 size_t ret = machine__fprintf_dsos_buildid(&self->host_machine, fp, with_hits);
914 return ret + machines__fprintf_dsos_buildid(&self->machines, fp, with_hits);
915}
diff --git a/tools/perf/util/session.h b/tools/perf/util/session.h
index 32eaa1bada06..9fa0fc2a863f 100644
--- a/tools/perf/util/session.h
+++ b/tools/perf/util/session.h
@@ -1,61 +1,145 @@
1#ifndef __PERF_SESSION_H 1#ifndef __PERF_SESSION_H
2#define __PERF_SESSION_H 2#define __PERF_SESSION_H
3 3
4#include "hist.h"
4#include "event.h" 5#include "event.h"
5#include "header.h" 6#include "header.h"
7#include "symbol.h"
6#include "thread.h" 8#include "thread.h"
7#include <linux/rbtree.h> 9#include <linux/rbtree.h>
8#include "../../../include/linux/perf_event.h" 10#include "../../../include/linux/perf_event.h"
9 11
12struct sample_queue;
10struct ip_callchain; 13struct ip_callchain;
11struct thread; 14struct thread;
12struct symbol; 15
16struct ordered_samples {
17 u64 last_flush;
18 u64 next_flush;
19 u64 max_timestamp;
20 struct list_head samples_head;
21 struct sample_queue *last_inserted;
22};
13 23
14struct perf_session { 24struct perf_session {
15 struct perf_header header; 25 struct perf_header header;
16 unsigned long size; 26 unsigned long size;
17 unsigned long mmap_window; 27 unsigned long mmap_window;
18 struct map_groups kmaps;
19 struct rb_root threads; 28 struct rb_root threads;
29 struct list_head dead_threads;
20 struct thread *last_match; 30 struct thread *last_match;
21 struct events_stats events_stats; 31 struct machine host_machine;
22 unsigned long event_total[PERF_RECORD_MAX]; 32 struct rb_root machines;
23 struct rb_root hists; 33 struct rb_root hists_tree;
34 /*
35 * FIXME: should point to the first entry in hists_tree and
36 * be a hists instance. Right now its only 'report'
37 * that is using ->hists_tree while all the rest use
38 * ->hists.
39 */
40 struct hists hists;
24 u64 sample_type; 41 u64 sample_type;
25 int fd; 42 int fd;
43 bool fd_pipe;
44 bool repipe;
26 int cwdlen; 45 int cwdlen;
27 char *cwd; 46 char *cwd;
47 struct ordered_samples ordered_samples;
28 char filename[0]; 48 char filename[0];
29}; 49};
30 50
51struct perf_event_ops;
52
31typedef int (*event_op)(event_t *self, struct perf_session *session); 53typedef int (*event_op)(event_t *self, struct perf_session *session);
54typedef int (*event_op2)(event_t *self, struct perf_session *session,
55 struct perf_event_ops *ops);
32 56
33struct perf_event_ops { 57struct perf_event_ops {
34 event_op process_sample_event; 58 event_op sample,
35 event_op process_mmap_event; 59 mmap,
36 event_op process_comm_event; 60 comm,
37 event_op process_fork_event; 61 fork,
38 event_op process_exit_event; 62 exit,
39 event_op process_lost_event; 63 lost,
40 event_op process_read_event; 64 read,
41 event_op process_throttle_event; 65 throttle,
42 event_op process_unthrottle_event; 66 unthrottle,
43 int (*sample_type_check)(struct perf_session *session); 67 attr,
44 unsigned long total_unknown; 68 event_type,
45 bool full_paths; 69 tracing_data,
70 build_id;
71 event_op2 finished_round;
72 bool ordered_samples;
46}; 73};
47 74
48struct perf_session *perf_session__new(const char *filename, int mode, bool force); 75struct perf_session *perf_session__new(const char *filename, int mode, bool force, bool repipe);
49void perf_session__delete(struct perf_session *self); 76void perf_session__delete(struct perf_session *self);
50 77
78void perf_event_header__bswap(struct perf_event_header *self);
79
80int __perf_session__process_events(struct perf_session *self,
81 u64 data_offset, u64 data_size, u64 size,
82 struct perf_event_ops *ops);
51int perf_session__process_events(struct perf_session *self, 83int perf_session__process_events(struct perf_session *self,
52 struct perf_event_ops *event_ops); 84 struct perf_event_ops *event_ops);
53 85
54struct symbol **perf_session__resolve_callchain(struct perf_session *self, 86struct map_symbol *perf_session__resolve_callchain(struct perf_session *self,
55 struct thread *thread, 87 struct thread *thread,
56 struct ip_callchain *chain, 88 struct ip_callchain *chain,
57 struct symbol **parent); 89 struct symbol **parent);
90
91bool perf_session__has_traces(struct perf_session *self, const char *msg);
92
93int perf_session__set_kallsyms_ref_reloc_sym(struct map **maps,
94 const char *symbol_name,
95 u64 addr);
96
97void mem_bswap_64(void *src, int byte_size);
98
99int perf_session__create_kernel_maps(struct perf_session *self);
100
101int do_read(int fd, void *buf, size_t size);
102void perf_session__update_sample_type(struct perf_session *self);
103void perf_session__remove_thread(struct perf_session *self, struct thread *th);
104
105static inline
106struct machine *perf_session__find_host_machine(struct perf_session *self)
107{
108 return &self->host_machine;
109}
110
111static inline
112struct machine *perf_session__find_machine(struct perf_session *self, pid_t pid)
113{
114 if (pid == HOST_KERNEL_ID)
115 return &self->host_machine;
116 return machines__find(&self->machines, pid);
117}
118
119static inline
120struct machine *perf_session__findnew_machine(struct perf_session *self, pid_t pid)
121{
122 if (pid == HOST_KERNEL_ID)
123 return &self->host_machine;
124 return machines__findnew(&self->machines, pid);
125}
126
127static inline
128void perf_session__process_machines(struct perf_session *self,
129 machine__process_t process)
130{
131 process(&self->host_machine, self);
132 return machines__process(&self->machines, process, self);
133}
134
135size_t perf_session__fprintf_dsos(struct perf_session *self, FILE *fp);
58 136
59int perf_header__read_build_ids(int input, u64 offset, u64 file_size); 137size_t perf_session__fprintf_dsos_buildid(struct perf_session *self,
138 FILE *fp, bool with_hits);
60 139
140static inline
141size_t perf_session__fprintf_nr_events(struct perf_session *self, FILE *fp)
142{
143 return hists__fprintf_nr_events(&self->hists, fp);
144}
61#endif /* __PERF_SESSION_H */ 145#endif /* __PERF_SESSION_H */
diff --git a/tools/perf/util/sigchain.c b/tools/perf/util/sigchain.c
index 1118b99e57d3..ba785e9b1841 100644
--- a/tools/perf/util/sigchain.c
+++ b/tools/perf/util/sigchain.c
@@ -16,7 +16,7 @@ static void check_signum(int sig)
16 die("BUG: signal out of range: %d", sig); 16 die("BUG: signal out of range: %d", sig);
17} 17}
18 18
19int sigchain_push(int sig, sigchain_fun f) 19static int sigchain_push(int sig, sigchain_fun f)
20{ 20{
21 struct sigchain_signal *s = signals + sig; 21 struct sigchain_signal *s = signals + sig;
22 check_signum(sig); 22 check_signum(sig);
diff --git a/tools/perf/util/sigchain.h b/tools/perf/util/sigchain.h
index 1a53c11265fd..959d64eb5557 100644
--- a/tools/perf/util/sigchain.h
+++ b/tools/perf/util/sigchain.h
@@ -3,7 +3,6 @@
3 3
4typedef void (*sigchain_fun)(int); 4typedef void (*sigchain_fun)(int);
5 5
6int sigchain_push(int sig, sigchain_fun f);
7int sigchain_pop(int sig); 6int sigchain_pop(int sig);
8 7
9void sigchain_push_common(sigchain_fun f); 8void sigchain_push_common(sigchain_fun f);
diff --git a/tools/perf/util/sort.c b/tools/perf/util/sort.c
index cb0f327de9e8..2316cb5a4116 100644
--- a/tools/perf/util/sort.c
+++ b/tools/perf/util/sort.c
@@ -1,10 +1,10 @@
1#include "sort.h" 1#include "sort.h"
2 2
3regex_t parent_regex; 3regex_t parent_regex;
4char default_parent_pattern[] = "^sys_|^do_page_fault"; 4const char default_parent_pattern[] = "^sys_|^do_page_fault";
5char *parent_pattern = default_parent_pattern; 5const char *parent_pattern = default_parent_pattern;
6char default_sort_order[] = "comm,dso,symbol"; 6const char default_sort_order[] = "comm,dso,symbol";
7char *sort_order = default_sort_order; 7const char *sort_order = default_sort_order;
8int sort__need_collapse = 0; 8int sort__need_collapse = 0;
9int sort__has_parent = 0; 9int sort__has_parent = 0;
10 10
@@ -18,39 +18,50 @@ char * field_sep;
18 18
19LIST_HEAD(hist_entry__sort_list); 19LIST_HEAD(hist_entry__sort_list);
20 20
21static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf,
22 size_t size, unsigned int width);
23static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf,
24 size_t size, unsigned int width);
25static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf,
26 size_t size, unsigned int width);
27static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf,
28 size_t size, unsigned int width);
29static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf,
30 size_t size, unsigned int width);
31
21struct sort_entry sort_thread = { 32struct sort_entry sort_thread = {
22 .header = "Command: Pid", 33 .se_header = "Command: Pid",
23 .cmp = sort__thread_cmp, 34 .se_cmp = sort__thread_cmp,
24 .print = sort__thread_print, 35 .se_snprintf = hist_entry__thread_snprintf,
25 .width = &threads__col_width, 36 .se_width = &threads__col_width,
26}; 37};
27 38
28struct sort_entry sort_comm = { 39struct sort_entry sort_comm = {
29 .header = "Command", 40 .se_header = "Command",
30 .cmp = sort__comm_cmp, 41 .se_cmp = sort__comm_cmp,
31 .collapse = sort__comm_collapse, 42 .se_collapse = sort__comm_collapse,
32 .print = sort__comm_print, 43 .se_snprintf = hist_entry__comm_snprintf,
33 .width = &comms__col_width, 44 .se_width = &comms__col_width,
34}; 45};
35 46
36struct sort_entry sort_dso = { 47struct sort_entry sort_dso = {
37 .header = "Shared Object", 48 .se_header = "Shared Object",
38 .cmp = sort__dso_cmp, 49 .se_cmp = sort__dso_cmp,
39 .print = sort__dso_print, 50 .se_snprintf = hist_entry__dso_snprintf,
40 .width = &dsos__col_width, 51 .se_width = &dsos__col_width,
41}; 52};
42 53
43struct sort_entry sort_sym = { 54struct sort_entry sort_sym = {
44 .header = "Symbol", 55 .se_header = "Symbol",
45 .cmp = sort__sym_cmp, 56 .se_cmp = sort__sym_cmp,
46 .print = sort__sym_print, 57 .se_snprintf = hist_entry__sym_snprintf,
47}; 58};
48 59
49struct sort_entry sort_parent = { 60struct sort_entry sort_parent = {
50 .header = "Parent symbol", 61 .se_header = "Parent symbol",
51 .cmp = sort__parent_cmp, 62 .se_cmp = sort__parent_cmp,
52 .print = sort__parent_print, 63 .se_snprintf = hist_entry__parent_snprintf,
53 .width = &parent_symbol__col_width, 64 .se_width = &parent_symbol__col_width,
54}; 65};
55 66
56struct sort_dimension { 67struct sort_dimension {
@@ -85,45 +96,38 @@ sort__thread_cmp(struct hist_entry *left, struct hist_entry *right)
85 return right->thread->pid - left->thread->pid; 96 return right->thread->pid - left->thread->pid;
86} 97}
87 98
88int repsep_fprintf(FILE *fp, const char *fmt, ...) 99static int repsep_snprintf(char *bf, size_t size, const char *fmt, ...)
89{ 100{
90 int n; 101 int n;
91 va_list ap; 102 va_list ap;
92 103
93 va_start(ap, fmt); 104 va_start(ap, fmt);
94 if (!field_sep) 105 n = vsnprintf(bf, size, fmt, ap);
95 n = vfprintf(fp, fmt, ap); 106 if (field_sep && n > 0) {
96 else { 107 char *sep = bf;
97 char *bf = NULL; 108
98 n = vasprintf(&bf, fmt, ap); 109 while (1) {
99 if (n > 0) { 110 sep = strchr(sep, *field_sep);
100 char *sep = bf; 111 if (sep == NULL)
101 112 break;
102 while (1) { 113 *sep = '.';
103 sep = strchr(sep, *field_sep);
104 if (sep == NULL)
105 break;
106 *sep = '.';
107 }
108 } 114 }
109 fputs(bf, fp);
110 free(bf);
111 } 115 }
112 va_end(ap); 116 va_end(ap);
113 return n; 117 return n;
114} 118}
115 119
116size_t 120static int hist_entry__thread_snprintf(struct hist_entry *self, char *bf,
117sort__thread_print(FILE *fp, struct hist_entry *self, unsigned int width) 121 size_t size, unsigned int width)
118{ 122{
119 return repsep_fprintf(fp, "%*s:%5d", width - 6, 123 return repsep_snprintf(bf, size, "%*s:%5d", width,
120 self->thread->comm ?: "", self->thread->pid); 124 self->thread->comm ?: "", self->thread->pid);
121} 125}
122 126
123size_t 127static int hist_entry__comm_snprintf(struct hist_entry *self, char *bf,
124sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width) 128 size_t size, unsigned int width)
125{ 129{
126 return repsep_fprintf(fp, "%*s", width, self->thread->comm); 130 return repsep_snprintf(bf, size, "%*s", width, self->thread->comm);
127} 131}
128 132
129/* --sort dso */ 133/* --sort dso */
@@ -131,8 +135,8 @@ sort__comm_print(FILE *fp, struct hist_entry *self, unsigned int width)
131int64_t 135int64_t
132sort__dso_cmp(struct hist_entry *left, struct hist_entry *right) 136sort__dso_cmp(struct hist_entry *left, struct hist_entry *right)
133{ 137{
134 struct dso *dso_l = left->map ? left->map->dso : NULL; 138 struct dso *dso_l = left->ms.map ? left->ms.map->dso : NULL;
135 struct dso *dso_r = right->map ? right->map->dso : NULL; 139 struct dso *dso_r = right->ms.map ? right->ms.map->dso : NULL;
136 const char *dso_name_l, *dso_name_r; 140 const char *dso_name_l, *dso_name_r;
137 141
138 if (!dso_l || !dso_r) 142 if (!dso_l || !dso_r)
@@ -149,16 +153,16 @@ sort__dso_cmp(struct hist_entry *left, struct hist_entry *right)
149 return strcmp(dso_name_l, dso_name_r); 153 return strcmp(dso_name_l, dso_name_r);
150} 154}
151 155
152size_t 156static int hist_entry__dso_snprintf(struct hist_entry *self, char *bf,
153sort__dso_print(FILE *fp, struct hist_entry *self, unsigned int width) 157 size_t size, unsigned int width)
154{ 158{
155 if (self->map && self->map->dso) { 159 if (self->ms.map && self->ms.map->dso) {
156 const char *dso_name = !verbose ? self->map->dso->short_name : 160 const char *dso_name = !verbose ? self->ms.map->dso->short_name :
157 self->map->dso->long_name; 161 self->ms.map->dso->long_name;
158 return repsep_fprintf(fp, "%-*s", width, dso_name); 162 return repsep_snprintf(bf, size, "%-*s", width, dso_name);
159 } 163 }
160 164
161 return repsep_fprintf(fp, "%*llx", width, (u64)self->ip); 165 return repsep_snprintf(bf, size, "%*Lx", width, self->ip);
162} 166}
163 167
164/* --sort symbol */ 168/* --sort symbol */
@@ -168,31 +172,31 @@ sort__sym_cmp(struct hist_entry *left, struct hist_entry *right)
168{ 172{
169 u64 ip_l, ip_r; 173 u64 ip_l, ip_r;
170 174
171 if (left->sym == right->sym) 175 if (left->ms.sym == right->ms.sym)
172 return 0; 176 return 0;
173 177
174 ip_l = left->sym ? left->sym->start : left->ip; 178 ip_l = left->ms.sym ? left->ms.sym->start : left->ip;
175 ip_r = right->sym ? right->sym->start : right->ip; 179 ip_r = right->ms.sym ? right->ms.sym->start : right->ip;
176 180
177 return (int64_t)(ip_r - ip_l); 181 return (int64_t)(ip_r - ip_l);
178} 182}
179 183
180 184static int hist_entry__sym_snprintf(struct hist_entry *self, char *bf,
181size_t 185 size_t size, unsigned int width __used)
182sort__sym_print(FILE *fp, struct hist_entry *self, unsigned int width __used)
183{ 186{
184 size_t ret = 0; 187 size_t ret = 0;
185 188
186 if (verbose) { 189 if (verbose) {
187 char o = self->map ? dso__symtab_origin(self->map->dso) : '!'; 190 char o = self->ms.map ? dso__symtab_origin(self->ms.map->dso) : '!';
188 ret += repsep_fprintf(fp, "%#018llx %c ", (u64)self->ip, o); 191 ret += repsep_snprintf(bf, size, "%#018llx %c ", self->ip, o);
189 } 192 }
190 193
191 ret += repsep_fprintf(fp, "[%c] ", self->level); 194 ret += repsep_snprintf(bf + ret, size - ret, "[%c] ", self->level);
192 if (self->sym) 195 if (self->ms.sym)
193 ret += repsep_fprintf(fp, "%s", self->sym->name); 196 ret += repsep_snprintf(bf + ret, size - ret, "%s",
197 self->ms.sym->name);
194 else 198 else
195 ret += repsep_fprintf(fp, "%#016llx", (u64)self->ip); 199 ret += repsep_snprintf(bf + ret, size - ret, "%#016llx", self->ip);
196 200
197 return ret; 201 return ret;
198} 202}
@@ -231,10 +235,10 @@ sort__parent_cmp(struct hist_entry *left, struct hist_entry *right)
231 return strcmp(sym_l->name, sym_r->name); 235 return strcmp(sym_l->name, sym_r->name);
232} 236}
233 237
234size_t 238static int hist_entry__parent_snprintf(struct hist_entry *self, char *bf,
235sort__parent_print(FILE *fp, struct hist_entry *self, unsigned int width) 239 size_t size, unsigned int width)
236{ 240{
237 return repsep_fprintf(fp, "%-*s", width, 241 return repsep_snprintf(bf, size, "%-*s", width,
238 self->parent ? self->parent->name : "[other]"); 242 self->parent ? self->parent->name : "[other]");
239} 243}
240 244
@@ -251,7 +255,7 @@ int sort_dimension__add(const char *tok)
251 if (strncasecmp(tok, sd->name, strlen(tok))) 255 if (strncasecmp(tok, sd->name, strlen(tok)))
252 continue; 256 continue;
253 257
254 if (sd->entry->collapse) 258 if (sd->entry->se_collapse)
255 sort__need_collapse = 1; 259 sort__need_collapse = 1;
256 260
257 if (sd->entry == &sort_parent) { 261 if (sd->entry == &sort_parent) {
@@ -260,9 +264,8 @@ int sort_dimension__add(const char *tok)
260 char err[BUFSIZ]; 264 char err[BUFSIZ];
261 265
262 regerror(ret, &parent_regex, err, sizeof(err)); 266 regerror(ret, &parent_regex, err, sizeof(err));
263 fprintf(stderr, "Invalid regex: %s\n%s", 267 pr_err("Invalid regex: %s\n%s", parent_pattern, err);
264 parent_pattern, err); 268 return -EINVAL;
265 exit(-1);
266 } 269 }
267 sort__has_parent = 1; 270 sort__has_parent = 1;
268 } 271 }
diff --git a/tools/perf/util/sort.h b/tools/perf/util/sort.h
index 753f9ea99fb0..0d61c4082f43 100644
--- a/tools/perf/util/sort.h
+++ b/tools/perf/util/sort.h
@@ -25,10 +25,10 @@
25#include "sort.h" 25#include "sort.h"
26 26
27extern regex_t parent_regex; 27extern regex_t parent_regex;
28extern char *sort_order; 28extern const char *sort_order;
29extern char default_parent_pattern[]; 29extern const char default_parent_pattern[];
30extern char *parent_pattern; 30extern const char *parent_pattern;
31extern char default_sort_order[]; 31extern const char default_sort_order[];
32extern int sort__need_collapse; 32extern int sort__need_collapse;
33extern int sort__has_parent; 33extern int sort__has_parent;
34extern char *field_sep; 34extern char *field_sep;
@@ -43,19 +43,24 @@ extern enum sort_type sort__first_dimension;
43 43
44struct hist_entry { 44struct hist_entry {
45 struct rb_node rb_node; 45 struct rb_node rb_node;
46 u64 count; 46 u64 period;
47 u64 period_sys;
48 u64 period_us;
49 u64 period_guest_sys;
50 u64 period_guest_us;
51 struct map_symbol ms;
47 struct thread *thread; 52 struct thread *thread;
48 struct map *map;
49 struct symbol *sym;
50 u64 ip; 53 u64 ip;
54 u32 nr_events;
51 char level; 55 char level;
52 struct symbol *parent; 56 u8 filtered;
53 struct callchain_node callchain; 57 struct symbol *parent;
54 union { 58 union {
55 unsigned long position; 59 unsigned long position;
56 struct hist_entry *pair; 60 struct hist_entry *pair;
57 struct rb_root sorted_chain; 61 struct rb_root sorted_chain;
58 }; 62 };
63 struct callchain_node callchain[0];
59}; 64};
60 65
61enum sort_type { 66enum sort_type {
@@ -73,12 +78,13 @@ enum sort_type {
73struct sort_entry { 78struct sort_entry {
74 struct list_head list; 79 struct list_head list;
75 80
76 const char *header; 81 const char *se_header;
77 82
78 int64_t (*cmp)(struct hist_entry *, struct hist_entry *); 83 int64_t (*se_cmp)(struct hist_entry *, struct hist_entry *);
79 int64_t (*collapse)(struct hist_entry *, struct hist_entry *); 84 int64_t (*se_collapse)(struct hist_entry *, struct hist_entry *);
80 size_t (*print)(FILE *fp, struct hist_entry *, unsigned int width); 85 int (*se_snprintf)(struct hist_entry *self, char *bf, size_t size,
81 unsigned int *width; 86 unsigned int width);
87 unsigned int *se_width;
82 bool elide; 88 bool elide;
83}; 89};
84 90
@@ -87,7 +93,6 @@ extern struct list_head hist_entry__sort_list;
87 93
88void setup_sorting(const char * const usagestr[], const struct option *opts); 94void setup_sorting(const char * const usagestr[], const struct option *opts);
89 95
90extern int repsep_fprintf(FILE *fp, const char *fmt, ...);
91extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int); 96extern size_t sort__thread_print(FILE *, struct hist_entry *, unsigned int);
92extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int); 97extern size_t sort__comm_print(FILE *, struct hist_entry *, unsigned int);
93extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int); 98extern size_t sort__dso_print(FILE *, struct hist_entry *, unsigned int);
diff --git a/tools/perf/util/strbuf.c b/tools/perf/util/strbuf.c
index 5249d5a1b0c2..92e068517c1a 100644
--- a/tools/perf/util/strbuf.c
+++ b/tools/perf/util/strbuf.c
@@ -41,16 +41,6 @@ char *strbuf_detach(struct strbuf *sb, size_t *sz)
41 return res; 41 return res;
42} 42}
43 43
44void strbuf_attach(struct strbuf *sb, void *buf, size_t len, size_t alloc)
45{
46 strbuf_release(sb);
47 sb->buf = buf;
48 sb->len = len;
49 sb->alloc = alloc;
50 strbuf_grow(sb, 0);
51 sb->buf[sb->len] = '\0';
52}
53
54void strbuf_grow(struct strbuf *sb, size_t extra) 44void strbuf_grow(struct strbuf *sb, size_t extra)
55{ 45{
56 if (sb->len + extra + 1 <= sb->len) 46 if (sb->len + extra + 1 <= sb->len)
@@ -60,94 +50,7 @@ void strbuf_grow(struct strbuf *sb, size_t extra)
60 ALLOC_GROW(sb->buf, sb->len + extra + 1, sb->alloc); 50 ALLOC_GROW(sb->buf, sb->len + extra + 1, sb->alloc);
61} 51}
62 52
63void strbuf_trim(struct strbuf *sb) 53static void strbuf_splice(struct strbuf *sb, size_t pos, size_t len,
64{
65 char *b = sb->buf;
66 while (sb->len > 0 && isspace((unsigned char)sb->buf[sb->len - 1]))
67 sb->len--;
68 while (sb->len > 0 && isspace(*b)) {
69 b++;
70 sb->len--;
71 }
72 memmove(sb->buf, b, sb->len);
73 sb->buf[sb->len] = '\0';
74}
75void strbuf_rtrim(struct strbuf *sb)
76{
77 while (sb->len > 0 && isspace((unsigned char)sb->buf[sb->len - 1]))
78 sb->len--;
79 sb->buf[sb->len] = '\0';
80}
81
82void strbuf_ltrim(struct strbuf *sb)
83{
84 char *b = sb->buf;
85 while (sb->len > 0 && isspace(*b)) {
86 b++;
87 sb->len--;
88 }
89 memmove(sb->buf, b, sb->len);
90 sb->buf[sb->len] = '\0';
91}
92
93void strbuf_tolower(struct strbuf *sb)
94{
95 unsigned int i;
96
97 for (i = 0; i < sb->len; i++)
98 sb->buf[i] = tolower(sb->buf[i]);
99}
100
101struct strbuf **strbuf_split(const struct strbuf *sb, int delim)
102{
103 int alloc = 2, pos = 0;
104 char *n, *p;
105 struct strbuf **ret;
106 struct strbuf *t;
107
108 ret = calloc(alloc, sizeof(struct strbuf *));
109 p = n = sb->buf;
110 while (n < sb->buf + sb->len) {
111 int len;
112 n = memchr(n, delim, sb->len - (n - sb->buf));
113 if (pos + 1 >= alloc) {
114 alloc = alloc * 2;
115 ret = realloc(ret, sizeof(struct strbuf *) * alloc);
116 }
117 if (!n)
118 n = sb->buf + sb->len - 1;
119 len = n - p + 1;
120 t = malloc(sizeof(struct strbuf));
121 strbuf_init(t, len);
122 strbuf_add(t, p, len);
123 ret[pos] = t;
124 ret[++pos] = NULL;
125 p = ++n;
126 }
127 return ret;
128}
129
130void strbuf_list_free(struct strbuf **sbs)
131{
132 struct strbuf **s = sbs;
133
134 while (*s) {
135 strbuf_release(*s);
136 free(*s++);
137 }
138 free(sbs);
139}
140
141int strbuf_cmp(const struct strbuf *a, const struct strbuf *b)
142{
143 int len = a->len < b->len ? a->len: b->len;
144 int cmp = memcmp(a->buf, b->buf, len);
145 if (cmp)
146 return cmp;
147 return a->len < b->len ? -1: a->len != b->len;
148}
149
150void strbuf_splice(struct strbuf *sb, size_t pos, size_t len,
151 const void *data, size_t dlen) 54 const void *data, size_t dlen)
152{ 55{
153 if (pos + len < pos) 56 if (pos + len < pos)
@@ -166,11 +69,6 @@ void strbuf_splice(struct strbuf *sb, size_t pos, size_t len,
166 strbuf_setlen(sb, sb->len + dlen - len); 69 strbuf_setlen(sb, sb->len + dlen - len);
167} 70}
168 71
169void strbuf_insert(struct strbuf *sb, size_t pos, const void *data, size_t len)
170{
171 strbuf_splice(sb, pos, 0, data, len);
172}
173
174void strbuf_remove(struct strbuf *sb, size_t pos, size_t len) 72void strbuf_remove(struct strbuf *sb, size_t pos, size_t len)
175{ 73{
176 strbuf_splice(sb, pos, len, NULL, 0); 74 strbuf_splice(sb, pos, len, NULL, 0);
@@ -183,13 +81,6 @@ void strbuf_add(struct strbuf *sb, const void *data, size_t len)
183 strbuf_setlen(sb, sb->len + len); 81 strbuf_setlen(sb, sb->len + len);
184} 82}
185 83
186void strbuf_adddup(struct strbuf *sb, size_t pos, size_t len)
187{
188 strbuf_grow(sb, len);
189 memcpy(sb->buf + sb->len, sb->buf + pos, len);
190 strbuf_setlen(sb, sb->len + len);
191}
192
193void strbuf_addf(struct strbuf *sb, const char *fmt, ...) 84void strbuf_addf(struct strbuf *sb, const char *fmt, ...)
194{ 85{
195 int len; 86 int len;
@@ -214,57 +105,6 @@ void strbuf_addf(struct strbuf *sb, const char *fmt, ...)
214 strbuf_setlen(sb, sb->len + len); 105 strbuf_setlen(sb, sb->len + len);
215} 106}
216 107
217void strbuf_expand(struct strbuf *sb, const char *format, expand_fn_t fn,
218 void *context)
219{
220 for (;;) {
221 const char *percent;
222 size_t consumed;
223
224 percent = strchrnul(format, '%');
225 strbuf_add(sb, format, percent - format);
226 if (!*percent)
227 break;
228 format = percent + 1;
229
230 consumed = fn(sb, format, context);
231 if (consumed)
232 format += consumed;
233 else
234 strbuf_addch(sb, '%');
235 }
236}
237
238size_t strbuf_expand_dict_cb(struct strbuf *sb, const char *placeholder,
239 void *context)
240{
241 struct strbuf_expand_dict_entry *e = context;
242 size_t len;
243
244 for (; e->placeholder && (len = strlen(e->placeholder)); e++) {
245 if (!strncmp(placeholder, e->placeholder, len)) {
246 if (e->value)
247 strbuf_addstr(sb, e->value);
248 return len;
249 }
250 }
251 return 0;
252}
253
254size_t strbuf_fread(struct strbuf *sb, size_t size, FILE *f)
255{
256 size_t res;
257 size_t oldalloc = sb->alloc;
258
259 strbuf_grow(sb, size);
260 res = fread(sb->buf + sb->len, 1, size, f);
261 if (res > 0)
262 strbuf_setlen(sb, sb->len + res);
263 else if (oldalloc == 0)
264 strbuf_release(sb);
265 return res;
266}
267
268ssize_t strbuf_read(struct strbuf *sb, int fd, ssize_t hint) 108ssize_t strbuf_read(struct strbuf *sb, int fd, ssize_t hint)
269{ 109{
270 size_t oldlen = sb->len; 110 size_t oldlen = sb->len;
@@ -291,70 +131,3 @@ ssize_t strbuf_read(struct strbuf *sb, int fd, ssize_t hint)
291 sb->buf[sb->len] = '\0'; 131 sb->buf[sb->len] = '\0';
292 return sb->len - oldlen; 132 return sb->len - oldlen;
293} 133}
294
295#define STRBUF_MAXLINK (2*PATH_MAX)
296
297int strbuf_readlink(struct strbuf *sb, const char *path, ssize_t hint)
298{
299 size_t oldalloc = sb->alloc;
300
301 if (hint < 32)
302 hint = 32;
303
304 while (hint < STRBUF_MAXLINK) {
305 ssize_t len;
306
307 strbuf_grow(sb, hint);
308 len = readlink(path, sb->buf, hint);
309 if (len < 0) {
310 if (errno != ERANGE)
311 break;
312 } else if (len < hint) {
313 strbuf_setlen(sb, len);
314 return 0;
315 }
316
317 /* .. the buffer was too small - try again */
318 hint *= 2;
319 }
320 if (oldalloc == 0)
321 strbuf_release(sb);
322 return -1;
323}
324
325int strbuf_getline(struct strbuf *sb, FILE *fp, int term)
326{
327 int ch;
328
329 strbuf_grow(sb, 0);
330 if (feof(fp))
331 return EOF;
332
333 strbuf_reset(sb);
334 while ((ch = fgetc(fp)) != EOF) {
335 if (ch == term)
336 break;
337 strbuf_grow(sb, 1);
338 sb->buf[sb->len++] = ch;
339 }
340 if (ch == EOF && sb->len == 0)
341 return EOF;
342
343 sb->buf[sb->len] = '\0';
344 return 0;
345}
346
347int strbuf_read_file(struct strbuf *sb, const char *path, ssize_t hint)
348{
349 int fd, len;
350
351 fd = open(path, O_RDONLY);
352 if (fd < 0)
353 return -1;
354 len = strbuf_read(sb, fd, hint);
355 close(fd);
356 if (len < 0)
357 return -1;
358
359 return len;
360}
diff --git a/tools/perf/util/strbuf.h b/tools/perf/util/strbuf.h
index a3d121d6c83e..436ac319f6c7 100644
--- a/tools/perf/util/strbuf.h
+++ b/tools/perf/util/strbuf.h
@@ -53,12 +53,6 @@ struct strbuf {
53extern void strbuf_init(struct strbuf *buf, ssize_t hint); 53extern void strbuf_init(struct strbuf *buf, ssize_t hint);
54extern void strbuf_release(struct strbuf *); 54extern void strbuf_release(struct strbuf *);
55extern char *strbuf_detach(struct strbuf *, size_t *); 55extern char *strbuf_detach(struct strbuf *, size_t *);
56extern void strbuf_attach(struct strbuf *, void *, size_t, size_t);
57static inline void strbuf_swap(struct strbuf *a, struct strbuf *b) {
58 struct strbuf tmp = *a;
59 *a = *b;
60 *b = tmp;
61}
62 56
63/*----- strbuf size related -----*/ 57/*----- strbuf size related -----*/
64static inline ssize_t strbuf_avail(const struct strbuf *sb) { 58static inline ssize_t strbuf_avail(const struct strbuf *sb) {
@@ -74,17 +68,6 @@ static inline void strbuf_setlen(struct strbuf *sb, size_t len) {
74 sb->len = len; 68 sb->len = len;
75 sb->buf[len] = '\0'; 69 sb->buf[len] = '\0';
76} 70}
77#define strbuf_reset(sb) strbuf_setlen(sb, 0)
78
79/*----- content related -----*/
80extern void strbuf_trim(struct strbuf *);
81extern void strbuf_rtrim(struct strbuf *);
82extern void strbuf_ltrim(struct strbuf *);
83extern int strbuf_cmp(const struct strbuf *, const struct strbuf *);
84extern void strbuf_tolower(struct strbuf *);
85
86extern struct strbuf **strbuf_split(const struct strbuf *, int delim);
87extern void strbuf_list_free(struct strbuf **);
88 71
89/*----- add data in your buffer -----*/ 72/*----- add data in your buffer -----*/
90static inline void strbuf_addch(struct strbuf *sb, int c) { 73static inline void strbuf_addch(struct strbuf *sb, int c) {
@@ -93,45 +76,17 @@ static inline void strbuf_addch(struct strbuf *sb, int c) {
93 sb->buf[sb->len] = '\0'; 76 sb->buf[sb->len] = '\0';
94} 77}
95 78
96extern void strbuf_insert(struct strbuf *, size_t pos, const void *, size_t);
97extern void strbuf_remove(struct strbuf *, size_t pos, size_t len); 79extern void strbuf_remove(struct strbuf *, size_t pos, size_t len);
98 80
99/* splice pos..pos+len with given data */
100extern void strbuf_splice(struct strbuf *, size_t pos, size_t len,
101 const void *, size_t);
102
103extern void strbuf_add(struct strbuf *, const void *, size_t); 81extern void strbuf_add(struct strbuf *, const void *, size_t);
104static inline void strbuf_addstr(struct strbuf *sb, const char *s) { 82static inline void strbuf_addstr(struct strbuf *sb, const char *s) {
105 strbuf_add(sb, s, strlen(s)); 83 strbuf_add(sb, s, strlen(s));
106} 84}
107static inline void strbuf_addbuf(struct strbuf *sb, const struct strbuf *sb2) {
108 strbuf_add(sb, sb2->buf, sb2->len);
109}
110extern void strbuf_adddup(struct strbuf *sb, size_t pos, size_t len);
111
112typedef size_t (*expand_fn_t) (struct strbuf *sb, const char *placeholder, void *context);
113extern void strbuf_expand(struct strbuf *sb, const char *format, expand_fn_t fn, void *context);
114struct strbuf_expand_dict_entry {
115 const char *placeholder;
116 const char *value;
117};
118extern size_t strbuf_expand_dict_cb(struct strbuf *sb, const char *placeholder, void *context);
119 85
120__attribute__((format(printf,2,3))) 86__attribute__((format(printf,2,3)))
121extern void strbuf_addf(struct strbuf *sb, const char *fmt, ...); 87extern void strbuf_addf(struct strbuf *sb, const char *fmt, ...);
122 88
123extern size_t strbuf_fread(struct strbuf *, size_t, FILE *);
124/* XXX: if read fails, any partial read is undone */ 89/* XXX: if read fails, any partial read is undone */
125extern ssize_t strbuf_read(struct strbuf *, int fd, ssize_t hint); 90extern ssize_t strbuf_read(struct strbuf *, int fd, ssize_t hint);
126extern int strbuf_read_file(struct strbuf *sb, const char *path, ssize_t hint);
127extern int strbuf_readlink(struct strbuf *sb, const char *path, ssize_t hint);
128
129extern int strbuf_getline(struct strbuf *, FILE *, int);
130
131extern void stripspace(struct strbuf *buf, int skip_comments);
132extern int launch_editor(const char *path, struct strbuf *buffer, const char *const *env);
133
134extern int strbuf_branchname(struct strbuf *sb, const char *name);
135extern int strbuf_check_branch_ref(struct strbuf *sb, const char *name);
136 91
137#endif /* __PERF_STRBUF_H */ 92#endif /* __PERF_STRBUF_H */
diff --git a/tools/perf/util/string.c b/tools/perf/util/string.c
index 5352d7dccc61..0409fc7c0058 100644
--- a/tools/perf/util/string.c
+++ b/tools/perf/util/string.c
@@ -1,48 +1,5 @@
1#include "string.h"
2#include "util.h" 1#include "util.h"
3 2#include "string.h"
4static int hex(char ch)
5{
6 if ((ch >= '0') && (ch <= '9'))
7 return ch - '0';
8 if ((ch >= 'a') && (ch <= 'f'))
9 return ch - 'a' + 10;
10 if ((ch >= 'A') && (ch <= 'F'))
11 return ch - 'A' + 10;
12 return -1;
13}
14
15/*
16 * While we find nice hex chars, build a long_val.
17 * Return number of chars processed.
18 */
19int hex2u64(const char *ptr, u64 *long_val)
20{
21 const char *p = ptr;
22 *long_val = 0;
23
24 while (*p) {
25 const int hex_val = hex(*p);
26
27 if (hex_val < 0)
28 break;
29
30 *long_val = (*long_val << 4) | hex_val;
31 p++;
32 }
33
34 return p - ptr;
35}
36
37char *strxfrchar(char *s, char from, char to)
38{
39 char *p = s;
40
41 while ((p = strchr(p, from)) != NULL)
42 *p++ = to;
43
44 return s;
45}
46 3
47#define K 1024LL 4#define K 1024LL
48/* 5/*
@@ -227,16 +184,73 @@ fail:
227 return NULL; 184 return NULL;
228} 185}
229 186
230/* Glob expression pattern matching */ 187/* Character class matching */
231bool strglobmatch(const char *str, const char *pat) 188static bool __match_charclass(const char *pat, char c, const char **npat)
189{
190 bool complement = false, ret = true;
191
192 if (*pat == '!') {
193 complement = true;
194 pat++;
195 }
196 if (*pat++ == c) /* First character is special */
197 goto end;
198
199 while (*pat && *pat != ']') { /* Matching */
200 if (*pat == '-' && *(pat + 1) != ']') { /* Range */
201 if (*(pat - 1) <= c && c <= *(pat + 1))
202 goto end;
203 if (*(pat - 1) > *(pat + 1))
204 goto error;
205 pat += 2;
206 } else if (*pat++ == c)
207 goto end;
208 }
209 if (!*pat)
210 goto error;
211 ret = false;
212
213end:
214 while (*pat && *pat != ']') /* Searching closing */
215 pat++;
216 if (!*pat)
217 goto error;
218 *npat = pat + 1;
219 return complement ? !ret : ret;
220
221error:
222 return false;
223}
224
225/* Glob/lazy pattern matching */
226static bool __match_glob(const char *str, const char *pat, bool ignore_space)
232{ 227{
233 while (*str && *pat && *pat != '*') { 228 while (*str && *pat && *pat != '*') {
234 if (*pat == '?') { 229 if (ignore_space) {
230 /* Ignore spaces for lazy matching */
231 if (isspace(*str)) {
232 str++;
233 continue;
234 }
235 if (isspace(*pat)) {
236 pat++;
237 continue;
238 }
239 }
240 if (*pat == '?') { /* Matches any single character */
235 str++; 241 str++;
236 pat++; 242 pat++;
237 } else 243 continue;
238 if (*str++ != *pat++) 244 } else if (*pat == '[') /* Character classes/Ranges */
245 if (__match_charclass(pat + 1, *str, &pat)) {
246 str++;
247 continue;
248 } else
239 return false; 249 return false;
250 else if (*pat == '\\') /* Escaped char match as normal char */
251 pat++;
252 if (*str++ != *pat++)
253 return false;
240 } 254 }
241 /* Check wild card */ 255 /* Check wild card */
242 if (*pat == '*') { 256 if (*pat == '*') {
@@ -251,3 +265,32 @@ bool strglobmatch(const char *str, const char *pat)
251 return !*str && !*pat; 265 return !*str && !*pat;
252} 266}
253 267
268/**
269 * strglobmatch - glob expression pattern matching
270 * @str: the target string to match
271 * @pat: the pattern string to match
272 *
273 * This returns true if the @str matches @pat. @pat can includes wildcards
274 * ('*','?') and character classes ([CHARS], complementation and ranges are
275 * also supported). Also, this supports escape character ('\') to use special
276 * characters as normal character.
277 *
278 * Note: if @pat syntax is broken, this always returns false.
279 */
280bool strglobmatch(const char *str, const char *pat)
281{
282 return __match_glob(str, pat, false);
283}
284
285/**
286 * strlazymatch - matching pattern strings lazily with glob pattern
287 * @str: the target string to match
288 * @pat: the pattern string to match
289 *
290 * This is similar to strglobmatch, except this ignores spaces in
291 * the target string.
292 */
293bool strlazymatch(const char *str, const char *pat)
294{
295 return __match_glob(str, pat, true);
296}
diff --git a/tools/perf/util/string.h b/tools/perf/util/string.h
deleted file mode 100644
index 02ede58c54b4..000000000000
--- a/tools/perf/util/string.h
+++ /dev/null
@@ -1,17 +0,0 @@
1#ifndef __PERF_STRING_H_
2#define __PERF_STRING_H_
3
4#include <stdbool.h>
5#include "types.h"
6
7int hex2u64(const char *ptr, u64 *val);
8char *strxfrchar(char *s, char from, char to);
9s64 perf_atoll(const char *str);
10char **argv_split(const char *str, int *argcp);
11void argv_free(char **argv);
12bool strglobmatch(const char *str, const char *pat);
13
14#define _STR(x) #x
15#define STR(x) _STR(x)
16
17#endif /* __PERF_STRING_H */
diff --git a/tools/perf/util/symbol.c b/tools/perf/util/symbol.c
index ab92763edb03..5b276833e2bf 100644
--- a/tools/perf/util/symbol.c
+++ b/tools/perf/util/symbol.c
@@ -1,14 +1,20 @@
1#include "util.h" 1#define _GNU_SOURCE
2#include "../perf.h" 2#include <ctype.h>
3#include "session.h" 3#include <dirent.h>
4#include "sort.h" 4#include <errno.h>
5#include "string.h" 5#include <libgen.h>
6#include <stdlib.h>
7#include <stdio.h>
8#include <string.h>
9#include <sys/types.h>
10#include <sys/stat.h>
11#include <sys/param.h>
12#include <fcntl.h>
13#include <unistd.h>
14#include "build-id.h"
6#include "symbol.h" 15#include "symbol.h"
7#include "thread.h" 16#include "strlist.h"
8 17
9#include "debug.h"
10
11#include <asm/bug.h>
12#include <libelf.h> 18#include <libelf.h>
13#include <gelf.h> 19#include <gelf.h>
14#include <elf.h> 20#include <elf.h>
@@ -19,21 +25,12 @@
19#define NT_GNU_BUILD_ID 3 25#define NT_GNU_BUILD_ID 3
20#endif 26#endif
21 27
22enum dso_origin {
23 DSO__ORIG_KERNEL = 0,
24 DSO__ORIG_JAVA_JIT,
25 DSO__ORIG_FEDORA,
26 DSO__ORIG_UBUNTU,
27 DSO__ORIG_BUILDID,
28 DSO__ORIG_DSO,
29 DSO__ORIG_KMODULE,
30 DSO__ORIG_NOT_FOUND,
31};
32
33static void dsos__add(struct list_head *head, struct dso *dso); 28static void dsos__add(struct list_head *head, struct dso *dso);
34static struct map *map__new2(u64 start, struct dso *dso, enum map_type type); 29static struct map *map__new2(u64 start, struct dso *dso, enum map_type type);
35static int dso__load_kernel_sym(struct dso *self, struct map *map, 30static int dso__load_kernel_sym(struct dso *self, struct map *map,
36 struct perf_session *session, symbol_filter_t filter); 31 symbol_filter_t filter);
32static int dso__load_guest_kernel_sym(struct dso *self, struct map *map,
33 symbol_filter_t filter);
37static int vmlinux_path__nr_entries; 34static int vmlinux_path__nr_entries;
38static char **vmlinux_path; 35static char **vmlinux_path;
39 36
@@ -53,17 +50,12 @@ bool dso__sorted_by_name(const struct dso *self, enum map_type type)
53 return self->sorted_by_name & (1 << type); 50 return self->sorted_by_name & (1 << type);
54} 51}
55 52
56static void dso__set_loaded(struct dso *self, enum map_type type)
57{
58 self->loaded |= (1 << type);
59}
60
61static void dso__set_sorted_by_name(struct dso *self, enum map_type type) 53static void dso__set_sorted_by_name(struct dso *self, enum map_type type)
62{ 54{
63 self->sorted_by_name |= (1 << type); 55 self->sorted_by_name |= (1 << type);
64} 56}
65 57
66static bool symbol_type__is_a(char symbol_type, enum map_type map_type) 58bool symbol_type__is_a(char symbol_type, enum map_type map_type)
67{ 59{
68 switch (map_type) { 60 switch (map_type) {
69 case MAP__FUNCTION: 61 case MAP__FUNCTION:
@@ -131,25 +123,26 @@ static void map_groups__fixup_end(struct map_groups *self)
131static struct symbol *symbol__new(u64 start, u64 len, const char *name) 123static struct symbol *symbol__new(u64 start, u64 len, const char *name)
132{ 124{
133 size_t namelen = strlen(name) + 1; 125 size_t namelen = strlen(name) + 1;
134 struct symbol *self = zalloc(symbol_conf.priv_size + 126 struct symbol *self = calloc(1, (symbol_conf.priv_size +
135 sizeof(*self) + namelen); 127 sizeof(*self) + namelen));
136 if (self == NULL) 128 if (self == NULL)
137 return NULL; 129 return NULL;
138 130
139 if (symbol_conf.priv_size) 131 if (symbol_conf.priv_size)
140 self = ((void *)self) + symbol_conf.priv_size; 132 self = ((void *)self) + symbol_conf.priv_size;
141 133
142 self->start = start; 134 self->start = start;
143 self->end = len ? start + len - 1 : start; 135 self->end = len ? start + len - 1 : start;
136 self->namelen = namelen - 1;
144 137
145 pr_debug3("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end); 138 pr_debug4("%s: %s %#Lx-%#Lx\n", __func__, name, start, self->end);
146 139
147 memcpy(self->name, name, namelen); 140 memcpy(self->name, name, namelen);
148 141
149 return self; 142 return self;
150} 143}
151 144
152static void symbol__delete(struct symbol *self) 145void symbol__delete(struct symbol *self)
153{ 146{
154 free(((void *)self) - symbol_conf.priv_size); 147 free(((void *)self) - symbol_conf.priv_size);
155} 148}
@@ -160,7 +153,7 @@ static size_t symbol__fprintf(struct symbol *self, FILE *fp)
160 self->start, self->end, self->name); 153 self->start, self->end, self->name);
161} 154}
162 155
163static void dso__set_long_name(struct dso *self, char *name) 156void dso__set_long_name(struct dso *self, char *name)
164{ 157{
165 if (name == NULL) 158 if (name == NULL)
166 return; 159 return;
@@ -168,20 +161,28 @@ static void dso__set_long_name(struct dso *self, char *name)
168 self->long_name_len = strlen(name); 161 self->long_name_len = strlen(name);
169} 162}
170 163
164static void dso__set_short_name(struct dso *self, const char *name)
165{
166 if (name == NULL)
167 return;
168 self->short_name = name;
169 self->short_name_len = strlen(name);
170}
171
171static void dso__set_basename(struct dso *self) 172static void dso__set_basename(struct dso *self)
172{ 173{
173 self->short_name = basename(self->long_name); 174 dso__set_short_name(self, basename(self->long_name));
174} 175}
175 176
176struct dso *dso__new(const char *name) 177struct dso *dso__new(const char *name)
177{ 178{
178 struct dso *self = malloc(sizeof(*self) + strlen(name) + 1); 179 struct dso *self = calloc(1, sizeof(*self) + strlen(name) + 1);
179 180
180 if (self != NULL) { 181 if (self != NULL) {
181 int i; 182 int i;
182 strcpy(self->name, name); 183 strcpy(self->name, name);
183 dso__set_long_name(self, self->name); 184 dso__set_long_name(self, self->name);
184 self->short_name = self->name; 185 dso__set_short_name(self, self->name);
185 for (i = 0; i < MAP__NR_TYPES; ++i) 186 for (i = 0; i < MAP__NR_TYPES; ++i)
186 self->symbols[i] = self->symbol_names[i] = RB_ROOT; 187 self->symbols[i] = self->symbol_names[i] = RB_ROOT;
187 self->slen_calculated = 0; 188 self->slen_calculated = 0;
@@ -189,6 +190,8 @@ struct dso *dso__new(const char *name)
189 self->loaded = 0; 190 self->loaded = 0;
190 self->sorted_by_name = 0; 191 self->sorted_by_name = 0;
191 self->has_build_id = 0; 192 self->has_build_id = 0;
193 self->kernel = DSO_TYPE_USER;
194 INIT_LIST_HEAD(&self->node);
192 } 195 }
193 196
194 return self; 197 return self;
@@ -344,10 +347,10 @@ void dso__sort_by_name(struct dso *self, enum map_type type)
344 &self->symbols[type]); 347 &self->symbols[type]);
345} 348}
346 349
347int build_id__sprintf(u8 *self, int len, char *bf) 350int build_id__sprintf(const u8 *self, int len, char *bf)
348{ 351{
349 char *bid = bf; 352 char *bid = bf;
350 u8 *raw = self; 353 const u8 *raw = self;
351 int i; 354 int i;
352 355
353 for (i = 0; i < len; ++i) { 356 for (i = 0; i < len; ++i) {
@@ -372,6 +375,10 @@ size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp)
372 struct rb_node *nd; 375 struct rb_node *nd;
373 size_t ret = fprintf(fp, "dso: %s (", self->short_name); 376 size_t ret = fprintf(fp, "dso: %s (", self->short_name);
374 377
378 if (self->short_name != self->long_name)
379 ret += fprintf(fp, "%s, ", self->long_name);
380 ret += fprintf(fp, "%s, %sloaded, ", map_type__name[type],
381 self->loaded ? "" : "NOT ");
375 ret += dso__fprintf_buildid(self, fp); 382 ret += dso__fprintf_buildid(self, fp);
376 ret += fprintf(fp, ")\n"); 383 ret += fprintf(fp, ")\n");
377 for (nd = rb_first(&self->symbols[type]); nd; nd = rb_next(nd)) { 384 for (nd = rb_first(&self->symbols[type]); nd; nd = rb_next(nd)) {
@@ -382,35 +389,28 @@ size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp)
382 return ret; 389 return ret;
383} 390}
384 391
385/* 392int kallsyms__parse(const char *filename, void *arg,
386 * Loads the function entries in /proc/kallsyms into kernel_map->dso, 393 int (*process_symbol)(void *arg, const char *name,
387 * so that we can in the next step set the symbol ->end address and then 394 char type, u64 start))
388 * call kernel_maps__split_kallsyms.
389 */
390static int dso__load_all_kallsyms(struct dso *self, struct map *map)
391{ 395{
392 char *line = NULL; 396 char *line = NULL;
393 size_t n; 397 size_t n;
394 struct rb_root *root = &self->symbols[map->type]; 398 int err = 0;
395 FILE *file = fopen("/proc/kallsyms", "r"); 399 FILE *file = fopen(filename, "r");
396 400
397 if (file == NULL) 401 if (file == NULL)
398 goto out_failure; 402 goto out_failure;
399 403
400 while (!feof(file)) { 404 while (!feof(file)) {
401 u64 start; 405 u64 start;
402 struct symbol *sym;
403 int line_len, len; 406 int line_len, len;
404 char symbol_type; 407 char symbol_type;
405 char *symbol_name; 408 char *symbol_name;
406 409
407 line_len = getline(&line, &n, file); 410 line_len = getline(&line, &n, file);
408 if (line_len < 0) 411 if (line_len < 0 || !line)
409 break; 412 break;
410 413
411 if (!line)
412 goto out_failure;
413
414 line[--line_len] = '\0'; /* \n */ 414 line[--line_len] = '\0'; /* \n */
415 415
416 len = hex2u64(line, &start); 416 len = hex2u64(line, &start);
@@ -420,43 +420,74 @@ static int dso__load_all_kallsyms(struct dso *self, struct map *map)
420 continue; 420 continue;
421 421
422 symbol_type = toupper(line[len]); 422 symbol_type = toupper(line[len]);
423 if (!symbol_type__is_a(symbol_type, map->type))
424 continue;
425
426 symbol_name = line + len + 2; 423 symbol_name = line + len + 2;
427 /*
428 * Will fix up the end later, when we have all symbols sorted.
429 */
430 sym = symbol__new(start, 0, symbol_name);
431 424
432 if (sym == NULL) 425 err = process_symbol(arg, symbol_name, symbol_type, start);
433 goto out_delete_line; 426 if (err)
434 /* 427 break;
435 * We will pass the symbols to the filter later, in
436 * map__split_kallsyms, when we have split the maps per module
437 */
438 symbols__insert(root, sym);
439 } 428 }
440 429
441 free(line); 430 free(line);
442 fclose(file); 431 fclose(file);
432 return err;
443 433
444 return 0;
445
446out_delete_line:
447 free(line);
448out_failure: 434out_failure:
449 return -1; 435 return -1;
450} 436}
451 437
438struct process_kallsyms_args {
439 struct map *map;
440 struct dso *dso;
441};
442
443static int map__process_kallsym_symbol(void *arg, const char *name,
444 char type, u64 start)
445{
446 struct symbol *sym;
447 struct process_kallsyms_args *a = arg;
448 struct rb_root *root = &a->dso->symbols[a->map->type];
449
450 if (!symbol_type__is_a(type, a->map->type))
451 return 0;
452
453 /*
454 * Will fix up the end later, when we have all symbols sorted.
455 */
456 sym = symbol__new(start, 0, name);
457
458 if (sym == NULL)
459 return -ENOMEM;
460 /*
461 * We will pass the symbols to the filter later, in
462 * map__split_kallsyms, when we have split the maps per module
463 */
464 symbols__insert(root, sym);
465
466 return 0;
467}
468
469/*
470 * Loads the function entries in /proc/kallsyms into kernel_map->dso,
471 * so that we can in the next step set the symbol ->end address and then
472 * call kernel_maps__split_kallsyms.
473 */
474static int dso__load_all_kallsyms(struct dso *self, const char *filename,
475 struct map *map)
476{
477 struct process_kallsyms_args args = { .map = map, .dso = self, };
478 return kallsyms__parse(filename, &args, map__process_kallsym_symbol);
479}
480
452/* 481/*
453 * Split the symbols into maps, making sure there are no overlaps, i.e. the 482 * Split the symbols into maps, making sure there are no overlaps, i.e. the
454 * kernel range is broken in several maps, named [kernel].N, as we don't have 483 * kernel range is broken in several maps, named [kernel].N, as we don't have
455 * the original ELF section names vmlinux have. 484 * the original ELF section names vmlinux have.
456 */ 485 */
457static int dso__split_kallsyms(struct dso *self, struct map *map, 486static int dso__split_kallsyms(struct dso *self, struct map *map,
458 struct perf_session *session, symbol_filter_t filter) 487 symbol_filter_t filter)
459{ 488{
489 struct map_groups *kmaps = map__kmap(map)->kmaps;
490 struct machine *machine = kmaps->machine;
460 struct map *curr_map = map; 491 struct map *curr_map = map;
461 struct symbol *pos; 492 struct symbol *pos;
462 int count = 0; 493 int count = 0;
@@ -477,13 +508,35 @@ static int dso__split_kallsyms(struct dso *self, struct map *map,
477 508
478 *module++ = '\0'; 509 *module++ = '\0';
479 510
480 if (strcmp(self->name, module)) { 511 if (strcmp(curr_map->dso->short_name, module)) {
481 curr_map = map_groups__find_by_name(&session->kmaps, map->type, module); 512 if (curr_map != map &&
513 self->kernel == DSO_TYPE_GUEST_KERNEL &&
514 machine__is_default_guest(machine)) {
515 /*
516 * We assume all symbols of a module are
517 * continuous in * kallsyms, so curr_map
518 * points to a module and all its
519 * symbols are in its kmap. Mark it as
520 * loaded.
521 */
522 dso__set_loaded(curr_map->dso,
523 curr_map->type);
524 }
525
526 curr_map = map_groups__find_by_name(kmaps,
527 map->type, module);
482 if (curr_map == NULL) { 528 if (curr_map == NULL) {
483 pr_debug("/proc/{kallsyms,modules} " 529 pr_debug("%s/proc/{kallsyms,modules} "
484 "inconsistency!\n"); 530 "inconsistency while looking "
485 return -1; 531 "for \"%s\" module!\n",
532 machine->root_dir, module);
533 curr_map = map;
534 goto discard_symbol;
486 } 535 }
536
537 if (curr_map->dso->loaded &&
538 !machine__is_default_guest(machine))
539 goto discard_symbol;
487 } 540 }
488 /* 541 /*
489 * So that we look just like we get from .ko files, 542 * So that we look just like we get from .ko files,
@@ -495,21 +548,29 @@ static int dso__split_kallsyms(struct dso *self, struct map *map,
495 char dso_name[PATH_MAX]; 548 char dso_name[PATH_MAX];
496 struct dso *dso; 549 struct dso *dso;
497 550
498 snprintf(dso_name, sizeof(dso_name), "[kernel].%d", 551 if (self->kernel == DSO_TYPE_GUEST_KERNEL)
499 kernel_range++); 552 snprintf(dso_name, sizeof(dso_name),
553 "[guest.kernel].%d",
554 kernel_range++);
555 else
556 snprintf(dso_name, sizeof(dso_name),
557 "[kernel].%d",
558 kernel_range++);
500 559
501 dso = dso__new(dso_name); 560 dso = dso__new(dso_name);
502 if (dso == NULL) 561 if (dso == NULL)
503 return -1; 562 return -1;
504 563
564 dso->kernel = self->kernel;
565
505 curr_map = map__new2(pos->start, dso, map->type); 566 curr_map = map__new2(pos->start, dso, map->type);
506 if (map == NULL) { 567 if (curr_map == NULL) {
507 dso__delete(dso); 568 dso__delete(dso);
508 return -1; 569 return -1;
509 } 570 }
510 571
511 curr_map->map_ip = curr_map->unmap_ip = identity__map_ip; 572 curr_map->map_ip = curr_map->unmap_ip = identity__map_ip;
512 map_groups__insert(&session->kmaps, curr_map); 573 map_groups__insert(kmaps, curr_map);
513 ++kernel_range; 574 ++kernel_range;
514 } 575 }
515 576
@@ -525,20 +586,28 @@ discard_symbol: rb_erase(&pos->rb_node, root);
525 } 586 }
526 } 587 }
527 588
589 if (curr_map != map &&
590 self->kernel == DSO_TYPE_GUEST_KERNEL &&
591 machine__is_default_guest(kmaps->machine)) {
592 dso__set_loaded(curr_map->dso, curr_map->type);
593 }
594
528 return count; 595 return count;
529} 596}
530 597
531 598int dso__load_kallsyms(struct dso *self, const char *filename,
532static int dso__load_kallsyms(struct dso *self, struct map *map, 599 struct map *map, symbol_filter_t filter)
533 struct perf_session *session, symbol_filter_t filter)
534{ 600{
535 if (dso__load_all_kallsyms(self, map) < 0) 601 if (dso__load_all_kallsyms(self, filename, map) < 0)
536 return -1; 602 return -1;
537 603
538 symbols__fixup_end(&self->symbols[map->type]); 604 symbols__fixup_end(&self->symbols[map->type]);
539 self->origin = DSO__ORIG_KERNEL; 605 if (self->kernel == DSO_TYPE_GUEST_KERNEL)
606 self->origin = DSO__ORIG_GUEST_KERNEL;
607 else
608 self->origin = DSO__ORIG_KERNEL;
540 609
541 return dso__split_kallsyms(self, map, session, filter); 610 return dso__split_kallsyms(self, map, filter);
542} 611}
543 612
544static int dso__load_perf_map(struct dso *self, struct map *map, 613static int dso__load_perf_map(struct dso *self, struct map *map,
@@ -835,8 +904,8 @@ out_close:
835 if (err == 0) 904 if (err == 0)
836 return nr; 905 return nr;
837out: 906out:
838 pr_warning("%s: problems reading %s PLT info.\n", 907 pr_debug("%s: problems reading %s PLT info.\n",
839 __func__, self->long_name); 908 __func__, self->long_name);
840 return 0; 909 return 0;
841} 910}
842 911
@@ -864,13 +933,12 @@ static bool elf_sec__is_a(GElf_Shdr *self, Elf_Data *secstrs, enum map_type type
864 } 933 }
865} 934}
866 935
867static int dso__load_sym(struct dso *self, struct map *map, 936static int dso__load_sym(struct dso *self, struct map *map, const char *name,
868 struct perf_session *session, const char *name, int fd, 937 int fd, symbol_filter_t filter, int kmodule)
869 symbol_filter_t filter, int kernel, int kmodule)
870{ 938{
939 struct kmap *kmap = self->kernel ? map__kmap(map) : NULL;
871 struct map *curr_map = map; 940 struct map *curr_map = map;
872 struct dso *curr_dso = self; 941 struct dso *curr_dso = self;
873 size_t dso_name_len = strlen(self->short_name);
874 Elf_Data *symstrs, *secstrs; 942 Elf_Data *symstrs, *secstrs;
875 uint32_t nr_syms; 943 uint32_t nr_syms;
876 int err = -1; 944 int err = -1;
@@ -924,7 +992,7 @@ static int dso__load_sym(struct dso *self, struct map *map,
924 nr_syms = shdr.sh_size / shdr.sh_entsize; 992 nr_syms = shdr.sh_size / shdr.sh_entsize;
925 993
926 memset(&sym, 0, sizeof(sym)); 994 memset(&sym, 0, sizeof(sym));
927 if (!kernel) { 995 if (self->kernel == DSO_TYPE_USER) {
928 self->adjust_symbols = (ehdr.e_type == ET_EXEC || 996 self->adjust_symbols = (ehdr.e_type == ET_EXEC ||
929 elf_section_by_name(elf, &ehdr, &shdr, 997 elf_section_by_name(elf, &ehdr, &shdr,
930 ".gnu.prelink_undo", 998 ".gnu.prelink_undo",
@@ -933,11 +1001,15 @@ static int dso__load_sym(struct dso *self, struct map *map,
933 1001
934 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) { 1002 elf_symtab__for_each_symbol(syms, nr_syms, idx, sym) {
935 struct symbol *f; 1003 struct symbol *f;
936 const char *elf_name; 1004 const char *elf_name = elf_sym__name(&sym, symstrs);
937 char *demangled = NULL; 1005 char *demangled = NULL;
938 int is_label = elf_sym__is_label(&sym); 1006 int is_label = elf_sym__is_label(&sym);
939 const char *section_name; 1007 const char *section_name;
940 1008
1009 if (kmap && kmap->ref_reloc_sym && kmap->ref_reloc_sym->name &&
1010 strcmp(elf_name, kmap->ref_reloc_sym->name) == 0)
1011 kmap->ref_reloc_sym->unrelocated_addr = sym.st_value;
1012
941 if (!is_label && !elf_sym__is_a(&sym, map->type)) 1013 if (!is_label && !elf_sym__is_a(&sym, map->type))
942 continue; 1014 continue;
943 1015
@@ -950,14 +1022,14 @@ static int dso__load_sym(struct dso *self, struct map *map,
950 if (is_label && !elf_sec__is_a(&shdr, secstrs, map->type)) 1022 if (is_label && !elf_sec__is_a(&shdr, secstrs, map->type))
951 continue; 1023 continue;
952 1024
953 elf_name = elf_sym__name(&sym, symstrs);
954 section_name = elf_sec__name(&shdr, secstrs); 1025 section_name = elf_sec__name(&shdr, secstrs);
955 1026
956 if (kernel || kmodule) { 1027 if (self->kernel != DSO_TYPE_USER || kmodule) {
957 char dso_name[PATH_MAX]; 1028 char dso_name[PATH_MAX];
958 1029
959 if (strcmp(section_name, 1030 if (strcmp(section_name,
960 curr_dso->short_name + dso_name_len) == 0) 1031 (curr_dso->short_name +
1032 self->short_name_len)) == 0)
961 goto new_symbol; 1033 goto new_symbol;
962 1034
963 if (strcmp(section_name, ".text") == 0) { 1035 if (strcmp(section_name, ".text") == 0) {
@@ -969,7 +1041,7 @@ static int dso__load_sym(struct dso *self, struct map *map,
969 snprintf(dso_name, sizeof(dso_name), 1041 snprintf(dso_name, sizeof(dso_name),
970 "%s%s", self->short_name, section_name); 1042 "%s%s", self->short_name, section_name);
971 1043
972 curr_map = map_groups__find_by_name(&session->kmaps, map->type, dso_name); 1044 curr_map = map_groups__find_by_name(kmap->kmaps, map->type, dso_name);
973 if (curr_map == NULL) { 1045 if (curr_map == NULL) {
974 u64 start = sym.st_value; 1046 u64 start = sym.st_value;
975 1047
@@ -979,17 +1051,19 @@ static int dso__load_sym(struct dso *self, struct map *map,
979 curr_dso = dso__new(dso_name); 1051 curr_dso = dso__new(dso_name);
980 if (curr_dso == NULL) 1052 if (curr_dso == NULL)
981 goto out_elf_end; 1053 goto out_elf_end;
1054 curr_dso->kernel = self->kernel;
982 curr_map = map__new2(start, curr_dso, 1055 curr_map = map__new2(start, curr_dso,
983 MAP__FUNCTION); 1056 map->type);
984 if (curr_map == NULL) { 1057 if (curr_map == NULL) {
985 dso__delete(curr_dso); 1058 dso__delete(curr_dso);
986 goto out_elf_end; 1059 goto out_elf_end;
987 } 1060 }
988 curr_map->map_ip = identity__map_ip; 1061 curr_map->map_ip = identity__map_ip;
989 curr_map->unmap_ip = identity__map_ip; 1062 curr_map->unmap_ip = identity__map_ip;
990 curr_dso->origin = DSO__ORIG_KERNEL; 1063 curr_dso->origin = self->origin;
991 map_groups__insert(&session->kmaps, curr_map); 1064 map_groups__insert(kmap->kmaps, curr_map);
992 dsos__add(&dsos__kernel, curr_dso); 1065 dsos__add(&self->node, curr_dso);
1066 dso__set_loaded(curr_dso, map->type);
993 } else 1067 } else
994 curr_dso = curr_map->dso; 1068 curr_dso = curr_map->dso;
995 1069
@@ -997,9 +1071,10 @@ static int dso__load_sym(struct dso *self, struct map *map,
997 } 1071 }
998 1072
999 if (curr_dso->adjust_symbols) { 1073 if (curr_dso->adjust_symbols) {
1000 pr_debug2("adjusting symbol: st_value: %Lx sh_addr: " 1074 pr_debug4("%s: adjusting symbol: st_value: %#Lx "
1001 "%Lx sh_offset: %Lx\n", (u64)sym.st_value, 1075 "sh_addr: %#Lx sh_offset: %#Lx\n", __func__,
1002 (u64)shdr.sh_addr, (u64)shdr.sh_offset); 1076 (u64)sym.st_value, (u64)shdr.sh_addr,
1077 (u64)shdr.sh_offset);
1003 sym.st_value -= shdr.sh_addr - shdr.sh_offset; 1078 sym.st_value -= shdr.sh_addr - shdr.sh_offset;
1004 } 1079 }
1005 /* 1080 /*
@@ -1027,8 +1102,16 @@ new_symbol:
1027 /* 1102 /*
1028 * For misannotated, zeroed, ASM function sizes. 1103 * For misannotated, zeroed, ASM function sizes.
1029 */ 1104 */
1030 if (nr > 0) 1105 if (nr > 0) {
1031 symbols__fixup_end(&self->symbols[map->type]); 1106 symbols__fixup_end(&self->symbols[map->type]);
1107 if (kmap) {
1108 /*
1109 * We need to fixup this here too because we create new
1110 * maps here, for things like vsyscall sections.
1111 */
1112 __map_groups__fixup_end(kmap->kmaps, map->type);
1113 }
1114 }
1032 err = nr; 1115 err = nr;
1033out_elf_end: 1116out_elf_end:
1034 elf_end(elf); 1117 elf_end(elf);
@@ -1041,28 +1124,28 @@ static bool dso__build_id_equal(const struct dso *self, u8 *build_id)
1041 return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0; 1124 return memcmp(self->build_id, build_id, sizeof(self->build_id)) == 0;
1042} 1125}
1043 1126
1044static bool __dsos__read_build_ids(struct list_head *head) 1127bool __dsos__read_build_ids(struct list_head *head, bool with_hits)
1045{ 1128{
1046 bool have_build_id = false; 1129 bool have_build_id = false;
1047 struct dso *pos; 1130 struct dso *pos;
1048 1131
1049 list_for_each_entry(pos, head, node) 1132 list_for_each_entry(pos, head, node) {
1133 if (with_hits && !pos->hit)
1134 continue;
1135 if (pos->has_build_id) {
1136 have_build_id = true;
1137 continue;
1138 }
1050 if (filename__read_build_id(pos->long_name, pos->build_id, 1139 if (filename__read_build_id(pos->long_name, pos->build_id,
1051 sizeof(pos->build_id)) > 0) { 1140 sizeof(pos->build_id)) > 0) {
1052 have_build_id = true; 1141 have_build_id = true;
1053 pos->has_build_id = true; 1142 pos->has_build_id = true;
1054 } 1143 }
1144 }
1055 1145
1056 return have_build_id; 1146 return have_build_id;
1057} 1147}
1058 1148
1059bool dsos__read_build_ids(void)
1060{
1061 bool kbuildids = __dsos__read_build_ids(&dsos__kernel),
1062 ubuildids = __dsos__read_build_ids(&dsos__user);
1063 return kbuildids || ubuildids;
1064}
1065
1066/* 1149/*
1067 * Align offset to 4 bytes as needed for note name and descriptor data. 1150 * Align offset to 4 bytes as needed for note name and descriptor data.
1068 */ 1151 */
@@ -1191,11 +1274,14 @@ char dso__symtab_origin(const struct dso *self)
1191 static const char origin[] = { 1274 static const char origin[] = {
1192 [DSO__ORIG_KERNEL] = 'k', 1275 [DSO__ORIG_KERNEL] = 'k',
1193 [DSO__ORIG_JAVA_JIT] = 'j', 1276 [DSO__ORIG_JAVA_JIT] = 'j',
1277 [DSO__ORIG_BUILD_ID_CACHE] = 'B',
1194 [DSO__ORIG_FEDORA] = 'f', 1278 [DSO__ORIG_FEDORA] = 'f',
1195 [DSO__ORIG_UBUNTU] = 'u', 1279 [DSO__ORIG_UBUNTU] = 'u',
1196 [DSO__ORIG_BUILDID] = 'b', 1280 [DSO__ORIG_BUILDID] = 'b',
1197 [DSO__ORIG_DSO] = 'd', 1281 [DSO__ORIG_DSO] = 'd',
1198 [DSO__ORIG_KMODULE] = 'K', 1282 [DSO__ORIG_KMODULE] = 'K',
1283 [DSO__ORIG_GUEST_KERNEL] = 'g',
1284 [DSO__ORIG_GUEST_KMODULE] = 'G',
1199 }; 1285 };
1200 1286
1201 if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND) 1287 if (self == NULL || self->origin == DSO__ORIG_NOT_FOUND)
@@ -1203,19 +1289,27 @@ char dso__symtab_origin(const struct dso *self)
1203 return origin[self->origin]; 1289 return origin[self->origin];
1204} 1290}
1205 1291
1206int dso__load(struct dso *self, struct map *map, struct perf_session *session, 1292int dso__load(struct dso *self, struct map *map, symbol_filter_t filter)
1207 symbol_filter_t filter)
1208{ 1293{
1209 int size = PATH_MAX; 1294 int size = PATH_MAX;
1210 char *name; 1295 char *name;
1211 u8 build_id[BUILD_ID_SIZE]; 1296 u8 build_id[BUILD_ID_SIZE];
1212 int ret = -1; 1297 int ret = -1;
1213 int fd; 1298 int fd;
1299 struct machine *machine;
1300 const char *root_dir;
1214 1301
1215 dso__set_loaded(self, map->type); 1302 dso__set_loaded(self, map->type);
1216 1303
1217 if (self->kernel) 1304 if (self->kernel == DSO_TYPE_KERNEL)
1218 return dso__load_kernel_sym(self, map, session, filter); 1305 return dso__load_kernel_sym(self, map, filter);
1306 else if (self->kernel == DSO_TYPE_GUEST_KERNEL)
1307 return dso__load_guest_kernel_sym(self, map, filter);
1308
1309 if (map->groups && map->groups->machine)
1310 machine = map->groups->machine;
1311 else
1312 machine = NULL;
1219 1313
1220 name = malloc(size); 1314 name = malloc(size);
1221 if (!name) 1315 if (!name)
@@ -1230,8 +1324,9 @@ int dso__load(struct dso *self, struct map *map, struct perf_session *session,
1230 return ret; 1324 return ret;
1231 } 1325 }
1232 1326
1233 self->origin = DSO__ORIG_FEDORA - 1; 1327 self->origin = DSO__ORIG_BUILD_ID_CACHE;
1234 1328 if (dso__build_id_filename(self, name, size) != NULL)
1329 goto open_file;
1235more: 1330more:
1236 do { 1331 do {
1237 self->origin++; 1332 self->origin++;
@@ -1248,7 +1343,6 @@ more:
1248 if (filename__read_build_id(self->long_name, build_id, 1343 if (filename__read_build_id(self->long_name, build_id,
1249 sizeof(build_id))) { 1344 sizeof(build_id))) {
1250 char build_id_hex[BUILD_ID_SIZE * 2 + 1]; 1345 char build_id_hex[BUILD_ID_SIZE * 2 + 1];
1251
1252 build_id__sprintf(build_id, sizeof(build_id), 1346 build_id__sprintf(build_id, sizeof(build_id),
1253 build_id_hex); 1347 build_id_hex);
1254 snprintf(name, size, 1348 snprintf(name, size,
@@ -1263,6 +1357,13 @@ more:
1263 case DSO__ORIG_DSO: 1357 case DSO__ORIG_DSO:
1264 snprintf(name, size, "%s", self->long_name); 1358 snprintf(name, size, "%s", self->long_name);
1265 break; 1359 break;
1360 case DSO__ORIG_GUEST_KMODULE:
1361 if (map->groups && map->groups->machine)
1362 root_dir = map->groups->machine->root_dir;
1363 else
1364 root_dir = "";
1365 snprintf(name, size, "%s%s", root_dir, self->long_name);
1366 break;
1266 1367
1267 default: 1368 default:
1268 goto out; 1369 goto out;
@@ -1276,11 +1377,11 @@ compare_build_id:
1276 if (!dso__build_id_equal(self, build_id)) 1377 if (!dso__build_id_equal(self, build_id))
1277 goto more; 1378 goto more;
1278 } 1379 }
1279 1380open_file:
1280 fd = open(name, O_RDONLY); 1381 fd = open(name, O_RDONLY);
1281 } while (fd < 0); 1382 } while (fd < 0);
1282 1383
1283 ret = dso__load_sym(self, map, NULL, name, fd, filter, 0, 0); 1384 ret = dso__load_sym(self, map, name, fd, filter, 0);
1284 close(fd); 1385 close(fd);
1285 1386
1286 /* 1387 /*
@@ -1309,35 +1410,65 @@ struct map *map_groups__find_by_name(struct map_groups *self,
1309 for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) { 1410 for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) {
1310 struct map *map = rb_entry(nd, struct map, rb_node); 1411 struct map *map = rb_entry(nd, struct map, rb_node);
1311 1412
1312 if (map->dso && strcmp(map->dso->name, name) == 0) 1413 if (map->dso && strcmp(map->dso->short_name, name) == 0)
1313 return map; 1414 return map;
1314 } 1415 }
1315 1416
1316 return NULL; 1417 return NULL;
1317} 1418}
1318 1419
1319static int perf_session__set_modules_path_dir(struct perf_session *self, char *dirname) 1420static int dso__kernel_module_get_build_id(struct dso *self,
1421 const char *root_dir)
1422{
1423 char filename[PATH_MAX];
1424 /*
1425 * kernel module short names are of the form "[module]" and
1426 * we need just "module" here.
1427 */
1428 const char *name = self->short_name + 1;
1429
1430 snprintf(filename, sizeof(filename),
1431 "%s/sys/module/%.*s/notes/.note.gnu.build-id",
1432 root_dir, (int)strlen(name) - 1, name);
1433
1434 if (sysfs__read_build_id(filename, self->build_id,
1435 sizeof(self->build_id)) == 0)
1436 self->has_build_id = true;
1437
1438 return 0;
1439}
1440
1441static int map_groups__set_modules_path_dir(struct map_groups *self,
1442 const char *dir_name)
1320{ 1443{
1321 struct dirent *dent; 1444 struct dirent *dent;
1322 DIR *dir = opendir(dirname); 1445 DIR *dir = opendir(dir_name);
1446 int ret = 0;
1323 1447
1324 if (!dir) { 1448 if (!dir) {
1325 pr_debug("%s: cannot open %s dir\n", __func__, dirname); 1449 pr_debug("%s: cannot open %s dir\n", __func__, dir_name);
1326 return -1; 1450 return -1;
1327 } 1451 }
1328 1452
1329 while ((dent = readdir(dir)) != NULL) { 1453 while ((dent = readdir(dir)) != NULL) {
1330 char path[PATH_MAX]; 1454 char path[PATH_MAX];
1455 struct stat st;
1456
1457 /*sshfs might return bad dent->d_type, so we have to stat*/
1458 sprintf(path, "%s/%s", dir_name, dent->d_name);
1459 if (stat(path, &st))
1460 continue;
1331 1461
1332 if (dent->d_type == DT_DIR) { 1462 if (S_ISDIR(st.st_mode)) {
1333 if (!strcmp(dent->d_name, ".") || 1463 if (!strcmp(dent->d_name, ".") ||
1334 !strcmp(dent->d_name, "..")) 1464 !strcmp(dent->d_name, ".."))
1335 continue; 1465 continue;
1336 1466
1337 snprintf(path, sizeof(path), "%s/%s", 1467 snprintf(path, sizeof(path), "%s/%s",
1338 dirname, dent->d_name); 1468 dir_name, dent->d_name);
1339 if (perf_session__set_modules_path_dir(self, path) < 0) 1469 ret = map_groups__set_modules_path_dir(self, path);
1340 goto failure; 1470 if (ret < 0)
1471 goto out;
1341 } else { 1472 } else {
1342 char *dot = strrchr(dent->d_name, '.'), 1473 char *dot = strrchr(dent->d_name, '.'),
1343 dso_name[PATH_MAX]; 1474 dso_name[PATH_MAX];
@@ -1350,38 +1481,69 @@ static int perf_session__set_modules_path_dir(struct perf_session *self, char *d
1350 (int)(dot - dent->d_name), dent->d_name); 1481 (int)(dot - dent->d_name), dent->d_name);
1351 1482
1352 strxfrchar(dso_name, '-', '_'); 1483 strxfrchar(dso_name, '-', '_');
1353 map = map_groups__find_by_name(&self->kmaps, MAP__FUNCTION, dso_name); 1484 map = map_groups__find_by_name(self, MAP__FUNCTION, dso_name);
1354 if (map == NULL) 1485 if (map == NULL)
1355 continue; 1486 continue;
1356 1487
1357 snprintf(path, sizeof(path), "%s/%s", 1488 snprintf(path, sizeof(path), "%s/%s",
1358 dirname, dent->d_name); 1489 dir_name, dent->d_name);
1359 1490
1360 long_name = strdup(path); 1491 long_name = strdup(path);
1361 if (long_name == NULL) 1492 if (long_name == NULL) {
1362 goto failure; 1493 ret = -1;
1494 goto out;
1495 }
1363 dso__set_long_name(map->dso, long_name); 1496 dso__set_long_name(map->dso, long_name);
1497 dso__kernel_module_get_build_id(map->dso, "");
1364 } 1498 }
1365 } 1499 }
1366 1500
1367 return 0; 1501out:
1368failure:
1369 closedir(dir); 1502 closedir(dir);
1370 return -1; 1503 return ret;
1371} 1504}
1372 1505
1373static int perf_session__set_modules_path(struct perf_session *self) 1506static char *get_kernel_version(const char *root_dir)
1374{ 1507{
1375 struct utsname uts; 1508 char version[PATH_MAX];
1509 FILE *file;
1510 char *name, *tmp;
1511 const char *prefix = "Linux version ";
1512
1513 sprintf(version, "%s/proc/version", root_dir);
1514 file = fopen(version, "r");
1515 if (!file)
1516 return NULL;
1517
1518 version[0] = '\0';
1519 tmp = fgets(version, sizeof(version), file);
1520 fclose(file);
1521
1522 name = strstr(version, prefix);
1523 if (!name)
1524 return NULL;
1525 name += strlen(prefix);
1526 tmp = strchr(name, ' ');
1527 if (tmp)
1528 *tmp = '\0';
1529
1530 return strdup(name);
1531}
1532
1533static int machine__set_modules_path(struct machine *self)
1534{
1535 char *version;
1376 char modules_path[PATH_MAX]; 1536 char modules_path[PATH_MAX];
1377 1537
1378 if (uname(&uts) < 0) 1538 version = get_kernel_version(self->root_dir);
1539 if (!version)
1379 return -1; 1540 return -1;
1380 1541
1381 snprintf(modules_path, sizeof(modules_path), "/lib/modules/%s/kernel", 1542 snprintf(modules_path, sizeof(modules_path), "%s/lib/modules/%s/kernel",
1382 uts.release); 1543 self->root_dir, version);
1544 free(version);
1383 1545
1384 return perf_session__set_modules_path_dir(self, modules_path); 1546 return map_groups__set_modules_path_dir(&self->kmaps, modules_path);
1385} 1547}
1386 1548
1387/* 1549/*
@@ -1391,8 +1553,8 @@ static int perf_session__set_modules_path(struct perf_session *self)
1391 */ 1553 */
1392static struct map *map__new2(u64 start, struct dso *dso, enum map_type type) 1554static struct map *map__new2(u64 start, struct dso *dso, enum map_type type)
1393{ 1555{
1394 struct map *self = malloc(sizeof(*self)); 1556 struct map *self = calloc(1, (sizeof(*self) +
1395 1557 (dso->kernel ? sizeof(struct kmap) : 0)));
1396 if (self != NULL) { 1558 if (self != NULL) {
1397 /* 1559 /*
1398 * ->end will be filled after we load all the symbols 1560 * ->end will be filled after we load all the symbols
@@ -1403,20 +1565,50 @@ static struct map *map__new2(u64 start, struct dso *dso, enum map_type type)
1403 return self; 1565 return self;
1404} 1566}
1405 1567
1406static int perf_session__create_module_maps(struct perf_session *self) 1568struct map *machine__new_module(struct machine *self, u64 start,
1569 const char *filename)
1570{
1571 struct map *map;
1572 struct dso *dso = __dsos__findnew(&self->kernel_dsos, filename);
1573
1574 if (dso == NULL)
1575 return NULL;
1576
1577 map = map__new2(start, dso, MAP__FUNCTION);
1578 if (map == NULL)
1579 return NULL;
1580
1581 if (machine__is_host(self))
1582 dso->origin = DSO__ORIG_KMODULE;
1583 else
1584 dso->origin = DSO__ORIG_GUEST_KMODULE;
1585 map_groups__insert(&self->kmaps, map);
1586 return map;
1587}
1588
1589static int machine__create_modules(struct machine *self)
1407{ 1590{
1408 char *line = NULL; 1591 char *line = NULL;
1409 size_t n; 1592 size_t n;
1410 FILE *file = fopen("/proc/modules", "r"); 1593 FILE *file;
1411 struct map *map; 1594 struct map *map;
1595 const char *modules;
1596 char path[PATH_MAX];
1597
1598 if (machine__is_default_guest(self))
1599 modules = symbol_conf.default_guest_modules;
1600 else {
1601 sprintf(path, "%s/proc/modules", self->root_dir);
1602 modules = path;
1603 }
1412 1604
1605 file = fopen(modules, "r");
1413 if (file == NULL) 1606 if (file == NULL)
1414 return -1; 1607 return -1;
1415 1608
1416 while (!feof(file)) { 1609 while (!feof(file)) {
1417 char name[PATH_MAX]; 1610 char name[PATH_MAX];
1418 u64 start; 1611 u64 start;
1419 struct dso *dso;
1420 char *sep; 1612 char *sep;
1421 int line_len; 1613 int line_len;
1422 1614
@@ -1442,32 +1634,16 @@ static int perf_session__create_module_maps(struct perf_session *self)
1442 *sep = '\0'; 1634 *sep = '\0';
1443 1635
1444 snprintf(name, sizeof(name), "[%s]", line); 1636 snprintf(name, sizeof(name), "[%s]", line);
1445 dso = dso__new(name); 1637 map = machine__new_module(self, start, name);
1446 1638 if (map == NULL)
1447 if (dso == NULL)
1448 goto out_delete_line;
1449
1450 map = map__new2(start, dso, MAP__FUNCTION);
1451 if (map == NULL) {
1452 dso__delete(dso);
1453 goto out_delete_line; 1639 goto out_delete_line;
1454 } 1640 dso__kernel_module_get_build_id(map->dso, self->root_dir);
1455
1456 snprintf(name, sizeof(name),
1457 "/sys/module/%s/notes/.note.gnu.build-id", line);
1458 if (sysfs__read_build_id(name, dso->build_id,
1459 sizeof(dso->build_id)) == 0)
1460 dso->has_build_id = true;
1461
1462 dso->origin = DSO__ORIG_KMODULE;
1463 map_groups__insert(&self->kmaps, map);
1464 dsos__add(&dsos__kernel, dso);
1465 } 1641 }
1466 1642
1467 free(line); 1643 free(line);
1468 fclose(file); 1644 fclose(file);
1469 1645
1470 return perf_session__set_modules_path(self); 1646 return machine__set_modules_path(self);
1471 1647
1472out_delete_line: 1648out_delete_line:
1473 free(line); 1649 free(line);
@@ -1476,7 +1652,6 @@ out_failure:
1476} 1652}
1477 1653
1478static int dso__load_vmlinux(struct dso *self, struct map *map, 1654static int dso__load_vmlinux(struct dso *self, struct map *map,
1479 struct perf_session *session,
1480 const char *vmlinux, symbol_filter_t filter) 1655 const char *vmlinux, symbol_filter_t filter)
1481{ 1656{
1482 int err = -1, fd; 1657 int err = -1, fd;
@@ -1510,51 +1685,139 @@ static int dso__load_vmlinux(struct dso *self, struct map *map,
1510 return -1; 1685 return -1;
1511 1686
1512 dso__set_loaded(self, map->type); 1687 dso__set_loaded(self, map->type);
1513 err = dso__load_sym(self, map, session, self->long_name, fd, filter, 1, 0); 1688 err = dso__load_sym(self, map, vmlinux, fd, filter, 0);
1514 close(fd); 1689 close(fd);
1515 1690
1691 if (err > 0)
1692 pr_debug("Using %s for symbols\n", vmlinux);
1693
1694 return err;
1695}
1696
1697int dso__load_vmlinux_path(struct dso *self, struct map *map,
1698 symbol_filter_t filter)
1699{
1700 int i, err = 0;
1701 char *filename;
1702
1703 pr_debug("Looking at the vmlinux_path (%d entries long)\n",
1704 vmlinux_path__nr_entries + 1);
1705
1706 filename = dso__build_id_filename(self, NULL, 0);
1707 if (filename != NULL) {
1708 err = dso__load_vmlinux(self, map, filename, filter);
1709 if (err > 0) {
1710 dso__set_long_name(self, filename);
1711 goto out;
1712 }
1713 free(filename);
1714 }
1715
1716 for (i = 0; i < vmlinux_path__nr_entries; ++i) {
1717 err = dso__load_vmlinux(self, map, vmlinux_path[i], filter);
1718 if (err > 0) {
1719 dso__set_long_name(self, strdup(vmlinux_path[i]));
1720 break;
1721 }
1722 }
1723out:
1516 return err; 1724 return err;
1517} 1725}
1518 1726
1519static int dso__load_kernel_sym(struct dso *self, struct map *map, 1727static int dso__load_kernel_sym(struct dso *self, struct map *map,
1520 struct perf_session *session, symbol_filter_t filter) 1728 symbol_filter_t filter)
1521{ 1729{
1522 int err; 1730 int err;
1523 bool is_kallsyms; 1731 const char *kallsyms_filename = NULL;
1732 char *kallsyms_allocated_filename = NULL;
1733 /*
1734 * Step 1: if the user specified a vmlinux filename, use it and only
1735 * it, reporting errors to the user if it cannot be used.
1736 *
1737 * For instance, try to analyse an ARM perf.data file _without_ a
1738 * build-id, or if the user specifies the wrong path to the right
1739 * vmlinux file, obviously we can't fallback to another vmlinux (a
1740 * x86_86 one, on the machine where analysis is being performed, say),
1741 * or worse, /proc/kallsyms.
1742 *
1743 * If the specified file _has_ a build-id and there is a build-id
1744 * section in the perf.data file, we will still do the expected
1745 * validation in dso__load_vmlinux and will bail out if they don't
1746 * match.
1747 */
1748 if (symbol_conf.vmlinux_name != NULL) {
1749 err = dso__load_vmlinux(self, map,
1750 symbol_conf.vmlinux_name, filter);
1751 if (err > 0) {
1752 dso__set_long_name(self,
1753 strdup(symbol_conf.vmlinux_name));
1754 goto out_fixup;
1755 }
1756 return err;
1757 }
1524 1758
1525 if (vmlinux_path != NULL) { 1759 if (vmlinux_path != NULL) {
1526 int i; 1760 err = dso__load_vmlinux_path(self, map, filter);
1527 pr_debug("Looking at the vmlinux_path (%d entries long)\n", 1761 if (err > 0)
1528 vmlinux_path__nr_entries); 1762 goto out_fixup;
1529 for (i = 0; i < vmlinux_path__nr_entries; ++i) { 1763 }
1530 err = dso__load_vmlinux(self, map, session, 1764
1531 vmlinux_path[i], filter); 1765 /*
1532 if (err > 0) { 1766 * Say the kernel DSO was created when processing the build-id header table,
1533 pr_debug("Using %s for symbols\n", 1767 * we have a build-id, so check if it is the same as the running kernel,
1534 vmlinux_path[i]); 1768 * using it if it is.
1535 dso__set_long_name(self, 1769 */
1536 strdup(vmlinux_path[i])); 1770 if (self->has_build_id) {
1537 goto out_fixup; 1771 u8 kallsyms_build_id[BUILD_ID_SIZE];
1772 char sbuild_id[BUILD_ID_SIZE * 2 + 1];
1773
1774 if (sysfs__read_build_id("/sys/kernel/notes", kallsyms_build_id,
1775 sizeof(kallsyms_build_id)) == 0) {
1776 if (dso__build_id_equal(self, kallsyms_build_id)) {
1777 kallsyms_filename = "/proc/kallsyms";
1778 goto do_kallsyms;
1538 } 1779 }
1539 } 1780 }
1540 } 1781 /*
1782 * Now look if we have it on the build-id cache in
1783 * $HOME/.debug/[kernel.kallsyms].
1784 */
1785 build_id__sprintf(self->build_id, sizeof(self->build_id),
1786 sbuild_id);
1541 1787
1542 is_kallsyms = self->long_name[0] == '['; 1788 if (asprintf(&kallsyms_allocated_filename,
1543 if (is_kallsyms) 1789 "%s/.debug/[kernel.kallsyms]/%s",
1544 goto do_kallsyms; 1790 getenv("HOME"), sbuild_id) == -1) {
1791 pr_err("Not enough memory for kallsyms file lookup\n");
1792 return -1;
1793 }
1545 1794
1546 err = dso__load_vmlinux(self, map, session, self->long_name, filter); 1795 kallsyms_filename = kallsyms_allocated_filename;
1547 if (err <= 0) { 1796
1548 pr_info("The file %s cannot be used, " 1797 if (access(kallsyms_filename, F_OK)) {
1549 "trying to use /proc/kallsyms...", self->long_name); 1798 pr_err("No kallsyms or vmlinux with build-id %s "
1550do_kallsyms: 1799 "was found\n", sbuild_id);
1551 err = dso__load_kallsyms(self, map, session, filter); 1800 free(kallsyms_allocated_filename);
1552 if (err > 0 && !is_kallsyms) 1801 return -1;
1553 dso__set_long_name(self, strdup("[kernel.kallsyms]")); 1802 }
1803 } else {
1804 /*
1805 * Last resort, if we don't have a build-id and couldn't find
1806 * any vmlinux file, try the running kernel kallsyms table.
1807 */
1808 kallsyms_filename = "/proc/kallsyms";
1554 } 1809 }
1555 1810
1811do_kallsyms:
1812 err = dso__load_kallsyms(self, kallsyms_filename, map, filter);
1813 if (err > 0)
1814 pr_debug("Using %s for symbols\n", kallsyms_filename);
1815 free(kallsyms_allocated_filename);
1816
1556 if (err > 0) { 1817 if (err > 0) {
1557out_fixup: 1818out_fixup:
1819 if (kallsyms_filename != NULL)
1820 dso__set_long_name(self, strdup("[kernel.kallsyms]"));
1558 map__fixup_start(map); 1821 map__fixup_start(map);
1559 map__fixup_end(map); 1822 map__fixup_end(map);
1560 } 1823 }
@@ -1562,9 +1825,56 @@ out_fixup:
1562 return err; 1825 return err;
1563} 1826}
1564 1827
1565LIST_HEAD(dsos__user); 1828static int dso__load_guest_kernel_sym(struct dso *self, struct map *map,
1566LIST_HEAD(dsos__kernel); 1829 symbol_filter_t filter)
1567struct dso *vdso; 1830{
1831 int err;
1832 const char *kallsyms_filename = NULL;
1833 struct machine *machine;
1834 char path[PATH_MAX];
1835
1836 if (!map->groups) {
1837 pr_debug("Guest kernel map hasn't the point to groups\n");
1838 return -1;
1839 }
1840 machine = map->groups->machine;
1841
1842 if (machine__is_default_guest(machine)) {
1843 /*
1844 * if the user specified a vmlinux filename, use it and only
1845 * it, reporting errors to the user if it cannot be used.
1846 * Or use file guest_kallsyms inputted by user on commandline
1847 */
1848 if (symbol_conf.default_guest_vmlinux_name != NULL) {
1849 err = dso__load_vmlinux(self, map,
1850 symbol_conf.default_guest_vmlinux_name, filter);
1851 goto out_try_fixup;
1852 }
1853
1854 kallsyms_filename = symbol_conf.default_guest_kallsyms;
1855 if (!kallsyms_filename)
1856 return -1;
1857 } else {
1858 sprintf(path, "%s/proc/kallsyms", machine->root_dir);
1859 kallsyms_filename = path;
1860 }
1861
1862 err = dso__load_kallsyms(self, kallsyms_filename, map, filter);
1863 if (err > 0)
1864 pr_debug("Using %s for symbols\n", kallsyms_filename);
1865
1866out_try_fixup:
1867 if (err > 0) {
1868 if (kallsyms_filename != NULL) {
1869 machine__mmap_name(machine, path, sizeof(path));
1870 dso__set_long_name(self, strdup(path));
1871 }
1872 map__fixup_start(map);
1873 map__fixup_end(map);
1874 }
1875
1876 return err;
1877}
1568 1878
1569static void dsos__add(struct list_head *head, struct dso *dso) 1879static void dsos__add(struct list_head *head, struct dso *dso)
1570{ 1880{
@@ -1576,19 +1886,19 @@ static struct dso *dsos__find(struct list_head *head, const char *name)
1576 struct dso *pos; 1886 struct dso *pos;
1577 1887
1578 list_for_each_entry(pos, head, node) 1888 list_for_each_entry(pos, head, node)
1579 if (strcmp(pos->name, name) == 0) 1889 if (strcmp(pos->long_name, name) == 0)
1580 return pos; 1890 return pos;
1581 return NULL; 1891 return NULL;
1582} 1892}
1583 1893
1584struct dso *dsos__findnew(const char *name) 1894struct dso *__dsos__findnew(struct list_head *head, const char *name)
1585{ 1895{
1586 struct dso *dso = dsos__find(&dsos__user, name); 1896 struct dso *dso = dsos__find(head, name);
1587 1897
1588 if (!dso) { 1898 if (!dso) {
1589 dso = dso__new(name); 1899 dso = dso__new(name);
1590 if (dso != NULL) { 1900 if (dso != NULL) {
1591 dsos__add(&dsos__user, dso); 1901 dsos__add(head, dso);
1592 dso__set_basename(dso); 1902 dso__set_basename(dso);
1593 } 1903 }
1594 } 1904 }
@@ -1596,96 +1906,165 @@ struct dso *dsos__findnew(const char *name)
1596 return dso; 1906 return dso;
1597} 1907}
1598 1908
1599static void __dsos__fprintf(struct list_head *head, FILE *fp) 1909size_t __dsos__fprintf(struct list_head *head, FILE *fp)
1600{ 1910{
1601 struct dso *pos; 1911 struct dso *pos;
1912 size_t ret = 0;
1602 1913
1603 list_for_each_entry(pos, head, node) { 1914 list_for_each_entry(pos, head, node) {
1604 int i; 1915 int i;
1605 for (i = 0; i < MAP__NR_TYPES; ++i) 1916 for (i = 0; i < MAP__NR_TYPES; ++i)
1606 dso__fprintf(pos, i, fp); 1917 ret += dso__fprintf(pos, i, fp);
1607 } 1918 }
1919
1920 return ret;
1608} 1921}
1609 1922
1610void dsos__fprintf(FILE *fp) 1923size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp)
1611{ 1924{
1612 __dsos__fprintf(&dsos__kernel, fp); 1925 struct rb_node *nd;
1613 __dsos__fprintf(&dsos__user, fp); 1926 size_t ret = 0;
1927
1928 for (nd = rb_first(self); nd; nd = rb_next(nd)) {
1929 struct machine *pos = rb_entry(nd, struct machine, rb_node);
1930 ret += __dsos__fprintf(&pos->kernel_dsos, fp);
1931 ret += __dsos__fprintf(&pos->user_dsos, fp);
1932 }
1933
1934 return ret;
1614} 1935}
1615 1936
1616static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp) 1937static size_t __dsos__fprintf_buildid(struct list_head *head, FILE *fp,
1938 bool with_hits)
1617{ 1939{
1618 struct dso *pos; 1940 struct dso *pos;
1619 size_t ret = 0; 1941 size_t ret = 0;
1620 1942
1621 list_for_each_entry(pos, head, node) { 1943 list_for_each_entry(pos, head, node) {
1944 if (with_hits && !pos->hit)
1945 continue;
1622 ret += dso__fprintf_buildid(pos, fp); 1946 ret += dso__fprintf_buildid(pos, fp);
1623 ret += fprintf(fp, " %s\n", pos->long_name); 1947 ret += fprintf(fp, " %s\n", pos->long_name);
1624 } 1948 }
1625 return ret; 1949 return ret;
1626} 1950}
1627 1951
1628size_t dsos__fprintf_buildid(FILE *fp) 1952size_t machine__fprintf_dsos_buildid(struct machine *self, FILE *fp, bool with_hits)
1629{ 1953{
1630 return (__dsos__fprintf_buildid(&dsos__kernel, fp) + 1954 return __dsos__fprintf_buildid(&self->kernel_dsos, fp, with_hits) +
1631 __dsos__fprintf_buildid(&dsos__user, fp)); 1955 __dsos__fprintf_buildid(&self->user_dsos, fp, with_hits);
1632} 1956}
1633 1957
1634static struct dso *dsos__create_kernel( const char *vmlinux) 1958size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits)
1635{ 1959{
1636 struct dso *kernel = dso__new(vmlinux ?: "[kernel.kallsyms]"); 1960 struct rb_node *nd;
1961 size_t ret = 0;
1637 1962
1638 if (kernel == NULL) 1963 for (nd = rb_first(self); nd; nd = rb_next(nd)) {
1639 return NULL; 1964 struct machine *pos = rb_entry(nd, struct machine, rb_node);
1965 ret += machine__fprintf_dsos_buildid(pos, fp, with_hits);
1966 }
1967 return ret;
1968}
1640 1969
1641 kernel->short_name = "[kernel]"; 1970struct dso *dso__new_kernel(const char *name)
1642 kernel->kernel = 1; 1971{
1972 struct dso *self = dso__new(name ?: "[kernel.kallsyms]");
1643 1973
1644 vdso = dso__new("[vdso]"); 1974 if (self != NULL) {
1645 if (vdso == NULL) 1975 dso__set_short_name(self, "[kernel]");
1646 goto out_delete_kernel_dso; 1976 self->kernel = DSO_TYPE_KERNEL;
1647 dso__set_loaded(vdso, MAP__FUNCTION); 1977 }
1648 1978
1649 if (sysfs__read_build_id("/sys/kernel/notes", kernel->build_id, 1979 return self;
1650 sizeof(kernel->build_id)) == 0) 1980}
1651 kernel->has_build_id = true;
1652 1981
1653 dsos__add(&dsos__kernel, kernel); 1982static struct dso *dso__new_guest_kernel(struct machine *machine,
1654 dsos__add(&dsos__user, vdso); 1983 const char *name)
1984{
1985 char bf[PATH_MAX];
1986 struct dso *self = dso__new(name ?: machine__mmap_name(machine, bf, sizeof(bf)));
1655 1987
1656 return kernel; 1988 if (self != NULL) {
1989 dso__set_short_name(self, "[guest.kernel]");
1990 self->kernel = DSO_TYPE_GUEST_KERNEL;
1991 }
1657 1992
1658out_delete_kernel_dso: 1993 return self;
1659 dso__delete(kernel);
1660 return NULL;
1661} 1994}
1662 1995
1663static int map_groups__create_kernel_maps(struct map_groups *self, const char *vmlinux) 1996void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine)
1664{ 1997{
1665 struct map *functions, *variables; 1998 char path[PATH_MAX];
1666 struct dso *kernel = dsos__create_kernel(vmlinux);
1667 1999
1668 if (kernel == NULL) 2000 if (machine__is_default_guest(machine))
1669 return -1; 2001 return;
2002 sprintf(path, "%s/sys/kernel/notes", machine->root_dir);
2003 if (sysfs__read_build_id(path, self->build_id,
2004 sizeof(self->build_id)) == 0)
2005 self->has_build_id = true;
2006}
1670 2007
1671 functions = map__new2(0, kernel, MAP__FUNCTION); 2008static struct dso *machine__create_kernel(struct machine *self)
1672 if (functions == NULL) 2009{
1673 return -1; 2010 const char *vmlinux_name = NULL;
2011 struct dso *kernel;
1674 2012
1675 variables = map__new2(0, kernel, MAP__VARIABLE); 2013 if (machine__is_host(self)) {
1676 if (variables == NULL) { 2014 vmlinux_name = symbol_conf.vmlinux_name;
1677 map__delete(functions); 2015 kernel = dso__new_kernel(vmlinux_name);
1678 return -1; 2016 } else {
2017 if (machine__is_default_guest(self))
2018 vmlinux_name = symbol_conf.default_guest_vmlinux_name;
2019 kernel = dso__new_guest_kernel(self, vmlinux_name);
1679 } 2020 }
1680 2021
1681 functions->map_ip = functions->unmap_ip = 2022 if (kernel != NULL) {
1682 variables->map_ip = variables->unmap_ip = identity__map_ip; 2023 dso__read_running_kernel_build_id(kernel, self);
1683 map_groups__insert(self, functions); 2024 dsos__add(&self->kernel_dsos, kernel);
1684 map_groups__insert(self, variables); 2025 }
2026 return kernel;
2027}
2028
2029int __machine__create_kernel_maps(struct machine *self, struct dso *kernel)
2030{
2031 enum map_type type;
2032
2033 for (type = 0; type < MAP__NR_TYPES; ++type) {
2034 struct kmap *kmap;
2035
2036 self->vmlinux_maps[type] = map__new2(0, kernel, type);
2037 if (self->vmlinux_maps[type] == NULL)
2038 return -1;
2039
2040 self->vmlinux_maps[type]->map_ip =
2041 self->vmlinux_maps[type]->unmap_ip = identity__map_ip;
2042
2043 kmap = map__kmap(self->vmlinux_maps[type]);
2044 kmap->kmaps = &self->kmaps;
2045 map_groups__insert(&self->kmaps, self->vmlinux_maps[type]);
2046 }
1685 2047
1686 return 0; 2048 return 0;
1687} 2049}
1688 2050
2051int machine__create_kernel_maps(struct machine *self)
2052{
2053 struct dso *kernel = machine__create_kernel(self);
2054
2055 if (kernel == NULL ||
2056 __machine__create_kernel_maps(self, kernel) < 0)
2057 return -1;
2058
2059 if (symbol_conf.use_modules && machine__create_modules(self) < 0)
2060 pr_debug("Problems creating module maps, continuing anyway...\n");
2061 /*
2062 * Now that we have all the maps created, just set the ->end of them:
2063 */
2064 map_groups__fixup_end(&self->kmaps);
2065 return 0;
2066}
2067
1689static void vmlinux_path__exit(void) 2068static void vmlinux_path__exit(void)
1690{ 2069{
1691 while (--vmlinux_path__nr_entries >= 0) { 2070 while (--vmlinux_path__nr_entries >= 0) {
@@ -1741,6 +2120,25 @@ out_fail:
1741 return -1; 2120 return -1;
1742} 2121}
1743 2122
2123size_t machine__fprintf_vmlinux_path(struct machine *self, FILE *fp)
2124{
2125 int i;
2126 size_t printed = 0;
2127 struct dso *kdso = self->vmlinux_maps[MAP__FUNCTION]->dso;
2128
2129 if (kdso->has_build_id) {
2130 char filename[PATH_MAX];
2131 if (dso__build_id_filename(kdso, filename, sizeof(filename)))
2132 printed += fprintf(fp, "[0] %s\n", filename);
2133 }
2134
2135 for (i = 0; i < vmlinux_path__nr_entries; ++i)
2136 printed += fprintf(fp, "[%d] %s\n",
2137 i + kdso->has_build_id, vmlinux_path[i]);
2138
2139 return printed;
2140}
2141
1744static int setup_list(struct strlist **list, const char *list_str, 2142static int setup_list(struct strlist **list, const char *list_str,
1745 const char *list_name) 2143 const char *list_name)
1746{ 2144{
@@ -1791,19 +2189,129 @@ out_free_comm_list:
1791 return -1; 2189 return -1;
1792} 2190}
1793 2191
1794int perf_session__create_kernel_maps(struct perf_session *self) 2192int machines__create_kernel_maps(struct rb_root *self, pid_t pid)
1795{ 2193{
1796 if (map_groups__create_kernel_maps(&self->kmaps, 2194 struct machine *machine = machines__findnew(self, pid);
1797 symbol_conf.vmlinux_name) < 0) 2195
2196 if (machine == NULL)
1798 return -1; 2197 return -1;
1799 2198
1800 if (symbol_conf.use_modules && 2199 return machine__create_kernel_maps(machine);
1801 perf_session__create_module_maps(self) < 0) 2200}
1802 pr_debug("Failed to load list of modules for session %s, " 2201
1803 "continuing...\n", self->filename); 2202static int hex(char ch)
1804 /* 2203{
1805 * Now that we have all the maps created, just set the ->end of them: 2204 if ((ch >= '0') && (ch <= '9'))
1806 */ 2205 return ch - '0';
1807 map_groups__fixup_end(&self->kmaps); 2206 if ((ch >= 'a') && (ch <= 'f'))
1808 return 0; 2207 return ch - 'a' + 10;
2208 if ((ch >= 'A') && (ch <= 'F'))
2209 return ch - 'A' + 10;
2210 return -1;
2211}
2212
2213/*
2214 * While we find nice hex chars, build a long_val.
2215 * Return number of chars processed.
2216 */
2217int hex2u64(const char *ptr, u64 *long_val)
2218{
2219 const char *p = ptr;
2220 *long_val = 0;
2221
2222 while (*p) {
2223 const int hex_val = hex(*p);
2224
2225 if (hex_val < 0)
2226 break;
2227
2228 *long_val = (*long_val << 4) | hex_val;
2229 p++;
2230 }
2231
2232 return p - ptr;
2233}
2234
2235char *strxfrchar(char *s, char from, char to)
2236{
2237 char *p = s;
2238
2239 while ((p = strchr(p, from)) != NULL)
2240 *p++ = to;
2241
2242 return s;
2243}
2244
2245int machines__create_guest_kernel_maps(struct rb_root *self)
2246{
2247 int ret = 0;
2248 struct dirent **namelist = NULL;
2249 int i, items = 0;
2250 char path[PATH_MAX];
2251 pid_t pid;
2252
2253 if (symbol_conf.default_guest_vmlinux_name ||
2254 symbol_conf.default_guest_modules ||
2255 symbol_conf.default_guest_kallsyms) {
2256 machines__create_kernel_maps(self, DEFAULT_GUEST_KERNEL_ID);
2257 }
2258
2259 if (symbol_conf.guestmount) {
2260 items = scandir(symbol_conf.guestmount, &namelist, NULL, NULL);
2261 if (items <= 0)
2262 return -ENOENT;
2263 for (i = 0; i < items; i++) {
2264 if (!isdigit(namelist[i]->d_name[0])) {
2265 /* Filter out . and .. */
2266 continue;
2267 }
2268 pid = atoi(namelist[i]->d_name);
2269 sprintf(path, "%s/%s/proc/kallsyms",
2270 symbol_conf.guestmount,
2271 namelist[i]->d_name);
2272 ret = access(path, R_OK);
2273 if (ret) {
2274 pr_debug("Can't access file %s\n", path);
2275 goto failure;
2276 }
2277 machines__create_kernel_maps(self, pid);
2278 }
2279failure:
2280 free(namelist);
2281 }
2282
2283 return ret;
2284}
2285
2286int machine__load_kallsyms(struct machine *self, const char *filename,
2287 enum map_type type, symbol_filter_t filter)
2288{
2289 struct map *map = self->vmlinux_maps[type];
2290 int ret = dso__load_kallsyms(map->dso, filename, map, filter);
2291
2292 if (ret > 0) {
2293 dso__set_loaded(map->dso, type);
2294 /*
2295 * Since /proc/kallsyms will have multiple sessions for the
2296 * kernel, with modules between them, fixup the end of all
2297 * sections.
2298 */
2299 __map_groups__fixup_end(&self->kmaps, type);
2300 }
2301
2302 return ret;
2303}
2304
2305int machine__load_vmlinux_path(struct machine *self, enum map_type type,
2306 symbol_filter_t filter)
2307{
2308 struct map *map = self->vmlinux_maps[type];
2309 int ret = dso__load_vmlinux_path(map->dso, map, filter);
2310
2311 if (ret > 0) {
2312 dso__set_loaded(map->dso, type);
2313 map__reloc_vmlinux(map);
2314 }
2315
2316 return ret;
1809} 2317}
diff --git a/tools/perf/util/symbol.h b/tools/perf/util/symbol.h
index 8aded2356f79..5e02d2c17154 100644
--- a/tools/perf/util/symbol.h
+++ b/tools/perf/util/symbol.h
@@ -3,10 +3,13 @@
3 3
4#include <linux/types.h> 4#include <linux/types.h>
5#include <stdbool.h> 5#include <stdbool.h>
6#include "types.h" 6#include <stdint.h>
7#include "map.h"
7#include <linux/list.h> 8#include <linux/list.h>
8#include <linux/rbtree.h> 9#include <linux/rbtree.h>
9#include "event.h" 10#include <stdio.h>
11
12#define DEBUG_CACHE_DIR ".debug"
10 13
11#ifdef HAVE_CPLUS_DEMANGLE 14#ifdef HAVE_CPLUS_DEMANGLE
12extern char *cplus_demangle(const char *, int); 15extern char *cplus_demangle(const char *, int);
@@ -27,6 +30,9 @@ static inline char *bfd_demangle(void __used *v, const char __used *c,
27#endif 30#endif
28#endif 31#endif
29 32
33int hex2u64(const char *ptr, u64 *val);
34char *strxfrchar(char *s, char from, char to);
35
30/* 36/*
31 * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP; 37 * libelf 0.8.x and earlier do not support ELF_C_READ_MMAP;
32 * for newer versions we can use mmap to reduce memory usage: 38 * for newer versions we can use mmap to reduce memory usage:
@@ -42,13 +48,18 @@ static inline char *bfd_demangle(void __used *v, const char __used *c,
42#define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */ 48#define DMGL_ANSI (1 << 1) /* Include const, volatile, etc */
43#endif 49#endif
44 50
51#define BUILD_ID_SIZE 20
52
45struct symbol { 53struct symbol {
46 struct rb_node rb_node; 54 struct rb_node rb_node;
47 u64 start; 55 u64 start;
48 u64 end; 56 u64 end;
57 u16 namelen;
49 char name[0]; 58 char name[0];
50}; 59};
51 60
61void symbol__delete(struct symbol *self);
62
52struct strlist; 63struct strlist;
53 64
54struct symbol_conf { 65struct symbol_conf {
@@ -58,10 +69,16 @@ struct symbol_conf {
58 sort_by_name, 69 sort_by_name,
59 show_nr_samples, 70 show_nr_samples,
60 use_callchain, 71 use_callchain,
61 exclude_other; 72 exclude_other,
73 full_paths,
74 show_cpu_utilization;
62 const char *vmlinux_name, 75 const char *vmlinux_name,
63 *field_sep; 76 *field_sep;
64 char *dso_list_str, 77 const char *default_guest_vmlinux_name,
78 *default_guest_kallsyms,
79 *default_guest_modules;
80 const char *guestmount;
81 const char *dso_list_str,
65 *comm_list_str, 82 *comm_list_str,
66 *sym_list_str, 83 *sym_list_str,
67 *col_width_list_str; 84 *col_width_list_str;
@@ -77,6 +94,17 @@ static inline void *symbol__priv(struct symbol *self)
77 return ((void *)self) - symbol_conf.priv_size; 94 return ((void *)self) - symbol_conf.priv_size;
78} 95}
79 96
97struct ref_reloc_sym {
98 const char *name;
99 u64 addr;
100 u64 unrelocated_addr;
101};
102
103struct map_symbol {
104 struct map *map;
105 struct symbol *sym;
106};
107
80struct addr_location { 108struct addr_location {
81 struct thread *thread; 109 struct thread *thread;
82 struct map *map; 110 struct map *map;
@@ -84,6 +112,13 @@ struct addr_location {
84 u64 addr; 112 u64 addr;
85 char level; 113 char level;
86 bool filtered; 114 bool filtered;
115 unsigned int cpumode;
116};
117
118enum dso_kernel_type {
119 DSO_TYPE_USER = 0,
120 DSO_TYPE_KERNEL,
121 DSO_TYPE_GUEST_KERNEL
87}; 122};
88 123
89struct dso { 124struct dso {
@@ -93,49 +128,94 @@ struct dso {
93 u8 adjust_symbols:1; 128 u8 adjust_symbols:1;
94 u8 slen_calculated:1; 129 u8 slen_calculated:1;
95 u8 has_build_id:1; 130 u8 has_build_id:1;
96 u8 kernel:1; 131 enum dso_kernel_type kernel;
132 u8 hit:1;
133 u8 annotate_warned:1;
97 unsigned char origin; 134 unsigned char origin;
98 u8 sorted_by_name; 135 u8 sorted_by_name;
99 u8 loaded; 136 u8 loaded;
100 u8 build_id[BUILD_ID_SIZE]; 137 u8 build_id[BUILD_ID_SIZE];
101 u16 long_name_len;
102 const char *short_name; 138 const char *short_name;
103 char *long_name; 139 char *long_name;
140 u16 long_name_len;
141 u16 short_name_len;
104 char name[0]; 142 char name[0];
105}; 143};
106 144
107struct dso *dso__new(const char *name); 145struct dso *dso__new(const char *name);
146struct dso *dso__new_kernel(const char *name);
108void dso__delete(struct dso *self); 147void dso__delete(struct dso *self);
109 148
110bool dso__loaded(const struct dso *self, enum map_type type); 149bool dso__loaded(const struct dso *self, enum map_type type);
111bool dso__sorted_by_name(const struct dso *self, enum map_type type); 150bool dso__sorted_by_name(const struct dso *self, enum map_type type);
112 151
152static inline void dso__set_loaded(struct dso *self, enum map_type type)
153{
154 self->loaded |= (1 << type);
155}
156
113void dso__sort_by_name(struct dso *self, enum map_type type); 157void dso__sort_by_name(struct dso *self, enum map_type type);
114 158
115struct perf_session; 159struct dso *__dsos__findnew(struct list_head *head, const char *name);
160
161int dso__load(struct dso *self, struct map *map, symbol_filter_t filter);
162int dso__load_vmlinux_path(struct dso *self, struct map *map,
163 symbol_filter_t filter);
164int dso__load_kallsyms(struct dso *self, const char *filename, struct map *map,
165 symbol_filter_t filter);
166int machine__load_kallsyms(struct machine *self, const char *filename,
167 enum map_type type, symbol_filter_t filter);
168int machine__load_vmlinux_path(struct machine *self, enum map_type type,
169 symbol_filter_t filter);
170
171size_t __dsos__fprintf(struct list_head *head, FILE *fp);
116 172
117struct dso *dsos__findnew(const char *name); 173size_t machine__fprintf_dsos_buildid(struct machine *self, FILE *fp, bool with_hits);
118int dso__load(struct dso *self, struct map *map, struct perf_session *session, 174size_t machines__fprintf_dsos(struct rb_root *self, FILE *fp);
119 symbol_filter_t filter); 175size_t machines__fprintf_dsos_buildid(struct rb_root *self, FILE *fp, bool with_hits);
120void dsos__fprintf(FILE *fp);
121size_t dsos__fprintf_buildid(FILE *fp);
122 176
123size_t dso__fprintf_buildid(struct dso *self, FILE *fp); 177size_t dso__fprintf_buildid(struct dso *self, FILE *fp);
124size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp); 178size_t dso__fprintf(struct dso *self, enum map_type type, FILE *fp);
179
180enum dso_origin {
181 DSO__ORIG_KERNEL = 0,
182 DSO__ORIG_GUEST_KERNEL,
183 DSO__ORIG_JAVA_JIT,
184 DSO__ORIG_BUILD_ID_CACHE,
185 DSO__ORIG_FEDORA,
186 DSO__ORIG_UBUNTU,
187 DSO__ORIG_BUILDID,
188 DSO__ORIG_DSO,
189 DSO__ORIG_GUEST_KMODULE,
190 DSO__ORIG_KMODULE,
191 DSO__ORIG_NOT_FOUND,
192};
193
125char dso__symtab_origin(const struct dso *self); 194char dso__symtab_origin(const struct dso *self);
195void dso__set_long_name(struct dso *self, char *name);
126void dso__set_build_id(struct dso *self, void *build_id); 196void dso__set_build_id(struct dso *self, void *build_id);
197void dso__read_running_kernel_build_id(struct dso *self, struct machine *machine);
127struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr); 198struct symbol *dso__find_symbol(struct dso *self, enum map_type type, u64 addr);
128struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type, 199struct symbol *dso__find_symbol_by_name(struct dso *self, enum map_type type,
129 const char *name); 200 const char *name);
130 201
131int filename__read_build_id(const char *filename, void *bf, size_t size); 202int filename__read_build_id(const char *filename, void *bf, size_t size);
132int sysfs__read_build_id(const char *filename, void *bf, size_t size); 203int sysfs__read_build_id(const char *filename, void *bf, size_t size);
133bool dsos__read_build_ids(void); 204bool __dsos__read_build_ids(struct list_head *head, bool with_hits);
134int build_id__sprintf(u8 *self, int len, char *bf); 205int build_id__sprintf(const u8 *self, int len, char *bf);
206int kallsyms__parse(const char *filename, void *arg,
207 int (*process_symbol)(void *arg, const char *name,
208 char type, u64 start));
209
210int __machine__create_kernel_maps(struct machine *self, struct dso *kernel);
211int machine__create_kernel_maps(struct machine *self);
212
213int machines__create_kernel_maps(struct rb_root *self, pid_t pid);
214int machines__create_guest_kernel_maps(struct rb_root *self);
135 215
136int symbol__init(void); 216int symbol__init(void);
137int perf_session__create_kernel_maps(struct perf_session *self); 217bool symbol_type__is_a(char symbol_type, enum map_type map_type);
218
219size_t machine__fprintf_vmlinux_path(struct machine *self, FILE *fp);
138 220
139extern struct list_head dsos__user, dsos__kernel;
140extern struct dso *vdso;
141#endif /* __PERF_SYMBOL */ 221#endif /* __PERF_SYMBOL */
diff --git a/tools/perf/util/thread.c b/tools/perf/util/thread.c
index 4a08dcf50b68..9a448b47400c 100644
--- a/tools/perf/util/thread.c
+++ b/tools/perf/util/thread.c
@@ -7,13 +7,44 @@
7#include "util.h" 7#include "util.h"
8#include "debug.h" 8#include "debug.h"
9 9
10void map_groups__init(struct map_groups *self) 10/* Skip "." and ".." directories */
11static int filter(const struct dirent *dir)
11{ 12{
13 if (dir->d_name[0] == '.')
14 return 0;
15 else
16 return 1;
17}
18
19int find_all_tid(int pid, pid_t ** all_tid)
20{
21 char name[256];
22 int items;
23 struct dirent **namelist = NULL;
24 int ret = 0;
12 int i; 25 int i;
13 for (i = 0; i < MAP__NR_TYPES; ++i) { 26
14 self->maps[i] = RB_ROOT; 27 sprintf(name, "/proc/%d/task", pid);
15 INIT_LIST_HEAD(&self->removed_maps[i]); 28 items = scandir(name, &namelist, filter, NULL);
29 if (items <= 0)
30 return -ENOENT;
31 *all_tid = malloc(sizeof(pid_t) * items);
32 if (!*all_tid) {
33 ret = -ENOMEM;
34 goto failure;
16 } 35 }
36
37 for (i = 0; i < items; i++)
38 (*all_tid)[i] = atoi(namelist[i]->d_name);
39
40 ret = items;
41
42failure:
43 for (i=0; i<items; i++)
44 free(namelist[i]);
45 free(namelist);
46
47 return ret;
17} 48}
18 49
19static struct thread *thread__new(pid_t pid) 50static struct thread *thread__new(pid_t pid)
@@ -33,10 +64,17 @@ static struct thread *thread__new(pid_t pid)
33 64
34int thread__set_comm(struct thread *self, const char *comm) 65int thread__set_comm(struct thread *self, const char *comm)
35{ 66{
67 int err;
68
36 if (self->comm) 69 if (self->comm)
37 free(self->comm); 70 free(self->comm);
38 self->comm = strdup(comm); 71 self->comm = strdup(comm);
39 return self->comm ? 0 : -ENOMEM; 72 err = self->comm == NULL ? -ENOMEM : 0;
73 if (!err) {
74 self->comm_set = true;
75 map_groups__flush(&self->mg);
76 }
77 return err;
40} 78}
41 79
42int thread__comm_len(struct thread *self) 80int thread__comm_len(struct thread *self)
@@ -50,74 +88,10 @@ int thread__comm_len(struct thread *self)
50 return self->comm_len; 88 return self->comm_len;
51} 89}
52 90
53static const char *map_type__name[MAP__NR_TYPES] = {
54 [MAP__FUNCTION] = "Functions",
55 [MAP__VARIABLE] = "Variables",
56};
57
58static size_t __map_groups__fprintf_maps(struct map_groups *self,
59 enum map_type type, FILE *fp)
60{
61 size_t printed = fprintf(fp, "%s:\n", map_type__name[type]);
62 struct rb_node *nd;
63
64 for (nd = rb_first(&self->maps[type]); nd; nd = rb_next(nd)) {
65 struct map *pos = rb_entry(nd, struct map, rb_node);
66 printed += fprintf(fp, "Map:");
67 printed += map__fprintf(pos, fp);
68 if (verbose > 1) {
69 printed += dso__fprintf(pos->dso, type, fp);
70 printed += fprintf(fp, "--\n");
71 }
72 }
73
74 return printed;
75}
76
77size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp)
78{
79 size_t printed = 0, i;
80 for (i = 0; i < MAP__NR_TYPES; ++i)
81 printed += __map_groups__fprintf_maps(self, i, fp);
82 return printed;
83}
84
85static size_t __map_groups__fprintf_removed_maps(struct map_groups *self,
86 enum map_type type, FILE *fp)
87{
88 struct map *pos;
89 size_t printed = 0;
90
91 list_for_each_entry(pos, &self->removed_maps[type], node) {
92 printed += fprintf(fp, "Map:");
93 printed += map__fprintf(pos, fp);
94 if (verbose > 1) {
95 printed += dso__fprintf(pos->dso, type, fp);
96 printed += fprintf(fp, "--\n");
97 }
98 }
99 return printed;
100}
101
102static size_t map_groups__fprintf_removed_maps(struct map_groups *self, FILE *fp)
103{
104 size_t printed = 0, i;
105 for (i = 0; i < MAP__NR_TYPES; ++i)
106 printed += __map_groups__fprintf_removed_maps(self, i, fp);
107 return printed;
108}
109
110static size_t map_groups__fprintf(struct map_groups *self, FILE *fp)
111{
112 size_t printed = map_groups__fprintf_maps(self, fp);
113 printed += fprintf(fp, "Removed maps:\n");
114 return printed + map_groups__fprintf_removed_maps(self, fp);
115}
116
117static size_t thread__fprintf(struct thread *self, FILE *fp) 91static size_t thread__fprintf(struct thread *self, FILE *fp)
118{ 92{
119 return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) + 93 return fprintf(fp, "Thread %d %s\n", self->pid, self->comm) +
120 map_groups__fprintf(&self->mg, fp); 94 map_groups__fprintf(&self->mg, verbose, fp);
121} 95}
122 96
123struct thread *perf_session__findnew(struct perf_session *self, pid_t pid) 97struct thread *perf_session__findnew(struct perf_session *self, pid_t pid)
@@ -159,107 +133,24 @@ struct thread *perf_session__findnew(struct perf_session *self, pid_t pid)
159 return th; 133 return th;
160} 134}
161 135
162static void map_groups__remove_overlappings(struct map_groups *self,
163 struct map *map)
164{
165 struct rb_root *root = &self->maps[map->type];
166 struct rb_node *next = rb_first(root);
167
168 while (next) {
169 struct map *pos = rb_entry(next, struct map, rb_node);
170 next = rb_next(&pos->rb_node);
171
172 if (!map__overlap(pos, map))
173 continue;
174
175 if (verbose >= 2) {
176 fputs("overlapping maps:\n", stderr);
177 map__fprintf(map, stderr);
178 map__fprintf(pos, stderr);
179 }
180
181 rb_erase(&pos->rb_node, root);
182 /*
183 * We may have references to this map, for instance in some
184 * hist_entry instances, so just move them to a separate
185 * list.
186 */
187 list_add_tail(&pos->node, &self->removed_maps[map->type]);
188 }
189}
190
191void maps__insert(struct rb_root *maps, struct map *map)
192{
193 struct rb_node **p = &maps->rb_node;
194 struct rb_node *parent = NULL;
195 const u64 ip = map->start;
196 struct map *m;
197
198 while (*p != NULL) {
199 parent = *p;
200 m = rb_entry(parent, struct map, rb_node);
201 if (ip < m->start)
202 p = &(*p)->rb_left;
203 else
204 p = &(*p)->rb_right;
205 }
206
207 rb_link_node(&map->rb_node, parent, p);
208 rb_insert_color(&map->rb_node, maps);
209}
210
211struct map *maps__find(struct rb_root *maps, u64 ip)
212{
213 struct rb_node **p = &maps->rb_node;
214 struct rb_node *parent = NULL;
215 struct map *m;
216
217 while (*p != NULL) {
218 parent = *p;
219 m = rb_entry(parent, struct map, rb_node);
220 if (ip < m->start)
221 p = &(*p)->rb_left;
222 else if (ip > m->end)
223 p = &(*p)->rb_right;
224 else
225 return m;
226 }
227
228 return NULL;
229}
230
231void thread__insert_map(struct thread *self, struct map *map) 136void thread__insert_map(struct thread *self, struct map *map)
232{ 137{
233 map_groups__remove_overlappings(&self->mg, map); 138 map_groups__fixup_overlappings(&self->mg, map, verbose, stderr);
234 map_groups__insert(&self->mg, map); 139 map_groups__insert(&self->mg, map);
235} 140}
236 141
237/*
238 * XXX This should not really _copy_ te maps, but refcount them.
239 */
240static int map_groups__clone(struct map_groups *self,
241 struct map_groups *parent, enum map_type type)
242{
243 struct rb_node *nd;
244 for (nd = rb_first(&parent->maps[type]); nd; nd = rb_next(nd)) {
245 struct map *map = rb_entry(nd, struct map, rb_node);
246 struct map *new = map__clone(map);
247 if (new == NULL)
248 return -ENOMEM;
249 map_groups__insert(self, new);
250 }
251 return 0;
252}
253
254int thread__fork(struct thread *self, struct thread *parent) 142int thread__fork(struct thread *self, struct thread *parent)
255{ 143{
256 int i; 144 int i;
257 145
258 if (self->comm) 146 if (parent->comm_set) {
259 free(self->comm); 147 if (self->comm)
260 self->comm = strdup(parent->comm); 148 free(self->comm);
261 if (!self->comm) 149 self->comm = strdup(parent->comm);
262 return -ENOMEM; 150 if (!self->comm)
151 return -ENOMEM;
152 self->comm_set = true;
153 }
263 154
264 for (i = 0; i < MAP__NR_TYPES; ++i) 155 for (i = 0; i < MAP__NR_TYPES; ++i)
265 if (map_groups__clone(&self->mg, &parent->mg, i) < 0) 156 if (map_groups__clone(&self->mg, &parent->mg, i) < 0)
@@ -280,16 +171,3 @@ size_t perf_session__fprintf(struct perf_session *self, FILE *fp)
280 171
281 return ret; 172 return ret;
282} 173}
283
284struct symbol *map_groups__find_symbol(struct map_groups *self,
285 struct perf_session *session,
286 enum map_type type, u64 addr,
287 symbol_filter_t filter)
288{
289 struct map *map = map_groups__find(self, type, addr);
290
291 if (map != NULL)
292 return map__find_symbol(map, session, map->map_ip(map, addr), filter);
293
294 return NULL;
295}
diff --git a/tools/perf/util/thread.h b/tools/perf/util/thread.h
index c206f72c8881..ee6bbcf277ca 100644
--- a/tools/perf/util/thread.h
+++ b/tools/perf/util/thread.h
@@ -5,66 +5,43 @@
5#include <unistd.h> 5#include <unistd.h>
6#include "symbol.h" 6#include "symbol.h"
7 7
8struct map_groups {
9 struct rb_root maps[MAP__NR_TYPES];
10 struct list_head removed_maps[MAP__NR_TYPES];
11};
12
13struct thread { 8struct thread {
14 struct rb_node rb_node; 9 union {
10 struct rb_node rb_node;
11 struct list_head node;
12 };
15 struct map_groups mg; 13 struct map_groups mg;
16 pid_t pid; 14 pid_t pid;
17 char shortname[3]; 15 char shortname[3];
16 bool comm_set;
18 char *comm; 17 char *comm;
19 int comm_len; 18 int comm_len;
20}; 19};
21 20
22void map_groups__init(struct map_groups *self); 21struct perf_session;
22
23int find_all_tid(int pid, pid_t ** all_tid);
23int thread__set_comm(struct thread *self, const char *comm); 24int thread__set_comm(struct thread *self, const char *comm);
24int thread__comm_len(struct thread *self); 25int thread__comm_len(struct thread *self);
25struct thread *perf_session__findnew(struct perf_session *self, pid_t pid); 26struct thread *perf_session__findnew(struct perf_session *self, pid_t pid);
26void thread__insert_map(struct thread *self, struct map *map); 27void thread__insert_map(struct thread *self, struct map *map);
27int thread__fork(struct thread *self, struct thread *parent); 28int thread__fork(struct thread *self, struct thread *parent);
28size_t map_groups__fprintf_maps(struct map_groups *self, FILE *fp);
29size_t perf_session__fprintf(struct perf_session *self, FILE *fp); 29size_t perf_session__fprintf(struct perf_session *self, FILE *fp);
30 30
31void maps__insert(struct rb_root *maps, struct map *map);
32struct map *maps__find(struct rb_root *maps, u64 addr);
33
34static inline void map_groups__insert(struct map_groups *self, struct map *map)
35{
36 maps__insert(&self->maps[map->type], map);
37}
38
39static inline struct map *map_groups__find(struct map_groups *self,
40 enum map_type type, u64 addr)
41{
42 return maps__find(&self->maps[type], addr);
43}
44
45static inline struct map *thread__find_map(struct thread *self, 31static inline struct map *thread__find_map(struct thread *self,
46 enum map_type type, u64 addr) 32 enum map_type type, u64 addr)
47{ 33{
48 return self ? map_groups__find(&self->mg, type, addr) : NULL; 34 return self ? map_groups__find(&self->mg, type, addr) : NULL;
49} 35}
50 36
37void thread__find_addr_map(struct thread *self,
38 struct perf_session *session, u8 cpumode,
39 enum map_type type, pid_t pid, u64 addr,
40 struct addr_location *al);
41
51void thread__find_addr_location(struct thread *self, 42void thread__find_addr_location(struct thread *self,
52 struct perf_session *session, u8 cpumode, 43 struct perf_session *session, u8 cpumode,
53 enum map_type type, u64 addr, 44 enum map_type type, pid_t pid, u64 addr,
54 struct addr_location *al, 45 struct addr_location *al,
55 symbol_filter_t filter); 46 symbol_filter_t filter);
56struct symbol *map_groups__find_symbol(struct map_groups *self,
57 struct perf_session *session,
58 enum map_type type, u64 addr,
59 symbol_filter_t filter);
60
61static inline struct symbol *
62map_groups__find_function(struct map_groups *self, struct perf_session *session,
63 u64 addr, symbol_filter_t filter)
64{
65 return map_groups__find_symbol(self, session, MAP__FUNCTION, addr, filter);
66}
67
68struct map *map_groups__find_by_name(struct map_groups *self,
69 enum map_type type, const char *name);
70#endif /* __PERF_THREAD_H */ 47#endif /* __PERF_THREAD_H */
diff --git a/tools/perf/util/trace-event-info.c b/tools/perf/util/trace-event-info.c
index cace35595530..b1572601286c 100644
--- a/tools/perf/util/trace-event-info.c
+++ b/tools/perf/util/trace-event-info.c
@@ -20,6 +20,7 @@
20 */ 20 */
21#define _GNU_SOURCE 21#define _GNU_SOURCE
22#include <dirent.h> 22#include <dirent.h>
23#include <mntent.h>
23#include <stdio.h> 24#include <stdio.h>
24#include <stdlib.h> 25#include <stdlib.h>
25#include <string.h> 26#include <string.h>
@@ -37,6 +38,7 @@
37 38
38#include "../perf.h" 39#include "../perf.h"
39#include "trace-event.h" 40#include "trace-event.h"
41#include "debugfs.h"
40 42
41#define VERSION "0.5" 43#define VERSION "0.5"
42 44
@@ -101,32 +103,12 @@ void *malloc_or_die(unsigned int size)
101 103
102static const char *find_debugfs(void) 104static const char *find_debugfs(void)
103{ 105{
104 static char debugfs[MAX_PATH+1]; 106 const char *path = debugfs_mount(NULL);
105 static int debugfs_found;
106 char type[100];
107 FILE *fp;
108
109 if (debugfs_found)
110 return debugfs;
111
112 if ((fp = fopen("/proc/mounts","r")) == NULL)
113 die("Can't open /proc/mounts for read");
114
115 while (fscanf(fp, "%*s %"
116 STR(MAX_PATH)
117 "s %99s %*s %*d %*d\n",
118 debugfs, type) == 2) {
119 if (strcmp(type, "debugfs") == 0)
120 break;
121 }
122 fclose(fp);
123
124 if (strcmp(type, "debugfs") != 0)
125 die("debugfs not mounted, please mount");
126 107
127 debugfs_found = 1; 108 if (!path)
109 die("Your kernel not support debugfs filesystem");
128 110
129 return debugfs; 111 return path;
130} 112}
131 113
132/* 114/*
@@ -172,10 +154,17 @@ static void put_tracing_file(char *file)
172 free(file); 154 free(file);
173} 155}
174 156
157static ssize_t calc_data_size;
158
175static ssize_t write_or_die(const void *buf, size_t len) 159static ssize_t write_or_die(const void *buf, size_t len)
176{ 160{
177 int ret; 161 int ret;
178 162
163 if (calc_data_size) {
164 calc_data_size += len;
165 return len;
166 }
167
179 ret = write(output_fd, buf, len); 168 ret = write(output_fd, buf, len);
180 if (ret < 0) 169 if (ret < 0)
181 die("writing to '%s'", output_file); 170 die("writing to '%s'", output_file);
@@ -271,6 +260,8 @@ static void read_header_files(void)
271 write_or_die("header_page", 12); 260 write_or_die("header_page", 12);
272 write_or_die(&size, 8); 261 write_or_die(&size, 8);
273 check_size = copy_file_fd(fd); 262 check_size = copy_file_fd(fd);
263 close(fd);
264
274 if (size != check_size) 265 if (size != check_size)
275 die("wrong size for '%s' size=%lld read=%lld", 266 die("wrong size for '%s' size=%lld read=%lld",
276 path, size, check_size); 267 path, size, check_size);
@@ -289,6 +280,7 @@ static void read_header_files(void)
289 if (size != check_size) 280 if (size != check_size)
290 die("wrong size for '%s'", path); 281 die("wrong size for '%s'", path);
291 put_tracing_file(path); 282 put_tracing_file(path);
283 close(fd);
292} 284}
293 285
294static bool name_in_tp_list(char *sys, struct tracepoint_path *tps) 286static bool name_in_tp_list(char *sys, struct tracepoint_path *tps)
@@ -317,7 +309,8 @@ static void copy_event_system(const char *sys, struct tracepoint_path *tps)
317 die("can't read directory '%s'", sys); 309 die("can't read directory '%s'", sys);
318 310
319 while ((dent = readdir(dir))) { 311 while ((dent = readdir(dir))) {
320 if (strcmp(dent->d_name, ".") == 0 || 312 if (dent->d_type != DT_DIR ||
313 strcmp(dent->d_name, ".") == 0 ||
321 strcmp(dent->d_name, "..") == 0 || 314 strcmp(dent->d_name, "..") == 0 ||
322 !name_in_tp_list(dent->d_name, tps)) 315 !name_in_tp_list(dent->d_name, tps))
323 continue; 316 continue;
@@ -334,7 +327,8 @@ static void copy_event_system(const char *sys, struct tracepoint_path *tps)
334 327
335 rewinddir(dir); 328 rewinddir(dir);
336 while ((dent = readdir(dir))) { 329 while ((dent = readdir(dir))) {
337 if (strcmp(dent->d_name, ".") == 0 || 330 if (dent->d_type != DT_DIR ||
331 strcmp(dent->d_name, ".") == 0 ||
338 strcmp(dent->d_name, "..") == 0 || 332 strcmp(dent->d_name, "..") == 0 ||
339 !name_in_tp_list(dent->d_name, tps)) 333 !name_in_tp_list(dent->d_name, tps))
340 continue; 334 continue;
@@ -353,6 +347,7 @@ static void copy_event_system(const char *sys, struct tracepoint_path *tps)
353 347
354 free(format); 348 free(format);
355 } 349 }
350 closedir(dir);
356} 351}
357 352
358static void read_ftrace_files(struct tracepoint_path *tps) 353static void read_ftrace_files(struct tracepoint_path *tps)
@@ -394,26 +389,21 @@ static void read_event_files(struct tracepoint_path *tps)
394 die("can't read directory '%s'", path); 389 die("can't read directory '%s'", path);
395 390
396 while ((dent = readdir(dir))) { 391 while ((dent = readdir(dir))) {
397 if (strcmp(dent->d_name, ".") == 0 || 392 if (dent->d_type != DT_DIR ||
393 strcmp(dent->d_name, ".") == 0 ||
398 strcmp(dent->d_name, "..") == 0 || 394 strcmp(dent->d_name, "..") == 0 ||
399 strcmp(dent->d_name, "ftrace") == 0 || 395 strcmp(dent->d_name, "ftrace") == 0 ||
400 !system_in_tp_list(dent->d_name, tps)) 396 !system_in_tp_list(dent->d_name, tps))
401 continue; 397 continue;
402 sys = malloc_or_die(strlen(path) + strlen(dent->d_name) + 2); 398 count++;
403 sprintf(sys, "%s/%s", path, dent->d_name);
404 ret = stat(sys, &st);
405 free(sys);
406 if (ret < 0)
407 continue;
408 if (S_ISDIR(st.st_mode))
409 count++;
410 } 399 }
411 400
412 write_or_die(&count, 4); 401 write_or_die(&count, 4);
413 402
414 rewinddir(dir); 403 rewinddir(dir);
415 while ((dent = readdir(dir))) { 404 while ((dent = readdir(dir))) {
416 if (strcmp(dent->d_name, ".") == 0 || 405 if (dent->d_type != DT_DIR ||
406 strcmp(dent->d_name, ".") == 0 ||
417 strcmp(dent->d_name, "..") == 0 || 407 strcmp(dent->d_name, "..") == 0 ||
418 strcmp(dent->d_name, "ftrace") == 0 || 408 strcmp(dent->d_name, "ftrace") == 0 ||
419 !system_in_tp_list(dent->d_name, tps)) 409 !system_in_tp_list(dent->d_name, tps))
@@ -422,14 +412,13 @@ static void read_event_files(struct tracepoint_path *tps)
422 sprintf(sys, "%s/%s", path, dent->d_name); 412 sprintf(sys, "%s/%s", path, dent->d_name);
423 ret = stat(sys, &st); 413 ret = stat(sys, &st);
424 if (ret >= 0) { 414 if (ret >= 0) {
425 if (S_ISDIR(st.st_mode)) { 415 write_or_die(dent->d_name, strlen(dent->d_name) + 1);
426 write_or_die(dent->d_name, strlen(dent->d_name) + 1); 416 copy_event_system(sys, tps);
427 copy_event_system(sys, tps);
428 }
429 } 417 }
430 free(sys); 418 free(sys);
431 } 419 }
432 420
421 closedir(dir);
433 put_tracing_file(path); 422 put_tracing_file(path);
434} 423}
435 424
@@ -498,6 +487,17 @@ get_tracepoints_path(struct perf_event_attr *pattrs, int nb_events)
498 return nr_tracepoints > 0 ? path.next : NULL; 487 return nr_tracepoints > 0 ? path.next : NULL;
499} 488}
500 489
490bool have_tracepoints(struct perf_event_attr *pattrs, int nb_events)
491{
492 int i;
493
494 for (i = 0; i < nb_events; i++)
495 if (pattrs[i].type == PERF_TYPE_TRACEPOINT)
496 return true;
497
498 return false;
499}
500
501int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events) 501int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events)
502{ 502{
503 char buf[BUFSIZ]; 503 char buf[BUFSIZ];
@@ -533,7 +533,7 @@ int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events)
533 write_or_die(buf, 1); 533 write_or_die(buf, 1);
534 534
535 /* save page_size */ 535 /* save page_size */
536 page_size = getpagesize(); 536 page_size = sysconf(_SC_PAGESIZE);
537 write_or_die(&page_size, 4); 537 write_or_die(&page_size, 4);
538 538
539 read_header_files(); 539 read_header_files();
@@ -544,3 +544,20 @@ int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events)
544 544
545 return 0; 545 return 0;
546} 546}
547
548ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs,
549 int nb_events)
550{
551 ssize_t size;
552 int err = 0;
553
554 calc_data_size = 1;
555 err = read_tracing_data(fd, pattrs, nb_events);
556 size = calc_data_size - 1;
557 calc_data_size = 0;
558
559 if (err < 0)
560 return err;
561
562 return size;
563}
diff --git a/tools/perf/util/trace-event-parse.c b/tools/perf/util/trace-event-parse.c
index c5c32be040bf..73a02223c629 100644
--- a/tools/perf/util/trace-event-parse.c
+++ b/tools/perf/util/trace-event-parse.c
@@ -37,10 +37,12 @@ int header_page_ts_offset;
37int header_page_ts_size; 37int header_page_ts_size;
38int header_page_size_offset; 38int header_page_size_offset;
39int header_page_size_size; 39int header_page_size_size;
40int header_page_overwrite_offset;
41int header_page_overwrite_size;
40int header_page_data_offset; 42int header_page_data_offset;
41int header_page_data_size; 43int header_page_data_size;
42 44
43int latency_format; 45bool latency_format;
44 46
45static char *input_buf; 47static char *input_buf;
46static unsigned long long input_buf_ptr; 48static unsigned long long input_buf_ptr;
@@ -628,23 +630,32 @@ static int test_type(enum event_type type, enum event_type expect)
628 return 0; 630 return 0;
629} 631}
630 632
631static int test_type_token(enum event_type type, char *token, 633static int __test_type_token(enum event_type type, char *token,
632 enum event_type expect, const char *expect_tok) 634 enum event_type expect, const char *expect_tok,
635 bool warn)
633{ 636{
634 if (type != expect) { 637 if (type != expect) {
635 warning("Error: expected type %d but read %d", 638 if (warn)
636 expect, type); 639 warning("Error: expected type %d but read %d",
640 expect, type);
637 return -1; 641 return -1;
638 } 642 }
639 643
640 if (strcmp(token, expect_tok) != 0) { 644 if (strcmp(token, expect_tok) != 0) {
641 warning("Error: expected '%s' but read '%s'", 645 if (warn)
642 expect_tok, token); 646 warning("Error: expected '%s' but read '%s'",
647 expect_tok, token);
643 return -1; 648 return -1;
644 } 649 }
645 return 0; 650 return 0;
646} 651}
647 652
653static int test_type_token(enum event_type type, char *token,
654 enum event_type expect, const char *expect_tok)
655{
656 return __test_type_token(type, token, expect, expect_tok, true);
657}
658
648static int __read_expect_type(enum event_type expect, char **tok, int newline_ok) 659static int __read_expect_type(enum event_type expect, char **tok, int newline_ok)
649{ 660{
650 enum event_type type; 661 enum event_type type;
@@ -661,7 +672,8 @@ static int read_expect_type(enum event_type expect, char **tok)
661 return __read_expect_type(expect, tok, 1); 672 return __read_expect_type(expect, tok, 1);
662} 673}
663 674
664static int __read_expected(enum event_type expect, const char *str, int newline_ok) 675static int __read_expected(enum event_type expect, const char *str,
676 int newline_ok, bool warn)
665{ 677{
666 enum event_type type; 678 enum event_type type;
667 char *token; 679 char *token;
@@ -672,7 +684,7 @@ static int __read_expected(enum event_type expect, const char *str, int newline_
672 else 684 else
673 type = read_token_item(&token); 685 type = read_token_item(&token);
674 686
675 ret = test_type_token(type, token, expect, str); 687 ret = __test_type_token(type, token, expect, str, warn);
676 688
677 free_token(token); 689 free_token(token);
678 690
@@ -681,12 +693,12 @@ static int __read_expected(enum event_type expect, const char *str, int newline_
681 693
682static int read_expected(enum event_type expect, const char *str) 694static int read_expected(enum event_type expect, const char *str)
683{ 695{
684 return __read_expected(expect, str, 1); 696 return __read_expected(expect, str, 1, true);
685} 697}
686 698
687static int read_expected_item(enum event_type expect, const char *str) 699static int read_expected_item(enum event_type expect, const char *str)
688{ 700{
689 return __read_expected(expect, str, 0); 701 return __read_expected(expect, str, 0, true);
690} 702}
691 703
692static char *event_read_name(void) 704static char *event_read_name(void)
@@ -744,7 +756,7 @@ static int field_is_string(struct format_field *field)
744 756
745static int field_is_dynamic(struct format_field *field) 757static int field_is_dynamic(struct format_field *field)
746{ 758{
747 if (!strcmp(field->type, "__data_loc")) 759 if (!strncmp(field->type, "__data_loc", 10))
748 return 1; 760 return 1;
749 761
750 return 0; 762 return 0;
@@ -1925,6 +1937,15 @@ void *raw_field_ptr(struct event *event, const char *name, void *data)
1925 if (!field) 1937 if (!field)
1926 return NULL; 1938 return NULL;
1927 1939
1940 if (field->flags & FIELD_IS_DYNAMIC) {
1941 int offset;
1942
1943 offset = *(int *)(data + field->offset);
1944 offset &= 0xffff;
1945
1946 return data + offset;
1947 }
1948
1928 return data + field->offset; 1949 return data + field->offset;
1929} 1950}
1930 1951
@@ -3078,88 +3099,6 @@ static void print_args(struct print_arg *args)
3078 } 3099 }
3079} 3100}
3080 3101
3081static void parse_header_field(const char *field,
3082 int *offset, int *size)
3083{
3084 char *token;
3085 int type;
3086
3087 if (read_expected(EVENT_ITEM, "field") < 0)
3088 return;
3089 if (read_expected(EVENT_OP, ":") < 0)
3090 return;
3091
3092 /* type */
3093 if (read_expect_type(EVENT_ITEM, &token) < 0)
3094 goto fail;
3095 free_token(token);
3096
3097 if (read_expected(EVENT_ITEM, field) < 0)
3098 return;
3099 if (read_expected(EVENT_OP, ";") < 0)
3100 return;
3101 if (read_expected(EVENT_ITEM, "offset") < 0)
3102 return;
3103 if (read_expected(EVENT_OP, ":") < 0)
3104 return;
3105 if (read_expect_type(EVENT_ITEM, &token) < 0)
3106 goto fail;
3107 *offset = atoi(token);
3108 free_token(token);
3109 if (read_expected(EVENT_OP, ";") < 0)
3110 return;
3111 if (read_expected(EVENT_ITEM, "size") < 0)
3112 return;
3113 if (read_expected(EVENT_OP, ":") < 0)
3114 return;
3115 if (read_expect_type(EVENT_ITEM, &token) < 0)
3116 goto fail;
3117 *size = atoi(token);
3118 free_token(token);
3119 if (read_expected(EVENT_OP, ";") < 0)
3120 return;
3121 type = read_token(&token);
3122 if (type != EVENT_NEWLINE) {
3123 /* newer versions of the kernel have a "signed" type */
3124 if (type != EVENT_ITEM)
3125 goto fail;
3126
3127 if (strcmp(token, "signed") != 0)
3128 goto fail;
3129
3130 free_token(token);
3131
3132 if (read_expected(EVENT_OP, ":") < 0)
3133 return;
3134
3135 if (read_expect_type(EVENT_ITEM, &token))
3136 goto fail;
3137
3138 free_token(token);
3139 if (read_expected(EVENT_OP, ";") < 0)
3140 return;
3141
3142 if (read_expect_type(EVENT_NEWLINE, &token))
3143 goto fail;
3144 }
3145 fail:
3146 free_token(token);
3147}
3148
3149int parse_header_page(char *buf, unsigned long size)
3150{
3151 init_input_buf(buf, size);
3152
3153 parse_header_field("timestamp", &header_page_ts_offset,
3154 &header_page_ts_size);
3155 parse_header_field("commit", &header_page_size_offset,
3156 &header_page_size_size);
3157 parse_header_field("data", &header_page_data_offset,
3158 &header_page_data_size);
3159
3160 return 0;
3161}
3162
3163int parse_ftrace_file(char *buf, unsigned long size) 3102int parse_ftrace_file(char *buf, unsigned long size)
3164{ 3103{
3165 struct format_field *field; 3104 struct format_field *field;
@@ -3277,3 +3216,18 @@ void parse_set_info(int nr_cpus, int long_sz)
3277 cpus = nr_cpus; 3216 cpus = nr_cpus;
3278 long_size = long_sz; 3217 long_size = long_sz;
3279} 3218}
3219
3220int common_pc(struct scripting_context *context)
3221{
3222 return parse_common_pc(context->event_data);
3223}
3224
3225int common_flags(struct scripting_context *context)
3226{
3227 return parse_common_flags(context->event_data);
3228}
3229
3230int common_lock_depth(struct scripting_context *context)
3231{
3232 return parse_common_lock_depth(context->event_data);
3233}
diff --git a/tools/perf/util/trace-event-perl.h b/tools/perf/util/trace-event-perl.h
deleted file mode 100644
index e88fb26137bb..000000000000
--- a/tools/perf/util/trace-event-perl.h
+++ /dev/null
@@ -1,55 +0,0 @@
1#ifndef __PERF_TRACE_EVENT_PERL_H
2#define __PERF_TRACE_EVENT_PERL_H
3#ifdef NO_LIBPERL
4typedef int INTERP;
5#define dSP
6#define ENTER
7#define SAVETMPS
8#define PUTBACK
9#define SPAGAIN
10#define FREETMPS
11#define LEAVE
12#define SP
13#define ERRSV
14#define G_SCALAR (0)
15#define G_DISCARD (0)
16#define G_NOARGS (0)
17#define PUSHMARK(a)
18#define SvTRUE(a) (0)
19#define XPUSHs(s)
20#define sv_2mortal(a)
21#define newSVpv(a,b)
22#define newSVuv(a)
23#define newSViv(a)
24#define get_cv(a,b) (0)
25#define call_pv(a,b) (0)
26#define perl_alloc() (0)
27#define perl_construct(a) (0)
28#define perl_parse(a,b,c,d,e) (0)
29#define perl_run(a) (0)
30#define perl_destruct(a) (0)
31#define perl_free(a) (0)
32#define pTHX void
33#define CV void
34#define dXSUB_SYS
35#define pTHX_
36static inline void newXS(const char *a, void *b, const char *c) {}
37static void boot_Perf__Trace__Context(pTHX_ CV *cv) {}
38static void boot_DynaLoader(pTHX_ CV *cv) {}
39#else
40#include <EXTERN.h>
41#include <perl.h>
42void boot_Perf__Trace__Context(pTHX_ CV *cv);
43void boot_DynaLoader(pTHX_ CV *cv);
44typedef PerlInterpreter * INTERP;
45#endif
46
47struct scripting_context {
48 void *event_data;
49};
50
51int common_pc(struct scripting_context *context);
52int common_flags(struct scripting_context *context);
53int common_lock_depth(struct scripting_context *context);
54
55#endif /* __PERF_TRACE_EVENT_PERL_H */
diff --git a/tools/perf/util/trace-event-read.c b/tools/perf/util/trace-event-read.c
index 1744422cafcb..f55cc3a765a1 100644
--- a/tools/perf/util/trace-event-read.c
+++ b/tools/perf/util/trace-event-read.c
@@ -18,7 +18,7 @@
18 * 18 *
19 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ 19 * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
20 */ 20 */
21#define _LARGEFILE64_SOURCE 21#define _FILE_OFFSET_BITS 64
22 22
23#include <dirent.h> 23#include <dirent.h>
24#include <stdio.h> 24#include <stdio.h>
@@ -50,17 +50,61 @@ static int long_size;
50 50
51static unsigned long page_size; 51static unsigned long page_size;
52 52
53static ssize_t calc_data_size;
54static bool repipe;
55
56static int do_read(int fd, void *buf, int size)
57{
58 int rsize = size;
59
60 while (size) {
61 int ret = read(fd, buf, size);
62
63 if (ret <= 0)
64 return -1;
65
66 if (repipe) {
67 int retw = write(STDOUT_FILENO, buf, ret);
68
69 if (retw <= 0 || retw != ret)
70 die("repiping input file");
71 }
72
73 size -= ret;
74 buf += ret;
75 }
76
77 return rsize;
78}
79
53static int read_or_die(void *data, int size) 80static int read_or_die(void *data, int size)
54{ 81{
55 int r; 82 int r;
56 83
57 r = read(input_fd, data, size); 84 r = do_read(input_fd, data, size);
58 if (r != size) 85 if (r <= 0)
59 die("reading input file (size expected=%d received=%d)", 86 die("reading input file (size expected=%d received=%d)",
60 size, r); 87 size, r);
88
89 if (calc_data_size)
90 calc_data_size += r;
91
61 return r; 92 return r;
62} 93}
63 94
95/* If it fails, the next read will report it */
96static void skip(int size)
97{
98 char buf[BUFSIZ];
99 int r;
100
101 while (size) {
102 r = size > BUFSIZ ? BUFSIZ : size;
103 read_or_die(buf, r);
104 size -= r;
105 };
106}
107
64static unsigned int read4(void) 108static unsigned int read4(void)
65{ 109{
66 unsigned int data; 110 unsigned int data;
@@ -82,57 +126,36 @@ static char *read_string(void)
82 char buf[BUFSIZ]; 126 char buf[BUFSIZ];
83 char *str = NULL; 127 char *str = NULL;
84 int size = 0; 128 int size = 0;
85 int i; 129 off_t r;
86 int r; 130 char c;
87 131
88 for (;;) { 132 for (;;) {
89 r = read(input_fd, buf, BUFSIZ); 133 r = read(input_fd, &c, 1);
90 if (r < 0) 134 if (r < 0)
91 die("reading input file"); 135 die("reading input file");
92 136
93 if (!r) 137 if (!r)
94 die("no data"); 138 die("no data");
95 139
96 for (i = 0; i < r; i++) { 140 if (repipe) {
97 if (!buf[i]) 141 int retw = write(STDOUT_FILENO, &c, 1);
98 break;
99 }
100 if (i < r)
101 break;
102 142
103 if (str) { 143 if (retw <= 0 || retw != r)
104 size += BUFSIZ; 144 die("repiping input file string");
105 str = realloc(str, size);
106 if (!str)
107 die("malloc of size %d", size);
108 memcpy(str + (size - BUFSIZ), buf, BUFSIZ);
109 } else {
110 size = BUFSIZ;
111 str = malloc_or_die(size);
112 memcpy(str, buf, size);
113 } 145 }
114 }
115 146
116 /* trailing \0: */ 147 buf[size++] = c;
117 i++; 148
118 149 if (!c)
119 /* move the file descriptor to the end of the string */ 150 break;
120 r = lseek(input_fd, -(r - i), SEEK_CUR);
121 if (r < 0)
122 die("lseek");
123
124 if (str) {
125 size += i;
126 str = realloc(str, size);
127 if (!str)
128 die("malloc of size %d", size);
129 memcpy(str + (size - i), buf, i);
130 } else {
131 size = i;
132 str = malloc_or_die(i);
133 memcpy(str, buf, i);
134 } 151 }
135 152
153 if (calc_data_size)
154 calc_data_size += size;
155
156 str = malloc_or_die(size);
157 memcpy(str, buf, size);
158
136 return str; 159 return str;
137} 160}
138 161
@@ -174,7 +197,6 @@ static void read_ftrace_printk(void)
174static void read_header_files(void) 197static void read_header_files(void)
175{ 198{
176 unsigned long long size; 199 unsigned long long size;
177 char *header_page;
178 char *header_event; 200 char *header_event;
179 char buf[BUFSIZ]; 201 char buf[BUFSIZ];
180 202
@@ -184,10 +206,7 @@ static void read_header_files(void)
184 die("did not read header page"); 206 die("did not read header page");
185 207
186 size = read8(); 208 size = read8();
187 header_page = malloc_or_die(size); 209 skip(size);
188 read_or_die(header_page, size);
189 parse_header_page(header_page, size);
190 free(header_page);
191 210
192 /* 211 /*
193 * The size field in the page is of type long, 212 * The size field in the page is of type long,
@@ -282,8 +301,8 @@ static void update_cpu_data_index(int cpu)
282 301
283static void get_next_page(int cpu) 302static void get_next_page(int cpu)
284{ 303{
285 off64_t save_seek; 304 off_t save_seek;
286 off64_t ret; 305 off_t ret;
287 306
288 if (!cpu_data[cpu].page) 307 if (!cpu_data[cpu].page)
289 return; 308 return;
@@ -298,17 +317,17 @@ static void get_next_page(int cpu)
298 update_cpu_data_index(cpu); 317 update_cpu_data_index(cpu);
299 318
300 /* other parts of the code may expect the pointer to not move */ 319 /* other parts of the code may expect the pointer to not move */
301 save_seek = lseek64(input_fd, 0, SEEK_CUR); 320 save_seek = lseek(input_fd, 0, SEEK_CUR);
302 321
303 ret = lseek64(input_fd, cpu_data[cpu].offset, SEEK_SET); 322 ret = lseek(input_fd, cpu_data[cpu].offset, SEEK_SET);
304 if (ret < 0) 323 if (ret == (off_t)-1)
305 die("failed to lseek"); 324 die("failed to lseek");
306 ret = read(input_fd, cpu_data[cpu].page, page_size); 325 ret = read(input_fd, cpu_data[cpu].page, page_size);
307 if (ret < 0) 326 if (ret < 0)
308 die("failed to read page"); 327 die("failed to read page");
309 328
310 /* reset the file pointer back */ 329 /* reset the file pointer back */
311 lseek64(input_fd, save_seek, SEEK_SET); 330 lseek(input_fd, save_seek, SEEK_SET);
312 331
313 return; 332 return;
314 } 333 }
@@ -459,7 +478,7 @@ struct record *trace_read_data(int cpu)
459 return data; 478 return data;
460} 479}
461 480
462void trace_report(int fd) 481ssize_t trace_report(int fd, bool __repipe)
463{ 482{
464 char buf[BUFSIZ]; 483 char buf[BUFSIZ];
465 char test[] = { 23, 8, 68 }; 484 char test[] = { 23, 8, 68 };
@@ -467,6 +486,10 @@ void trace_report(int fd)
467 int show_version = 0; 486 int show_version = 0;
468 int show_funcs = 0; 487 int show_funcs = 0;
469 int show_printk = 0; 488 int show_printk = 0;
489 ssize_t size;
490
491 calc_data_size = 1;
492 repipe = __repipe;
470 493
471 input_fd = fd; 494 input_fd = fd;
472 495
@@ -499,14 +522,18 @@ void trace_report(int fd)
499 read_proc_kallsyms(); 522 read_proc_kallsyms();
500 read_ftrace_printk(); 523 read_ftrace_printk();
501 524
525 size = calc_data_size - 1;
526 calc_data_size = 0;
527 repipe = false;
528
502 if (show_funcs) { 529 if (show_funcs) {
503 print_funcs(); 530 print_funcs();
504 return; 531 return size;
505 } 532 }
506 if (show_printk) { 533 if (show_printk) {
507 print_printk(); 534 print_printk();
508 return; 535 return size;
509 } 536 }
510 537
511 return; 538 return size;
512} 539}
diff --git a/tools/perf/util/trace-event-scripting.c b/tools/perf/util/trace-event-scripting.c
new file mode 100644
index 000000000000..7ea983acfaea
--- /dev/null
+++ b/tools/perf/util/trace-event-scripting.c
@@ -0,0 +1,167 @@
1/*
2 * trace-event-scripting. Scripting engine common and initialization code.
3 *
4 * Copyright (C) 2009-2010 Tom Zanussi <tzanussi@gmail.com>
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19 *
20 */
21
22#include <stdio.h>
23#include <stdlib.h>
24#include <string.h>
25#include <ctype.h>
26#include <errno.h>
27
28#include "../perf.h"
29#include "util.h"
30#include "trace-event.h"
31
32struct scripting_context *scripting_context;
33
34static int stop_script_unsupported(void)
35{
36 return 0;
37}
38
39static void process_event_unsupported(int cpu __unused,
40 void *data __unused,
41 int size __unused,
42 unsigned long long nsecs __unused,
43 char *comm __unused)
44{
45}
46
47static void print_python_unsupported_msg(void)
48{
49 fprintf(stderr, "Python scripting not supported."
50 " Install libpython and rebuild perf to enable it.\n"
51 "For example:\n # apt-get install python-dev (ubuntu)"
52 "\n # yum install python-devel (Fedora)"
53 "\n etc.\n");
54}
55
56static int python_start_script_unsupported(const char *script __unused,
57 int argc __unused,
58 const char **argv __unused)
59{
60 print_python_unsupported_msg();
61
62 return -1;
63}
64
65static int python_generate_script_unsupported(const char *outfile __unused)
66{
67 print_python_unsupported_msg();
68
69 return -1;
70}
71
72struct scripting_ops python_scripting_unsupported_ops = {
73 .name = "Python",
74 .start_script = python_start_script_unsupported,
75 .stop_script = stop_script_unsupported,
76 .process_event = process_event_unsupported,
77 .generate_script = python_generate_script_unsupported,
78};
79
80static void register_python_scripting(struct scripting_ops *scripting_ops)
81{
82 int err;
83 err = script_spec_register("Python", scripting_ops);
84 if (err)
85 die("error registering Python script extension");
86
87 err = script_spec_register("py", scripting_ops);
88 if (err)
89 die("error registering py script extension");
90
91 scripting_context = malloc(sizeof(struct scripting_context));
92}
93
94#ifdef NO_LIBPYTHON
95void setup_python_scripting(void)
96{
97 register_python_scripting(&python_scripting_unsupported_ops);
98}
99#else
100struct scripting_ops python_scripting_ops;
101
102void setup_python_scripting(void)
103{
104 register_python_scripting(&python_scripting_ops);
105}
106#endif
107
108static void print_perl_unsupported_msg(void)
109{
110 fprintf(stderr, "Perl scripting not supported."
111 " Install libperl and rebuild perf to enable it.\n"
112 "For example:\n # apt-get install libperl-dev (ubuntu)"
113 "\n # yum install 'perl(ExtUtils::Embed)' (Fedora)"
114 "\n etc.\n");
115}
116
117static int perl_start_script_unsupported(const char *script __unused,
118 int argc __unused,
119 const char **argv __unused)
120{
121 print_perl_unsupported_msg();
122
123 return -1;
124}
125
126static int perl_generate_script_unsupported(const char *outfile __unused)
127{
128 print_perl_unsupported_msg();
129
130 return -1;
131}
132
133struct scripting_ops perl_scripting_unsupported_ops = {
134 .name = "Perl",
135 .start_script = perl_start_script_unsupported,
136 .stop_script = stop_script_unsupported,
137 .process_event = process_event_unsupported,
138 .generate_script = perl_generate_script_unsupported,
139};
140
141static void register_perl_scripting(struct scripting_ops *scripting_ops)
142{
143 int err;
144 err = script_spec_register("Perl", scripting_ops);
145 if (err)
146 die("error registering Perl script extension");
147
148 err = script_spec_register("pl", scripting_ops);
149 if (err)
150 die("error registering pl script extension");
151
152 scripting_context = malloc(sizeof(struct scripting_context));
153}
154
155#ifdef NO_LIBPERL
156void setup_perl_scripting(void)
157{
158 register_perl_scripting(&perl_scripting_unsupported_ops);
159}
160#else
161struct scripting_ops perl_scripting_ops;
162
163void setup_perl_scripting(void)
164{
165 register_perl_scripting(&perl_scripting_ops);
166}
167#endif
diff --git a/tools/perf/util/trace-event.h b/tools/perf/util/trace-event.h
index 6ad405620c9b..b3e86b1e4444 100644
--- a/tools/perf/util/trace-event.h
+++ b/tools/perf/util/trace-event.h
@@ -1,6 +1,7 @@
1#ifndef __PERF_TRACE_EVENTS_H 1#ifndef __PERF_TRACE_EVENTS_H
2#define __PERF_TRACE_EVENTS_H 2#define __PERF_TRACE_EVENTS_H
3 3
4#include <stdbool.h>
4#include "parse-events.h" 5#include "parse-events.h"
5 6
6#define __unused __attribute__((unused)) 7#define __unused __attribute__((unused))
@@ -162,7 +163,7 @@ struct record *trace_read_data(int cpu);
162 163
163void parse_set_info(int nr_cpus, int long_sz); 164void parse_set_info(int nr_cpus, int long_sz);
164 165
165void trace_report(int fd); 166ssize_t trace_report(int fd, bool repipe);
166 167
167void *malloc_or_die(unsigned int size); 168void *malloc_or_die(unsigned int size);
168 169
@@ -232,7 +233,12 @@ static inline unsigned long long __data2host8(unsigned long long data)
232 233
233#define data2host2(ptr) __data2host2(*(unsigned short *)ptr) 234#define data2host2(ptr) __data2host2(*(unsigned short *)ptr)
234#define data2host4(ptr) __data2host4(*(unsigned int *)ptr) 235#define data2host4(ptr) __data2host4(*(unsigned int *)ptr)
235#define data2host8(ptr) __data2host8(*(unsigned long long *)ptr) 236#define data2host8(ptr) ({ \
237 unsigned long long __val; \
238 \
239 memcpy(&__val, (ptr), sizeof(unsigned long long)); \
240 __data2host8(__val); \
241})
236 242
237extern int header_page_ts_offset; 243extern int header_page_ts_offset;
238extern int header_page_ts_size; 244extern int header_page_ts_size;
@@ -241,9 +247,8 @@ extern int header_page_size_size;
241extern int header_page_data_offset; 247extern int header_page_data_offset;
242extern int header_page_data_size; 248extern int header_page_data_size;
243 249
244extern int latency_format; 250extern bool latency_format;
245 251
246int parse_header_page(char *buf, unsigned long size);
247int trace_parse_common_type(void *data); 252int trace_parse_common_type(void *data);
248int trace_parse_common_pid(void *data); 253int trace_parse_common_pid(void *data);
249int parse_common_pc(void *data); 254int parse_common_pc(void *data);
@@ -258,6 +263,8 @@ void *raw_field_ptr(struct event *event, const char *name, void *data);
258unsigned long long eval_flag(const char *flag); 263unsigned long long eval_flag(const char *flag);
259 264
260int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events); 265int read_tracing_data(int fd, struct perf_event_attr *pattrs, int nb_events);
266ssize_t read_tracing_data_size(int fd, struct perf_event_attr *pattrs,
267 int nb_events);
261 268
262/* taken from kernel/trace/trace.h */ 269/* taken from kernel/trace/trace.h */
263enum trace_flag_type { 270enum trace_flag_type {
@@ -279,7 +286,15 @@ struct scripting_ops {
279 286
280int script_spec_register(const char *spec, struct scripting_ops *ops); 287int script_spec_register(const char *spec, struct scripting_ops *ops);
281 288
282extern struct scripting_ops perl_scripting_ops;
283void setup_perl_scripting(void); 289void setup_perl_scripting(void);
290void setup_python_scripting(void);
291
292struct scripting_context {
293 void *event_data;
294};
295
296int common_pc(struct scripting_context *context);
297int common_flags(struct scripting_context *context);
298int common_lock_depth(struct scripting_context *context);
284 299
285#endif /* __PERF_TRACE_EVENTS_H */ 300#endif /* __PERF_TRACE_EVENTS_H */
diff --git a/tools/perf/util/util.c b/tools/perf/util/util.c
new file mode 100644
index 000000000000..214265674ddd
--- /dev/null
+++ b/tools/perf/util/util.c
@@ -0,0 +1,116 @@
1#include "util.h"
2#include <sys/mman.h>
3
/*
 * mkdir_p - create a directory and any missing parent directories.
 * @path: absolute path; temporarily modified in place while walking the
 *        components, but restored before returning
 * @mode: permission bits passed to mkdir() for every directory created
 *
 * Returns 0 when the path already exists or was created, -1 when @path is
 * not absolute or a component could not be created.
 */
int mkdir_p(char *path, mode_t mode)
{
	struct stat sb;
	char *sep;

	/* Only absolute paths are accepted. */
	if (path[0] != '/')
		return -1;

	/* Nothing to do when the whole path is already there. */
	if (!stat(path, &sb))
		return 0;

	/* Step over the run of leading slashes. */
	sep = path + 1;
	while (*sep == '/')
		sep++;

	for (sep = strchr(sep, '/'); sep != NULL; sep = strchr(sep, '/')) {
		int failed;

		/* Cut the string at this separator to address the prefix. */
		*sep = '\0';
		failed = stat(path, &sb) != 0 && mkdir(path, mode) != 0;
		*sep = '/';

		if (failed)
			return -1;

		/* Collapse repeated separators before the next component. */
		do {
			sep++;
		} while (*sep == '/');
	}

	/* Finally the leaf itself. */
	if (stat(path, &sb) == 0)
		return 0;
	return mkdir(path, mode) ? -1 : 0;
}
29
/*
 * slow_copyfile - copy @from to @to through buffered stdio.
 *
 * Used when the source cannot be copied by size (copyfile() calls this
 * when st_size is reported as 0).  Data is moved in fixed-size chunks with
 * fread()/fwrite(), so embedded NUL bytes are preserved.
 *
 * Returns 0 on success and -1 when either file cannot be opened or a
 * read/write error occurs.
 */
static int slow_copyfile(const char *from, const char *to)
{
	int err = -1;	/* pessimistic default: every early exit is a failure */
	char buf[4096];
	size_t n;
	FILE *from_fp, *to_fp;

	from_fp = fopen(from, "r");
	if (from_fp == NULL)
		goto out;

	to_fp = fopen(to, "w");
	if (to_fp == NULL)
		goto out_fclose_from;

	while ((n = fread(buf, 1, sizeof(buf), from_fp)) > 0)
		if (fwrite(buf, 1, n, to_fp) != n)
			goto out_fclose_to;

	/* fread() returns 0 for both EOF and error; only EOF is success. */
	if (!ferror(from_fp))
		err = 0;
out_fclose_to:
	/* fclose() flushes; a failed flush means the copy is incomplete. */
	if (fclose(to_fp) == EOF)
		err = -1;
out_fclose_from:
	fclose(from_fp);
out:
	return err;
}
56
/*
 * copyfile - copy the contents of @from into @to.
 *
 * The source is mapped read-only and written out to a freshly created
 * destination (mode 0755).  Files whose size is reported as 0 are handed
 * to slow_copyfile() instead.  If the copy fails after the destination was
 * created, the partial destination is unlinked.
 *
 * Returns 0 on success, -1 on failure.
 */
int copyfile(const char *from, const char *to)
{
	int fromfd, tofd;
	struct stat st;
	void *addr;
	const char *pos;
	size_t left;
	int err = -1;

	if (stat(from, &st))
		goto out;

	if (st.st_size == 0) /* /proc? do it slowly... */
		return slow_copyfile(from, to);

	fromfd = open(from, O_RDONLY);
	if (fromfd < 0)
		goto out;

	tofd = creat(to, 0755);
	if (tofd < 0)
		goto out_close_from;

	addr = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fromfd, 0);
	if (addr == MAP_FAILED)
		goto out_close_to;

	/*
	 * write() may legitimately transfer fewer bytes than requested;
	 * keep going until everything is out or a real error shows up.
	 */
	pos = addr;
	left = st.st_size;
	while (left > 0) {
		ssize_t written = write(tofd, pos, left);

		if (written <= 0)
			break;
		pos += written;
		left -= written;
	}
	if (left == 0)
		err = 0;

	munmap(addr, st.st_size);
out_close_to:
	close(tofd);
	if (err)
		unlink(to);
out_close_from:
	close(fromfd);
out:
	return err;
}
95
/*
 * convert_unit - scale @value down by powers of 1000 for display.
 * @value: number to scale
 * @unit:  receives ' ', 'K', 'M' or 'G' according to how many times the
 *         value was divided
 *
 * A division only happens while the value is strictly greater than 1000,
 * and at most three times.  Returns the scaled value.
 */
unsigned long convert_unit(unsigned long value, char *unit)
{
	static const char suffixes[] = { 'K', 'M', 'G' };
	size_t step;

	*unit = ' ';

	for (step = 0; step < sizeof(suffixes); step++) {
		/* Once a step is not taken, no later one can be either. */
		if (value <= 1000)
			break;
		value /= 1000;
		*unit = suffixes[step];
	}

	return value;
}
diff --git a/tools/perf/util/util.h b/tools/perf/util/util.h
index c673d8825883..4e8b6b0c551c 100644
--- a/tools/perf/util/util.h
+++ b/tools/perf/util/util.h
@@ -42,12 +42,14 @@
42#define _ALL_SOURCE 1 42#define _ALL_SOURCE 1
43#define _GNU_SOURCE 1 43#define _GNU_SOURCE 1
44#define _BSD_SOURCE 1 44#define _BSD_SOURCE 1
45#define HAS_BOOL
45 46
46#include <unistd.h> 47#include <unistd.h>
47#include <stdio.h> 48#include <stdio.h>
48#include <sys/stat.h> 49#include <sys/stat.h>
49#include <sys/statfs.h> 50#include <sys/statfs.h>
50#include <fcntl.h> 51#include <fcntl.h>
52#include <stdbool.h>
51#include <stddef.h> 53#include <stddef.h>
52#include <stdlib.h> 54#include <stdlib.h>
53#include <stdarg.h> 55#include <stdarg.h>
@@ -78,7 +80,8 @@
78#include <pwd.h> 80#include <pwd.h>
79#include <inttypes.h> 81#include <inttypes.h>
80#include "../../../include/linux/magic.h" 82#include "../../../include/linux/magic.h"
81 83#include "types.h"
84#include <sys/ttydefaults.h>
82 85
83#ifndef NO_ICONV 86#ifndef NO_ICONV
84#include <iconv.h> 87#include <iconv.h>
@@ -149,7 +152,6 @@ extern void warning(const char *err, ...) __attribute__((format (printf, 1, 2)))
149extern void set_die_routine(void (*routine)(const char *err, va_list params) NORETURN); 152extern void set_die_routine(void (*routine)(const char *err, va_list params) NORETURN);
150 153
151extern int prefixcmp(const char *str, const char *prefix); 154extern int prefixcmp(const char *str, const char *prefix);
152extern time_t tm_to_time_t(const struct tm *tm);
153 155
154static inline const char *skip_prefix(const char *str, const char *prefix) 156static inline const char *skip_prefix(const char *str, const char *prefix)
155{ 157{
@@ -157,119 +159,6 @@ static inline const char *skip_prefix(const char *str, const char *prefix)
157 return strncmp(str, prefix, len) ? NULL : str + len; 159 return strncmp(str, prefix, len) ? NULL : str + len;
158} 160}
159 161
160#if defined(NO_MMAP) || defined(USE_WIN32_MMAP)
161
162#ifndef PROT_READ
163#define PROT_READ 1
164#define PROT_WRITE 2
165#define MAP_PRIVATE 1
166#define MAP_FAILED ((void*)-1)
167#endif
168
169#define mmap git_mmap
170#define munmap git_munmap
171extern void *git_mmap(void *start, size_t length, int prot, int flags, int fd, off_t offset);
172extern int git_munmap(void *start, size_t length);
173
174#else /* NO_MMAP || USE_WIN32_MMAP */
175
176#include <sys/mman.h>
177
178#endif /* NO_MMAP || USE_WIN32_MMAP */
179
180#ifdef NO_MMAP
181
182/* This value must be multiple of (pagesize * 2) */
183#define DEFAULT_PACKED_GIT_WINDOW_SIZE (1 * 1024 * 1024)
184
185#else /* NO_MMAP */
186
187/* This value must be multiple of (pagesize * 2) */
188#define DEFAULT_PACKED_GIT_WINDOW_SIZE \
189 (sizeof(void*) >= 8 \
190 ? 1 * 1024 * 1024 * 1024 \
191 : 32 * 1024 * 1024)
192
193#endif /* NO_MMAP */
194
195#ifdef NO_ST_BLOCKS_IN_STRUCT_STAT
196#define on_disk_bytes(st) ((st).st_size)
197#else
198#define on_disk_bytes(st) ((st).st_blocks * 512)
199#endif
200
201#define DEFAULT_PACKED_GIT_LIMIT \
202 ((1024L * 1024L) * (sizeof(void*) >= 8 ? 8192 : 256))
203
204#ifdef NO_PREAD
205#define pread git_pread
206extern ssize_t git_pread(int fd, void *buf, size_t count, off_t offset);
207#endif
208/*
209 * Forward decl that will remind us if its twin in cache.h changes.
210 * This function is used in compat/pread.c. But we can't include
211 * cache.h there.
212 */
213extern ssize_t read_in_full(int fd, void *buf, size_t count);
214
215#ifdef NO_SETENV
216#define setenv gitsetenv
217extern int gitsetenv(const char *, const char *, int);
218#endif
219
220#ifdef NO_MKDTEMP
221#define mkdtemp gitmkdtemp
222extern char *gitmkdtemp(char *);
223#endif
224
225#ifdef NO_UNSETENV
226#define unsetenv gitunsetenv
227extern void gitunsetenv(const char *);
228#endif
229
230#ifdef NO_STRCASESTR
231#define strcasestr gitstrcasestr
232extern char *gitstrcasestr(const char *haystack, const char *needle);
233#endif
234
235#ifdef NO_STRLCPY
236#define strlcpy gitstrlcpy
237extern size_t gitstrlcpy(char *, const char *, size_t);
238#endif
239
240#ifdef NO_STRTOUMAX
241#define strtoumax gitstrtoumax
242extern uintmax_t gitstrtoumax(const char *, char **, int);
243#endif
244
245#ifdef NO_HSTRERROR
246#define hstrerror githstrerror
247extern const char *githstrerror(int herror);
248#endif
249
250#ifdef NO_MEMMEM
251#define memmem gitmemmem
252void *gitmemmem(const void *haystack, size_t haystacklen,
253 const void *needle, size_t needlelen);
254#endif
255
256#ifdef FREAD_READS_DIRECTORIES
257#ifdef fopen
258#undef fopen
259#endif
260#define fopen(a,b) git_fopen(a,b)
261extern FILE *git_fopen(const char*, const char*);
262#endif
263
264#ifdef SNPRINTF_RETURNS_BOGUS
265#define snprintf git_snprintf
266extern int git_snprintf(char *str, size_t maxsize,
267 const char *format, ...);
268#define vsnprintf git_vsnprintf
269extern int git_vsnprintf(char *str, size_t maxsize,
270 const char *format, va_list ap);
271#endif
272
273#ifdef __GLIBC_PREREQ 162#ifdef __GLIBC_PREREQ
274#if __GLIBC_PREREQ(2, 1) 163#if __GLIBC_PREREQ(2, 1)
275#define HAVE_STRCHRNUL 164#define HAVE_STRCHRNUL
@@ -290,25 +179,19 @@ static inline char *gitstrchrnul(const char *s, int c)
290 * Wrappers: 179 * Wrappers:
291 */ 180 */
292extern char *xstrdup(const char *str); 181extern char *xstrdup(const char *str);
293extern void *xmalloc(size_t size) __attribute__((weak));
294extern void *xmemdupz(const void *data, size_t len);
295extern char *xstrndup(const char *str, size_t len);
296extern void *xrealloc(void *ptr, size_t size) __attribute__((weak)); 182extern void *xrealloc(void *ptr, size_t size) __attribute__((weak));
297 183
184
298static inline void *zalloc(size_t size) 185static inline void *zalloc(size_t size)
299{ 186{
300 return calloc(1, size); 187 return calloc(1, size);
301} 188}
302 189
303static inline size_t xsize_t(off_t len)
304{
305 return (size_t)len;
306}
307
308static inline int has_extension(const char *filename, const char *ext) 190static inline int has_extension(const char *filename, const char *ext)
309{ 191{
310 size_t len = strlen(filename); 192 size_t len = strlen(filename);
311 size_t extlen = strlen(ext); 193 size_t extlen = strlen(ext);
194
312 return len > extlen && !memcmp(filename + len - extlen, ext, extlen); 195 return len > extlen && !memcmp(filename + len - extlen, ext, extlen);
313} 196}
314 197
@@ -322,6 +205,7 @@ static inline int has_extension(const char *filename, const char *ext)
322#undef isalnum 205#undef isalnum
323#undef tolower 206#undef tolower
324#undef toupper 207#undef toupper
208
325extern unsigned char sane_ctype[256]; 209extern unsigned char sane_ctype[256];
326#define GIT_SPACE 0x01 210#define GIT_SPACE 0x01
327#define GIT_DIGIT 0x02 211#define GIT_DIGIT 0x02
@@ -339,8 +223,6 @@ extern unsigned char sane_ctype[256];
339#define isalpha(x) sane_istest(x,GIT_ALPHA) 223#define isalpha(x) sane_istest(x,GIT_ALPHA)
340#define isalnum(x) sane_istest(x,GIT_ALPHA | GIT_DIGIT) 224#define isalnum(x) sane_istest(x,GIT_ALPHA | GIT_DIGIT)
341#define isprint(x) sane_istest(x,GIT_PRINT) 225#define isprint(x) sane_istest(x,GIT_PRINT)
342#define is_glob_special(x) sane_istest(x,GIT_GLOB_SPECIAL)
343#define is_regex_special(x) sane_istest(x,GIT_GLOB_SPECIAL | GIT_REGEX_SPECIAL)
344#define tolower(x) sane_case((unsigned char)(x), 0x20) 226#define tolower(x) sane_case((unsigned char)(x), 0x20)
345#define toupper(x) sane_case((unsigned char)(x), 0) 227#define toupper(x) sane_case((unsigned char)(x), 0)
346 228
@@ -351,38 +233,6 @@ static inline int sane_case(int x, int high)
351 return x; 233 return x;
352} 234}
353 235
354static inline int strtoul_ui(char const *s, int base, unsigned int *result)
355{
356 unsigned long ul;
357 char *p;
358
359 errno = 0;
360 ul = strtoul(s, &p, base);
361 if (errno || *p || p == s || (unsigned int) ul != ul)
362 return -1;
363 *result = ul;
364 return 0;
365}
366
367static inline int strtol_i(char const *s, int base, int *result)
368{
369 long ul;
370 char *p;
371
372 errno = 0;
373 ul = strtol(s, &p, base);
374 if (errno || *p || p == s || (int) ul != ul)
375 return -1;
376 *result = ul;
377 return 0;
378}
379
380#ifdef INTERNAL_QSORT
381void git_qsort(void *base, size_t nmemb, size_t size,
382 int(*compar)(const void *, const void *));
383#define qsort git_qsort
384#endif
385
386#ifndef DIR_HAS_BSD_GROUP_SEMANTICS 236#ifndef DIR_HAS_BSD_GROUP_SEMANTICS
387# define FORCE_DIR_SET_GID S_ISGID 237# define FORCE_DIR_SET_GID S_ISGID
388#else 238#else
@@ -403,4 +253,30 @@ void git_qsort(void *base, size_t nmemb, size_t size,
403#endif 253#endif
404#endif 254#endif
405 255
256int mkdir_p(char *path, mode_t mode);
257int copyfile(const char *from, const char *to);
258
259s64 perf_atoll(const char *str);
260char **argv_split(const char *str, int *argcp);
261void argv_free(char **argv);
262bool strglobmatch(const char *str, const char *pat);
263bool strlazymatch(const char *str, const char *pat);
264unsigned long convert_unit(unsigned long value, char *unit);
265
266#ifndef ESC
267#define ESC 27
268#endif
269
270static inline bool is_exit_key(int key)
271{
272 char up;
273 if (key == CTRL('c') || key == ESC)
274 return true;
275 up = toupper(key);
276 return up == 'Q';
277}
278
279#define _STR(x) #x
280#define STR(x) _STR(x)
281
406#endif 282#endif
diff --git a/tools/perf/util/values.c b/tools/perf/util/values.c
index 1c15e39f99e3..cfa55d686e3b 100644
--- a/tools/perf/util/values.c
+++ b/tools/perf/util/values.c
@@ -169,6 +169,7 @@ static void perf_read_values__display_pretty(FILE *fp,
169 counterwidth[j], values->value[i][j]); 169 counterwidth[j], values->value[i][j]);
170 fprintf(fp, "\n"); 170 fprintf(fp, "\n");
171 } 171 }
172 free(counterwidth);
172} 173}
173 174
174static void perf_read_values__display_raw(FILE *fp, 175static void perf_read_values__display_raw(FILE *fp,
diff --git a/tools/perf/util/wrapper.c b/tools/perf/util/wrapper.c
index bf44ca85d23b..73e900edb5a2 100644
--- a/tools/perf/util/wrapper.c
+++ b/tools/perf/util/wrapper.c
@@ -23,46 +23,6 @@ char *xstrdup(const char *str)
23 return ret; 23 return ret;
24} 24}
25 25
26void *xmalloc(size_t size)
27{
28 void *ret = malloc(size);
29 if (!ret && !size)
30 ret = malloc(1);
31 if (!ret) {
32 release_pack_memory(size, -1);
33 ret = malloc(size);
34 if (!ret && !size)
35 ret = malloc(1);
36 if (!ret)
37 die("Out of memory, malloc failed");
38 }
39#ifdef XMALLOC_POISON
40 memset(ret, 0xA5, size);
41#endif
42 return ret;
43}
44
45/*
46 * xmemdupz() allocates (len + 1) bytes of memory, duplicates "len" bytes of
47 * "data" to the allocated memory, zero terminates the allocated memory,
48 * and returns a pointer to the allocated memory. If the allocation fails,
49 * the program dies.
50 */
51void *xmemdupz(const void *data, size_t len)
52{
53 char *p = xmalloc(len + 1);
54 memcpy(p, data, len);
55 p[len] = '\0';
56 return p;
57}
58
59char *xstrndup(const char *str, size_t len)
60{
61 char *p = memchr(str, '\0', len);
62
63 return xmemdupz(str, p ? (size_t)(p - str) : len);
64}
65
66void *xrealloc(void *ptr, size_t size) 26void *xrealloc(void *ptr, size_t size)
67{ 27{
68 void *ret = realloc(ptr, size); 28 void *ret = realloc(ptr, size);
@@ -78,73 +38,3 @@ void *xrealloc(void *ptr, size_t size)
78 } 38 }
79 return ret; 39 return ret;
80} 40}
81
82/*
83 * xread() is the same a read(), but it automatically restarts read()
84 * operations with a recoverable error (EAGAIN and EINTR). xread()
85 * DOES NOT GUARANTEE that "len" bytes is read even if the data is available.
86 */
87static ssize_t xread(int fd, void *buf, size_t len)
88{
89 ssize_t nr;
90 while (1) {
91 nr = read(fd, buf, len);
92 if ((nr < 0) && (errno == EAGAIN || errno == EINTR))
93 continue;
94 return nr;
95 }
96}
97
98/*
99 * xwrite() is the same a write(), but it automatically restarts write()
100 * operations with a recoverable error (EAGAIN and EINTR). xwrite() DOES NOT
101 * GUARANTEE that "len" bytes is written even if the operation is successful.
102 */
103static ssize_t xwrite(int fd, const void *buf, size_t len)
104{
105 ssize_t nr;
106 while (1) {
107 nr = write(fd, buf, len);
108 if ((nr < 0) && (errno == EAGAIN || errno == EINTR))
109 continue;
110 return nr;
111 }
112}
113
114ssize_t read_in_full(int fd, void *buf, size_t count)
115{
116 char *p = buf;
117 ssize_t total = 0;
118
119 while (count > 0) {
120 ssize_t loaded = xread(fd, p, count);
121 if (loaded <= 0)
122 return total ? total : loaded;
123 count -= loaded;
124 p += loaded;
125 total += loaded;
126 }
127
128 return total;
129}
130
131ssize_t write_in_full(int fd, const void *buf, size_t count)
132{
133 const char *p = buf;
134 ssize_t total = 0;
135
136 while (count > 0) {
137 ssize_t written = xwrite(fd, p, count);
138 if (written < 0)
139 return -1;
140 if (!written) {
141 errno = ENOSPC;
142 return -1;
143 }
144 count -= written;
145 p += written;
146 total += written;
147 }
148
149 return total;
150}
diff --git a/tools/usb/ffs-test.c b/tools/usb/ffs-test.c
new file mode 100644
index 000000000000..bbe2e3a2ea62
--- /dev/null
+++ b/tools/usb/ffs-test.c
@@ -0,0 +1,554 @@
1/*
2 * ffs-test.c -- user mode filesystem api for usb composite function
3 *
4 * Copyright (C) 2010 Samsung Electronics
5 * Author: Michal Nazarewicz <m.nazarewicz@samsung.com>
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
11 *
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 */
21
22/* $(CROSS_COMPILE)cc -Wall -Wextra -g -o ffs-test ffs-test.c -lpthread */
23
24
25#define _BSD_SOURCE /* for endian.h */
26
27#include <endian.h>
28#include <errno.h>
29#include <fcntl.h>
30#include <pthread.h>
31#include <stdarg.h>
32#include <stdio.h>
33#include <stdlib.h>
34#include <string.h>
35#include <sys/ioctl.h>
36#include <sys/stat.h>
37#include <sys/types.h>
38#include <unistd.h>
39
40#include <linux/usb/functionfs.h>
41
42
43/******************** Little Endian Handling ********************************/
44
45#define cpu_to_le16(x) htole16(x)
46#define cpu_to_le32(x) htole32(x)
47#define le32_to_cpu(x) le32toh(x)
48#define le16_to_cpu(x) le16toh(x)
49
/* Read a 16-bit little-endian value from a possibly unaligned address. */
static inline __u16 get_unaligned_le16(const void *_ptr)
{
	const __u8 *bytes = _ptr;
	__u16 low = bytes[0];
	__u16 high = bytes[1];

	return low | (high << 8);
}
55
/*
 * Read a 32-bit little-endian value from a possibly unaligned address.
 *
 * Each byte is widened to __u32 before shifting: a plain __u8 would be
 * promoted to int, and shifting a byte >= 0x80 left by 24 would overflow
 * a signed int.
 */
static inline __u32 get_unaligned_le32(const void *_ptr)
{
	const __u8 *ptr = _ptr;

	return (__u32)ptr[0] |
	       ((__u32)ptr[1] << 8) |
	       ((__u32)ptr[2] << 16) |
	       ((__u32)ptr[3] << 24);
}
61
/* Store a 16-bit value in little-endian order at a possibly unaligned address. */
static inline void put_unaligned_le16(__u16 val, void *_ptr)
{
	__u8 *out = _ptr;

	out[0] = val;		/* low byte first */
	out[1] = val >> 8;
}
68
/* Store a 32-bit value in little-endian order at a possibly unaligned address. */
static inline void put_unaligned_le32(__u32 val, void *_ptr)
{
	__u8 *out = _ptr;
	unsigned idx;

	/* Emit the least significant byte first, one byte per iteration. */
	for (idx = 0; idx < 4; ++idx)
		out[idx] = val >> (8 * idx);
}
77
78
79/******************** Messages and Errors ***********************************/
80
81static const char argv0[] = "ffs-test";
82
83static unsigned verbosity = 7;
84
85static void _msg(unsigned level, const char *fmt, ...)
86{
87 if (level < 2)
88 level = 2;
89 else if (level > 7)
90 level = 7;
91
92 if (level <= verbosity) {
93 static const char levels[8][6] = {
94 [2] = "crit:",
95 [3] = "err: ",
96 [4] = "warn:",
97 [5] = "note:",
98 [6] = "info:",
99 [7] = "dbg: "
100 };
101
102 int _errno = errno;
103 va_list ap;
104
105 fprintf(stderr, "%s: %s ", argv0, levels[level]);
106 va_start(ap, fmt);
107 vfprintf(stderr, fmt, ap);
108 va_end(ap);
109
110 if (fmt[strlen(fmt) - 1] != '\n') {
111 char buffer[128];
112 strerror_r(_errno, buffer, sizeof buffer);
113 fprintf(stderr, ": (-%d) %s\n", _errno, buffer);
114 }
115
116 fflush(stderr);
117 }
118}
119
120#define die(...) (_msg(2, __VA_ARGS__), exit(1))
121#define err(...) _msg(3, __VA_ARGS__)
122#define warn(...) _msg(4, __VA_ARGS__)
123#define note(...) _msg(5, __VA_ARGS__)
124#define info(...) _msg(6, __VA_ARGS__)
125#define debug(...) _msg(7, __VA_ARGS__)
126
127#define die_on(cond, ...) do { \
128 if (cond) \
129 die(__VA_ARGS__); \
130 } while (0)
131
132
133/******************** Descriptors and Strings *******************************/
134
135static const struct {
136 struct usb_functionfs_descs_head header;
137 struct {
138 struct usb_interface_descriptor intf;
139 struct usb_endpoint_descriptor_no_audio sink;
140 struct usb_endpoint_descriptor_no_audio source;
141 } __attribute__((packed)) fs_descs, hs_descs;
142} __attribute__((packed)) descriptors = {
143 .header = {
144 .magic = cpu_to_le32(FUNCTIONFS_DESCRIPTORS_MAGIC),
145 .length = cpu_to_le32(sizeof descriptors),
146 .fs_count = 3,
147 .hs_count = 3,
148 },
149 .fs_descs = {
150 .intf = {
151 .bLength = sizeof descriptors.fs_descs.intf,
152 .bDescriptorType = USB_DT_INTERFACE,
153 .bNumEndpoints = 2,
154 .bInterfaceClass = USB_CLASS_VENDOR_SPEC,
155 .iInterface = 1,
156 },
157 .sink = {
158 .bLength = sizeof descriptors.fs_descs.sink,
159 .bDescriptorType = USB_DT_ENDPOINT,
160 .bEndpointAddress = 1 | USB_DIR_IN,
161 .bmAttributes = USB_ENDPOINT_XFER_BULK,
162 /* .wMaxPacketSize = autoconfiguration (kernel) */
163 },
164 .source = {
165 .bLength = sizeof descriptors.fs_descs.source,
166 .bDescriptorType = USB_DT_ENDPOINT,
167 .bEndpointAddress = 2 | USB_DIR_OUT,
168 .bmAttributes = USB_ENDPOINT_XFER_BULK,
169 /* .wMaxPacketSize = autoconfiguration (kernel) */
170 },
171 },
172 .hs_descs = {
173 .intf = {
174 .bLength = sizeof descriptors.fs_descs.intf,
175 .bDescriptorType = USB_DT_INTERFACE,
176 .bNumEndpoints = 2,
177 .bInterfaceClass = USB_CLASS_VENDOR_SPEC,
178 .iInterface = 1,
179 },
180 .sink = {
181 .bLength = sizeof descriptors.hs_descs.sink,
182 .bDescriptorType = USB_DT_ENDPOINT,
183 .bEndpointAddress = 1 | USB_DIR_IN,
184 .bmAttributes = USB_ENDPOINT_XFER_BULK,
185 .wMaxPacketSize = cpu_to_le16(512),
186 },
187 .source = {
188 .bLength = sizeof descriptors.hs_descs.source,
189 .bDescriptorType = USB_DT_ENDPOINT,
190 .bEndpointAddress = 2 | USB_DIR_OUT,
191 .bmAttributes = USB_ENDPOINT_XFER_BULK,
192 .wMaxPacketSize = cpu_to_le16(512),
193 .bInterval = 1, /* NAK every 1 uframe */
194 },
195 },
196};
197
198
199#define STR_INTERFACE_ "Source/Sink"
200
201static const struct {
202 struct usb_functionfs_strings_head header;
203 struct {
204 __le16 code;
205 const char str1[sizeof STR_INTERFACE_];
206 } __attribute__((packed)) lang0;
207} __attribute__((packed)) strings = {
208 .header = {
209 .magic = cpu_to_le32(FUNCTIONFS_STRINGS_MAGIC),
210 .length = cpu_to_le32(sizeof strings),
211 .str_count = cpu_to_le32(1),
212 .lang_count = cpu_to_le32(1),
213 },
214 .lang0 = {
215 cpu_to_le16(0x0409), /* en-us */
216 STR_INTERFACE_,
217 },
218};
219
220#define STR_INTERFACE strings.lang0.str1
221
222
223/******************** Files and Threads Handling ****************************/
224
225struct thread;
226
227static ssize_t read_wrap(struct thread *t, void *buf, size_t nbytes);
228static ssize_t write_wrap(struct thread *t, const void *buf, size_t nbytes);
229static ssize_t ep0_consume(struct thread *t, const void *buf, size_t nbytes);
230static ssize_t fill_in_buf(struct thread *t, void *buf, size_t nbytes);
231static ssize_t empty_out_buf(struct thread *t, const void *buf, size_t nbytes);
232
233
234static struct thread {
235 const char *const filename;
236 size_t buf_size;
237
238 ssize_t (*in)(struct thread *, void *, size_t);
239 const char *const in_name;
240
241 ssize_t (*out)(struct thread *, const void *, size_t);
242 const char *const out_name;
243
244 int fd;
245 pthread_t id;
246 void *buf;
247 ssize_t status;
248} threads[] = {
249 {
250 "ep0", 4 * sizeof(struct usb_functionfs_event),
251 read_wrap, NULL,
252 ep0_consume, "<consume>",
253 0, 0, NULL, 0
254 },
255 {
256 "ep1", 8 * 1024,
257 fill_in_buf, "<in>",
258 write_wrap, NULL,
259 0, 0, NULL, 0
260 },
261 {
262 "ep2", 8 * 1024,
263 read_wrap, NULL,
264 empty_out_buf, "<out>",
265 0, 0, NULL, 0
266 },
267};
268
269
270static void init_thread(struct thread *t)
271{
272 t->buf = malloc(t->buf_size);
273 die_on(!t->buf, "malloc");
274
275 t->fd = open(t->filename, O_RDWR);
276 die_on(t->fd < 0, "%s", t->filename);
277}
278
279static void cleanup_thread(void *arg)
280{
281 struct thread *t = arg;
282 int ret, fd;
283
284 fd = t->fd;
285 if (t->fd < 0)
286 return;
287 t->fd = -1;
288
289 /* test the FIFO ioctls (non-ep0 code paths) */
290 if (t != threads) {
291 ret = ioctl(fd, FUNCTIONFS_FIFO_STATUS);
292 if (ret < 0) {
293 /* ENODEV reported after disconnect */
294 if (errno != ENODEV)
295 err("%s: get fifo status", t->filename);
296 } else if (ret) {
297 warn("%s: unclaimed = %d\n", t->filename, ret);
298 if (ioctl(fd, FUNCTIONFS_FIFO_FLUSH) < 0)
299 err("%s: fifo flush", t->filename);
300 }
301 }
302
303 if (close(fd) < 0)
304 err("%s: close", t->filename);
305
306 free(t->buf);
307 t->buf = NULL;
308}
309
310static void *start_thread_helper(void *arg)
311{
312 const char *name, *op, *in_name, *out_name;
313 struct thread *t = arg;
314 ssize_t ret;
315
316 info("%s: starts\n", t->filename);
317 in_name = t->in_name ? t->in_name : t->filename;
318 out_name = t->out_name ? t->out_name : t->filename;
319
320 pthread_cleanup_push(cleanup_thread, arg);
321
322 for (;;) {
323 pthread_testcancel();
324
325 ret = t->in(t, t->buf, t->buf_size);
326 if (ret > 0) {
327 ret = t->out(t, t->buf, t->buf_size);
328 name = out_name;
329 op = "write";
330 } else {
331 name = in_name;
332 op = "read";
333 }
334
335 if (ret > 0) {
336 /* nop */
337 } else if (!ret) {
338 debug("%s: %s: EOF", name, op);
339 break;
340 } else if (errno == EINTR || errno == EAGAIN) {
341 debug("%s: %s", name, op);
342 } else {
343 warn("%s: %s", name, op);
344 break;
345 }
346 }
347
348 pthread_cleanup_pop(1);
349
350 t->status = ret;
351 info("%s: ends\n", t->filename);
352 return NULL;
353}
354
355static void start_thread(struct thread *t)
356{
357 debug("%s: starting\n", t->filename);
358
359 die_on(pthread_create(&t->id, NULL, start_thread_helper, t) < 0,
360 "pthread_create(%s)", t->filename);
361}
362
363static void join_thread(struct thread *t)
364{
365 int ret = pthread_join(t->id, NULL);
366
367 if (ret < 0)
368 err("%s: joining thread", t->filename);
369 else
370 debug("%s: joined\n", t->filename);
371}
372
373
374static ssize_t read_wrap(struct thread *t, void *buf, size_t nbytes)
375{
376 return read(t->fd, buf, nbytes);
377}
378
379static ssize_t write_wrap(struct thread *t, const void *buf, size_t nbytes)
380{
381 return write(t->fd, buf, nbytes);
382}
383
384
385/******************** Empty/Fill buffer routines ****************************/
386
/* 0 -- stream of zeros, 1 -- i % 63, 2 -- pipe */
enum pattern { PAT_ZERO, PAT_SEQ, PAT_PIPE };
static enum pattern pattern;

/*
 * in() callback that produces data according to the global pattern:
 * zeros, the repeating sequence i % 63, or bytes read from stdin.
 * Returns the number of bytes placed in @buf (for the pipe pattern,
 * whatever fread() delivered).
 */
static ssize_t
fill_in_buf(struct thread *ignore, void *buf, size_t nbytes)
{
	(void)ignore;

	if (pattern == PAT_PIPE)
		return fread(buf, 1, nbytes, stdin);

	if (pattern == PAT_ZERO) {
		memset(buf, 0, nbytes);
	} else if (pattern == PAT_SEQ) {
		__u8 *out = buf;
		size_t pos;

		for (pos = 0; pos < nbytes; ++pos)
			out[pos] = pos % 63;
	}

	return nbytes;
}
415
416static ssize_t
417empty_out_buf(struct thread *ignore, const void *buf, size_t nbytes)
418{
419 const __u8 *p;
420 __u8 expected;
421 ssize_t ret;
422 size_t len;
423
424 (void)ignore;
425
426 switch (pattern) {
427 case PAT_ZERO:
428 expected = 0;
429 for (p = buf, len = 0; len < nbytes; ++p, ++len)
430 if (*p)
431 goto invalid;
432 break;
433
434 case PAT_SEQ:
435 for (p = buf, len = 0; len < nbytes; ++p, ++len)
436 if (*p != len % 63) {
437 expected = len % 63;
438 goto invalid;
439 }
440 break;
441
442 case PAT_PIPE:
443 ret = fwrite(buf, nbytes, 1, stdout);
444 if (ret > 0)
445 fflush(stdout);
446 break;
447
448invalid:
449 err("bad OUT byte %zd, expected %02x got %02x\n",
450 len, expected, *p);
451 for (p = buf, len = 0; len < nbytes; ++p, ++len) {
452 if (0 == (len % 32))
453 fprintf(stderr, "%4d:", len);
454 fprintf(stderr, " %02x", *p);
455 if (31 == (len % 32))
456 fprintf(stderr, "\n");
457 }
458 fflush(stderr);
459 errno = EILSEQ;
460 return -1;
461 }
462
463 return len;
464}
465
466
467/******************** Endpoints routines ************************************/
468
469static void handle_setup(const struct usb_ctrlrequest *setup)
470{
471 printf("bRequestType = %d\n", setup->bRequestType);
472 printf("bRequest = %d\n", setup->bRequest);
473 printf("wValue = %d\n", le16_to_cpu(setup->wValue));
474 printf("wIndex = %d\n", le16_to_cpu(setup->wIndex));
475 printf("wLength = %d\n", le16_to_cpu(setup->wLength));
476}
477
478static ssize_t
479ep0_consume(struct thread *ignore, const void *buf, size_t nbytes)
480{
481 static const char *const names[] = {
482 [FUNCTIONFS_BIND] = "BIND",
483 [FUNCTIONFS_UNBIND] = "UNBIND",
484 [FUNCTIONFS_ENABLE] = "ENABLE",
485 [FUNCTIONFS_DISABLE] = "DISABLE",
486 [FUNCTIONFS_SETUP] = "SETUP",
487 [FUNCTIONFS_SUSPEND] = "SUSPEND",
488 [FUNCTIONFS_RESUME] = "RESUME",
489 };
490
491 const struct usb_functionfs_event *event = buf;
492 size_t n;
493
494 (void)ignore;
495
496 for (n = nbytes / sizeof *event; n; --n, ++event)
497 switch (event->type) {
498 case FUNCTIONFS_BIND:
499 case FUNCTIONFS_UNBIND:
500 case FUNCTIONFS_ENABLE:
501 case FUNCTIONFS_DISABLE:
502 case FUNCTIONFS_SETUP:
503 case FUNCTIONFS_SUSPEND:
504 case FUNCTIONFS_RESUME:
505 printf("Event %s\n", names[event->type]);
506 if (event->type == FUNCTIONFS_SETUP)
507 handle_setup(&event->u.setup);
508 break;
509
510 default:
511 printf("Event %03u (unknown)\n", event->type);
512 }
513
514 return nbytes;
515}
516
517static void ep0_init(struct thread *t)
518{
519 ssize_t ret;
520
521 info("%s: writing descriptors\n", t->filename);
522 ret = write(t->fd, &descriptors, sizeof descriptors);
523 die_on(ret < 0, "%s: write: descriptors", t->filename);
524
525 info("%s: writing strings\n", t->filename);
526 ret = write(t->fd, &strings, sizeof strings);
527 die_on(ret < 0, "%s: write: strings", t->filename);
528}
529
530
531/******************** Main **************************************************/
532
533int main(void)
534{
535 unsigned i;
536
537 /* XXX TODO: Argument parsing missing */
538
539 init_thread(threads);
540 ep0_init(threads);
541
542 for (i = 1; i < sizeof threads / sizeof *threads; ++i)
543 init_thread(threads + i);
544
545 for (i = 1; i < sizeof threads / sizeof *threads; ++i)
546 start_thread(threads + i);
547
548 start_thread_helper(threads);
549
550 for (i = 1; i < sizeof threads / sizeof *threads; ++i)
551 join_thread(threads + i);
552
553 return 0;
554}
diff --git a/tools/usb/testusb.c b/tools/usb/testusb.c
new file mode 100644
index 000000000000..f08e89463842
--- /dev/null
+++ b/tools/usb/testusb.c
@@ -0,0 +1,547 @@
1/* $(CROSS_COMPILE)cc -Wall -Wextra -g -lpthread -o testusb testusb.c */
2
3/*
4 * Copyright (c) 2002 by David Brownell
5 * Copyright (c) 2010 by Samsung Electronics
6 * Author: Michal Nazarewicz <m.nazarewicz@samsung.com>
7 *
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of the GNU General Public License as published by the
10 * Free Software Foundation; either version 2 of the License, or (at your
11 * option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful, but
14 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
15 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
16 * for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software Foundation,
20 * Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
21 */
22
23/*
24 * This program issues ioctls to perform the tests implemented by the
25 * kernel driver. It can generate a variety of transfer patterns; you
26 * should make sure to test both regular streaming and mixes of
27 * transfer sizes (including short transfers).
28 *
29 * For more information on how this can be used and on USB testing
30 * refer to <URL:http://www.linux-usb.org/usbtest/>.
31 */
32
33#include <stdio.h>
34#include <string.h>
35#include <ftw.h>
36#include <stdlib.h>
37#include <pthread.h>
38#include <unistd.h>
39#include <errno.h>
40#include <limits.h>
41
42#include <sys/types.h>
43#include <sys/stat.h>
44#include <fcntl.h>
45
46#include <sys/ioctl.h>
47#include <linux/usbdevice_fs.h>
48
49/*-------------------------------------------------------------------------*/
50
/* number of test cases tried by the per-device loop (0..TEST_CASES-1) */
#define TEST_CASES	30

/* FIXME make these public somewhere; usbdevfs.h? */

/*
 * Argument block passed with USBTEST_REQUEST: the first five members are
 * filled in by this program, "duration" is printed after each test.
 */
struct usbtest_param {
	/* inputs */
	unsigned int	test_num;	/* 0..(TEST_CASES-1) */
	unsigned int	iterations;
	unsigned int	length;
	unsigned int	vary;
	unsigned int	sglen;

	/* outputs */
	struct timeval	duration;
};
#define USBTEST_REQUEST	_IOWR('U', 100, struct usbtest_param)
67
68/*-------------------------------------------------------------------------*/
69
70/* #include <linux/usb_ch9.h> */
71
/* bDescriptorType values checked by the descriptor parsers below */
#define USB_DT_DEVICE			0x01
#define USB_DT_INTERFACE		0x04

/* class codes compared against bDeviceClass / bInterfaceClass */
#define USB_CLASS_PER_INTERFACE		0	/* for DeviceClass */
#define USB_CLASS_VENDOR_SPEC		0xff
77
78
79struct usb_device_descriptor {
80 __u8 bLength;
81 __u8 bDescriptorType;
82 __u16 bcdUSB;
83 __u8 bDeviceClass;
84 __u8 bDeviceSubClass;
85 __u8 bDeviceProtocol;
86 __u8 bMaxPacketSize0;
87 __u16 idVendor;
88 __u16 idProduct;
89 __u16 bcdDevice;
90 __u8 iManufacturer;
91 __u8 iProduct;
92 __u8 iSerialNumber;
93 __u8 bNumConfigurations;
94} __attribute__ ((packed));
95
96struct usb_interface_descriptor {
97 __u8 bLength;
98 __u8 bDescriptorType;
99
100 __u8 bInterfaceNumber;
101 __u8 bAlternateSetting;
102 __u8 bNumEndpoints;
103 __u8 bInterfaceClass;
104 __u8 bInterfaceSubClass;
105 __u8 bInterfaceProtocol;
106 __u8 iInterface;
107} __attribute__ ((packed));
108
/* Bus speed of a device; the numeric values are consecutive from zero. */
enum usb_device_speed {
	USB_SPEED_UNKNOWN	= 0,	/* enumerating */
	USB_SPEED_LOW		= 1,	/* usb 1.1 */
	USB_SPEED_FULL		= 2,	/* usb 1.1 */
	USB_SPEED_HIGH		= 3	/* usb 2.0 */
};
114
115/*-------------------------------------------------------------------------*/
116
117static char *speed (enum usb_device_speed s)
118{
119 switch (s) {
120 case USB_SPEED_UNKNOWN: return "unknown";
121 case USB_SPEED_LOW: return "low";
122 case USB_SPEED_FULL: return "full";
123 case USB_SPEED_HIGH: return "high";
124 default: return "??";
125 }
126}
127
128struct testdev {
129 struct testdev *next;
130 char *name;
131 pthread_t thread;
132 enum usb_device_speed speed;
133 unsigned ifnum : 8;
134 unsigned forever : 1;
135 int test;
136
137 struct usbtest_param param;
138};
139static struct testdev *testdevs;
140
141static int testdev_ffs_ifnum(FILE *fd)
142{
143 union {
144 char buf[255];
145 struct usb_interface_descriptor intf;
146 } u;
147
148 for (;;) {
149 if (fread(u.buf, 1, 1, fd) != 1)
150 return -1;
151 if (fread(u.buf + 1, (unsigned char)u.buf[0] - 1, 1, fd) != 1)
152 return -1;
153
154 if (u.intf.bLength == sizeof u.intf
155 && u.intf.bDescriptorType == USB_DT_INTERFACE
156 && u.intf.bNumEndpoints == 2
157 && u.intf.bInterfaceClass == USB_CLASS_VENDOR_SPEC
158 && u.intf.bInterfaceSubClass == 0
159 && u.intf.bInterfaceProtocol == 0)
160 return (unsigned char)u.intf.bInterfaceNumber;
161 }
162}
163
164static int testdev_ifnum(FILE *fd)
165{
166 struct usb_device_descriptor dev;
167
168 if (fread(&dev, sizeof dev, 1, fd) != 1)
169 return -1;
170
171 if (dev.bLength != sizeof dev || dev.bDescriptorType != USB_DT_DEVICE)
172 return -1;
173
174 /* FX2 with (tweaked) bulksrc firmware */
175 if (dev.idVendor == 0x0547 && dev.idProduct == 0x1002)
176 return 0;
177
178 /*----------------------------------------------------*/
179
180 /* devices that start up using the EZ-USB default device and
181 * which we can use after loading simple firmware. hotplug
182 * can fxload it, and then run this test driver.
183 *
184 * we return false positives in two cases:
185 * - the device has a "real" driver (maybe usb-serial) that
186 * renumerates. the device should vanish quickly.
187 * - the device doesn't have the test firmware installed.
188 */
189
190 /* generic EZ-USB FX controller */
191 if (dev.idVendor == 0x0547 && dev.idProduct == 0x2235)
192 return 0;
193
194 /* generic EZ-USB FX2 controller */
195 if (dev.idVendor == 0x04b4 && dev.idProduct == 0x8613)
196 return 0;
197
198 /* CY3671 development board with EZ-USB FX */
199 if (dev.idVendor == 0x0547 && dev.idProduct == 0x0080)
200 return 0;
201
202 /* Keyspan 19Qi uses an21xx (original EZ-USB) */
203 if (dev.idVendor == 0x06cd && dev.idProduct == 0x010b)
204 return 0;
205
206 /*----------------------------------------------------*/
207
208 /* "gadget zero", Linux-USB test software */
209 if (dev.idVendor == 0x0525 && dev.idProduct == 0xa4a0)
210 return 0;
211
212 /* user mode subset of that */
213 if (dev.idVendor == 0x0525 && dev.idProduct == 0xa4a4)
214 return testdev_ffs_ifnum(fd);
215 /* return 0; */
216
217 /* iso version of usermode code */
218 if (dev.idVendor == 0x0525 && dev.idProduct == 0xa4a3)
219 return 0;
220
221 /* some GPL'd test firmware uses these IDs */
222
223 if (dev.idVendor == 0xfff0 && dev.idProduct == 0xfff0)
224 return 0;
225
226 /*----------------------------------------------------*/
227
228 /* iBOT2 high speed webcam */
229 if (dev.idVendor == 0x0b62 && dev.idProduct == 0x0059)
230 return 0;
231
232 /*----------------------------------------------------*/
233
234 /* the FunctionFS gadget can have the source/sink interface
235 * anywhere. We look for an interface descriptor that match
236 * what we expect. We ignore configuratiens thou. */
237
238 if (dev.idVendor == 0x0525 && dev.idProduct == 0xa4ac
239 && (dev.bDeviceClass == USB_CLASS_PER_INTERFACE
240 || dev.bDeviceClass == USB_CLASS_VENDOR_SPEC))
241 return testdev_ffs_ifnum(fd);
242
243 return -1;
244}
245
246static int find_testdev(const char *name, const struct stat *sb, int flag)
247{
248 FILE *fd;
249 int ifnum;
250 struct testdev *entry;
251
252 (void)sb; /* unused */
253
254 if (flag != FTW_F)
255 return 0;
256 /* ignore /proc/bus/usb/{devices,drivers} */
257 if (strrchr(name, '/')[1] == 'd')
258 return 0;
259
260 fd = fopen(name, "rb");
261 if (!fd) {
262 perror(name);
263 return 0;
264 }
265
266 ifnum = testdev_ifnum(fd);
267 fclose(fd);
268 if (ifnum < 0)
269 return 0;
270
271 entry = calloc(1, sizeof *entry);
272 if (!entry)
273 goto nomem;
274
275 entry->name = strdup(name);
276 if (!entry->name) {
277 free(entry);
278nomem:
279 perror("malloc");
280 return 0;
281 }
282
283 entry->ifnum = ifnum;
284
285 /* FIXME ask usbfs what speed; update USBDEVFS_CONNECTINFO so
286 * it tells about high speed etc */
287
288 fprintf(stderr, "%s speed\t%s\t%u\n",
289 speed(entry->speed), entry->name, entry->ifnum);
290
291 entry->next = testdevs;
292 testdevs = entry;
293 return 0;
294}
295
296static int
297usbdev_ioctl (int fd, int ifno, unsigned request, void *param)
298{
299 struct usbdevfs_ioctl wrapper;
300
301 wrapper.ifno = ifno;
302 wrapper.ioctl_code = request;
303 wrapper.data = param;
304
305 return ioctl (fd, USBDEVFS_IOCTL, &wrapper);
306}
307
308static void *handle_testdev (void *arg)
309{
310 struct testdev *dev = arg;
311 int fd, i;
312 int status;
313
314 if ((fd = open (dev->name, O_RDWR)) < 0) {
315 perror ("can't open dev file r/w");
316 return 0;
317 }
318
319restart:
320 for (i = 0; i < TEST_CASES; i++) {
321 if (dev->test != -1 && dev->test != i)
322 continue;
323 dev->param.test_num = i;
324
325 status = usbdev_ioctl (fd, dev->ifnum,
326 USBTEST_REQUEST, &dev->param);
327 if (status < 0 && errno == EOPNOTSUPP)
328 continue;
329
330 /* FIXME need a "syslog it" option for background testing */
331
332 /* NOTE: each thread emits complete lines; no fragments! */
333 if (status < 0) {
334 char buf [80];
335 int err = errno;
336
337 if (strerror_r (errno, buf, sizeof buf)) {
338 snprintf (buf, sizeof buf, "error %d", err);
339 errno = err;
340 }
341 printf ("%s test %d --> %d (%s)\n",
342 dev->name, i, errno, buf);
343 } else
344 printf ("%s test %d, %4d.%.06d secs\n", dev->name, i,
345 (int) dev->param.duration.tv_sec,
346 (int) dev->param.duration.tv_usec);
347
348 fflush (stdout);
349 }
350 if (dev->forever)
351 goto restart;
352
353 close (fd);
354 return arg;
355}
356
/*
 * Locate the usbfs mount point by probing for its "devices" file in the
 * two conventional locations.
 *
 * Returns the directory ("/dev/usb" or "/proc/bus/usb") of the first probe
 * file that can be opened for reading, or NULL when neither can.  The
 * returned string is constant, so repeated calls give the same answer.
 */
static const char *usbfs_dir_find(void)
{
	static const struct {
		const char *probe;	/* file that marks a usbfs mount */
		const char *dir;	/* directory holding that file */
	} candidates[] = {
		{ "/dev/usb/devices",		"/dev/usb" },
		{ "/proc/bus/usb/devices",	"/proc/bus/usb" },
	};
	size_t i;

	for (i = 0; i < sizeof candidates / sizeof candidates[0]; ++i) {
		int fd = open(candidates[i].probe, O_RDONLY);

		/* nothing to close when the open itself failed */
		if (fd < 0)
			continue;

		close(fd);
		return candidates[i].dir;
	}

	return NULL;
}
381
/*
 * Parse @str as an unsigned number (decimal, 0x-prefixed hexadecimal or
 * 0-prefixed octal) and store it in *@num.
 *
 * Returns 0 on success.  Returns -1 and leaves *@num untouched when the
 * string is empty, contains anything besides the number, carries a minus
 * sign, or does not fit in an unsigned int.
 */
static int parse_num(unsigned *num, const char *str)
{
	unsigned long val;
	char *end;

	/*
	 * strtoul() accepts "-N" and returns the negated value; a '-' can
	 * only ever be such a sign or trailing garbage, so reject it early.
	 */
	if (strchr(str, '-'))
		return -1;

	errno = 0;
	val = strtoul(str, &end, 0);
	/* end == str: no digits were consumed (e.g. empty string) */
	if (errno || end == str || *end || val > UINT_MAX)
		return -1;
	*num = val;
	return 0;
}
394
395int main (int argc, char **argv)
396{
397
398 int c;
399 struct testdev *entry;
400 char *device;
401 const char *usbfs_dir = NULL;
402 int all = 0, forever = 0, not = 0;
403 int test = -1 /* all */;
404 struct usbtest_param param;
405
406 /* pick defaults that works with all speeds, without short packets.
407 *
408 * Best per-frame data rates:
409 * high speed, bulk 512 * 13 * 8 = 53248
410 * interrupt 1024 * 3 * 8 = 24576
411 * full speed, bulk/intr 64 * 19 = 1216
412 * interrupt 64 * 1 = 64
413 * low speed, interrupt 8 * 1 = 8
414 */
415 param.iterations = 1000;
416 param.length = 512;
417 param.vary = 512;
418 param.sglen = 32;
419
420 /* for easy use when hotplugging */
421 device = getenv ("DEVICE");
422
423 while ((c = getopt (argc, argv, "D:aA:c:g:hns:t:v:")) != EOF)
424 switch (c) {
425 case 'D': /* device, if only one */
426 device = optarg;
427 continue;
428 case 'A': /* use all devices with specified usbfs dir */
429 usbfs_dir = optarg;
430 /* FALL THROUGH */
431 case 'a': /* use all devices */
432 device = NULL;
433 all = 1;
434 continue;
435 case 'c': /* count iterations */
436 if (parse_num(&param.iterations, optarg))
437 goto usage;
438 continue;
439 case 'g': /* scatter/gather entries */
440 if (parse_num(&param.sglen, optarg))
441 goto usage;
442 continue;
443 case 'l': /* loop forever */
444 forever = 1;
445 continue;
446 case 'n': /* no test running! */
447 not = 1;
448 continue;
449 case 's': /* size of packet */
450 if (parse_num(&param.length, optarg))
451 goto usage;
452 continue;
453 case 't': /* run just one test */
454 test = atoi (optarg);
455 if (test < 0)
456 goto usage;
457 continue;
458 case 'v': /* vary packet size by ... */
459 if (parse_num(&param.vary, optarg))
460 goto usage;
461 continue;
462 case '?':
463 case 'h':
464 default:
465usage:
466 fprintf (stderr, "usage: %s [-n] [-D dev | -a | -A usbfs-dir]\n"
467 "\t[-c iterations] [-t testnum]\n"
468 "\t[-s packetsize] [-g sglen] [-v vary]\n",
469 argv [0]);
470 return 1;
471 }
472 if (optind != argc)
473 goto usage;
474 if (!all && !device) {
475 fprintf (stderr, "must specify '-a' or '-D dev', "
476 "or DEVICE=/proc/bus/usb/BBB/DDD in env\n");
477 goto usage;
478 }
479
480 /* Find usbfs mount point */
481 if (!usbfs_dir) {
482 usbfs_dir = usbfs_dir_find();
483 if (!usbfs_dir) {
484 fputs ("usbfs files are missing\n", stderr);
485 return -1;
486 }
487 }
488
489 /* collect and list the test devices */
490 if (ftw (usbfs_dir, find_testdev, 3) != 0) {
491 fputs ("ftw failed; is usbfs missing?\n", stderr);
492 return -1;
493 }
494
495 /* quit, run single test, or create test threads */
496 if (!testdevs && !device) {
497 fputs ("no test devices recognized\n", stderr);
498 return -1;
499 }
500 if (not)
501 return 0;
502 if (testdevs && testdevs->next == 0 && !device)
503 device = testdevs->name;
504 for (entry = testdevs; entry; entry = entry->next) {
505 int status;
506
507 entry->param = param;
508 entry->forever = forever;
509 entry->test = test;
510
511 if (device) {
512 if (strcmp (entry->name, device))
513 continue;
514 return handle_testdev (entry) != entry;
515 }
516 status = pthread_create (&entry->thread, 0, handle_testdev, entry);
517 if (status) {
518 perror ("pthread_create");
519 continue;
520 }
521 }
522 if (device) {
523 struct testdev dev;
524
525 /* kernel can recognize test devices we don't */
526 fprintf (stderr, "%s: %s may see only control tests\n",
527 argv [0], device);
528
529 memset (&dev, 0, sizeof dev);
530 dev.name = device;
531 dev.param = param;
532 dev.forever = forever;
533 dev.test = test;
534 return handle_testdev (&dev) != &dev;
535 }
536
537 /* wait for tests to complete */
538 for (entry = testdevs; entry; entry = entry->next) {
539 void *retval;
540
541 if (pthread_join (entry->thread, &retval))
542 perror ("pthread_join");
543 /* testing errors discarded! */
544 }
545
546 return 0;
547}