aboutsummaryrefslogtreecommitdiffstats
path: root/tools/perf
diff options
context:
space:
mode:
authorArnaldo Carvalho de Melo <acme@redhat.com>2009-09-28 13:48:46 -0400
committerIngo Molnar <mingo@elte.hu>2009-09-30 07:57:56 -0400
commit1b46cddfccfec4cc67b187fb53d78198de6a057c (patch)
tree813836ec58396e15008bfb39e7209a6bcc6e2f58 /tools/perf
parent3d1d07ecd2009f65cb2091563fa21f9600c36774 (diff)
perf tools: Use rb_tree for maps
Threads can have many and kernel modules will be represented as a tree of maps as well. Ah, and for a perf.data with 146607 samples: Before: [root@doppio ~]# perf stat -r 5 perf report > /dev/null Performance counter stats for 'perf report' (5 runs): 699.823680 task-clock-msecs # 0.991 CPUs ( +- 0.454% ) 74 context-switches # 0.000 M/sec ( +- 1.709% ) 2 CPU-migrations # 0.000 M/sec ( +- 17.008% ) 23114 page-faults # 0.033 M/sec ( +- 0.000% ) 1381257019 cycles # 1973.721 M/sec ( +- 0.290% ) 1456894438 instructions # 1.055 IPC ( +- 0.007% ) 18779818 cache-references # 26.835 M/sec ( +- 0.380% ) 641799 cache-misses # 0.917 M/sec ( +- 1.200% ) 0.705972729 seconds time elapsed ( +- 0.501% ) [root@doppio ~]# After Performance counter stats for 'perf report' (5 runs): 691.261451 task-clock-msecs # 0.993 CPUs ( +- 0.307% ) 72 context-switches # 0.000 M/sec ( +- 0.829% ) 6 CPU-migrations # 0.000 M/sec ( +- 18.409% ) 23127 page-faults # 0.033 M/sec ( +- 0.000% ) 1366395876 cycles # 1976.670 M/sec ( +- 0.153% ) 1443136016 instructions # 1.056 IPC ( +- 0.012% ) 17956402 cache-references # 25.976 M/sec ( +- 0.325% ) 661924 cache-misses # 0.958 M/sec ( +- 1.335% ) 0.696127275 seconds time elapsed ( +- 0.377% ) I.e. we see some speedup too. Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> Cc: Frédéric Weisbecker <fweisbec@gmail.com> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Mike Galbraith <efault@gmx.de> Cc: "H. Peter Anvin" <hpa@zytor.com> LKML-Reference: <20090928174846.GA3361@ghostprotocols.net> Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'tools/perf')
-rw-r--r--tools/perf/Makefile1
-rw-r--r--tools/perf/util/event.h4
-rw-r--r--tools/perf/util/thread.c129
-rw-r--r--tools/perf/util/thread.h12
4 files changed, 95 insertions, 51 deletions
diff --git a/tools/perf/Makefile b/tools/perf/Makefile
index 3a99a9fda645..055290a5b835 100644
--- a/tools/perf/Makefile
+++ b/tools/perf/Makefile
@@ -341,6 +341,7 @@ LIB_H += util/color.h
341LIB_H += util/values.h 341LIB_H += util/values.h
342LIB_H += util/sort.h 342LIB_H += util/sort.h
343LIB_H += util/hist.h 343LIB_H += util/hist.h
344LIB_H += util/thread.h
344 345
345LIB_OBJS += util/abspath.o 346LIB_OBJS += util/abspath.o
346LIB_OBJS += util/alias.o 347LIB_OBJS += util/alias.o
diff --git a/tools/perf/util/event.h b/tools/perf/util/event.h
index c31a5da6458b..4c69eb553807 100644
--- a/tools/perf/util/event.h
+++ b/tools/perf/util/event.h
@@ -3,7 +3,7 @@
3 3
4#include "../perf.h" 4#include "../perf.h"
5#include "util.h" 5#include "util.h"
6#include <linux/list.h> 6#include <linux/rbtree.h>
7 7
8enum { 8enum {
9 SHOW_KERNEL = 1, 9 SHOW_KERNEL = 1,
@@ -79,7 +79,7 @@ typedef union event_union {
79} event_t; 79} event_t;
80 80
81struct map { 81struct map {
82 struct list_head node; 82 struct rb_node rb_node;
83 u64 start; 83 u64 start;
84 u64 end; 84 u64 end;
85 u64 pgoff; 85 u64 pgoff;
diff --git a/tools/perf/util/thread.c b/tools/perf/util/thread.c
index 45efb5db0d19..9d0945cc66d1 100644
--- a/tools/perf/util/thread.c
+++ b/tools/perf/util/thread.c
@@ -15,7 +15,7 @@ static struct thread *thread__new(pid_t pid)
15 self->comm = malloc(32); 15 self->comm = malloc(32);
16 if (self->comm) 16 if (self->comm)
17 snprintf(self->comm, 32, ":%d", self->pid); 17 snprintf(self->comm, 32, ":%d", self->pid);
18 INIT_LIST_HEAD(&self->maps); 18 self->maps = RB_ROOT;
19 } 19 }
20 20
21 return self; 21 return self;
@@ -31,11 +31,13 @@ int thread__set_comm(struct thread *self, const char *comm)
31 31
32static size_t thread__fprintf(struct thread *self, FILE *fp) 32static size_t thread__fprintf(struct thread *self, FILE *fp)
33{ 33{
34 struct map *pos; 34 struct rb_node *nd;
35 size_t ret = fprintf(fp, "Thread %d %s\n", self->pid, self->comm); 35 size_t ret = fprintf(fp, "Thread %d %s\n", self->pid, self->comm);
36 36
37 list_for_each_entry(pos, &self->maps, node) 37 for (nd = rb_first(&self->maps); nd; nd = rb_next(nd)) {
38 struct map *pos = rb_entry(nd, struct map, rb_node);
38 ret += map__fprintf(pos, fp); 39 ret += map__fprintf(pos, fp);
40 }
39 41
40 return ret; 42 return ret;
41} 43}
@@ -93,42 +95,90 @@ register_idle_thread(struct rb_root *threads, struct thread **last_match)
93 return thread; 95 return thread;
94} 96}
95 97
96void thread__insert_map(struct thread *self, struct map *map) 98static void thread__remove_overlappings(struct thread *self, struct map *map)
97{ 99{
98 struct map *pos, *tmp; 100 struct rb_node *next = rb_first(&self->maps);
99 101
100 list_for_each_entry_safe(pos, tmp, &self->maps, node) { 102 while (next) {
101 if (map__overlap(pos, map)) { 103 struct map *pos = rb_entry(next, struct map, rb_node);
102 if (verbose >= 2) { 104 next = rb_next(&pos->rb_node);
103 printf("overlapping maps:\n"); 105
104 map__fprintf(map, stdout); 106 if (!map__overlap(pos, map))
105 map__fprintf(pos, stdout); 107 continue;
106 } 108
107 109 if (verbose >= 2) {
108 if (map->start <= pos->start && map->end > pos->start) 110 printf("overlapping maps:\n");
109 pos->start = map->end; 111 map__fprintf(map, stdout);
110 112 map__fprintf(pos, stdout);
111 if (map->end >= pos->end && map->start < pos->end) 113 }
112 pos->end = map->start; 114
113 115 if (map->start <= pos->start && map->end > pos->start)
114 if (verbose >= 2) { 116 pos->start = map->end;
115 printf("after collision:\n"); 117
116 map__fprintf(pos, stdout); 118 if (map->end >= pos->end && map->start < pos->end)
117 } 119 pos->end = map->start;
118 120
119 if (pos->start >= pos->end) { 121 if (verbose >= 2) {
120 list_del_init(&pos->node); 122 printf("after collision:\n");
121 free(pos); 123 map__fprintf(pos, stdout);
122 } 124 }
125
126 if (pos->start >= pos->end) {
127 rb_erase(&pos->rb_node, &self->maps);
128 free(pos);
123 } 129 }
124 } 130 }
131}
132
133void maps__insert(struct rb_root *maps, struct map *map)
134{
135 struct rb_node **p = &maps->rb_node;
136 struct rb_node *parent = NULL;
137 const u64 ip = map->start;
138 struct map *m;
139
140 while (*p != NULL) {
141 parent = *p;
142 m = rb_entry(parent, struct map, rb_node);
143 if (ip < m->start)
144 p = &(*p)->rb_left;
145 else
146 p = &(*p)->rb_right;
147 }
148
149 rb_link_node(&map->rb_node, parent, p);
150 rb_insert_color(&map->rb_node, maps);
151}
152
153struct map *maps__find(struct rb_root *maps, u64 ip)
154{
155 struct rb_node **p = &maps->rb_node;
156 struct rb_node *parent = NULL;
157 struct map *m;
158
159 while (*p != NULL) {
160 parent = *p;
161 m = rb_entry(parent, struct map, rb_node);
162 if (ip < m->start)
163 p = &(*p)->rb_left;
164 else if (ip > m->end)
165 p = &(*p)->rb_right;
166 else
167 return m;
168 }
169
170 return NULL;
171}
125 172
126 list_add_tail(&map->node, &self->maps); 173void thread__insert_map(struct thread *self, struct map *map)
174{
175 thread__remove_overlappings(self, map);
176 maps__insert(&self->maps, map);
127} 177}
128 178
129int thread__fork(struct thread *self, struct thread *parent) 179int thread__fork(struct thread *self, struct thread *parent)
130{ 180{
131 struct map *map; 181 struct rb_node *nd;
132 182
133 if (self->comm) 183 if (self->comm)
134 free(self->comm); 184 free(self->comm);
@@ -136,7 +186,8 @@ int thread__fork(struct thread *self, struct thread *parent)
136 if (!self->comm) 186 if (!self->comm)
137 return -ENOMEM; 187 return -ENOMEM;
138 188
139 list_for_each_entry(map, &parent->maps, node) { 189 for (nd = rb_first(&parent->maps); nd; nd = rb_next(nd)) {
190 struct map *map = rb_entry(nd, struct map, rb_node);
140 struct map *new = map__clone(map); 191 struct map *new = map__clone(map);
141 if (!new) 192 if (!new)
142 return -ENOMEM; 193 return -ENOMEM;
@@ -146,20 +197,6 @@ int thread__fork(struct thread *self, struct thread *parent)
146 return 0; 197 return 0;
147} 198}
148 199
149struct map *thread__find_map(struct thread *self, u64 ip)
150{
151 struct map *pos;
152
153 if (self == NULL)
154 return NULL;
155
156 list_for_each_entry(pos, &self->maps, node)
157 if (ip >= pos->start && ip <= pos->end)
158 return pos;
159
160 return NULL;
161}
162
163size_t threads__fprintf(FILE *fp, struct rb_root *threads) 200size_t threads__fprintf(FILE *fp, struct rb_root *threads)
164{ 201{
165 size_t ret = 0; 202 size_t ret = 0;
diff --git a/tools/perf/util/thread.h b/tools/perf/util/thread.h
index 693ed1ea10b4..bbb37c1a52ee 100644
--- a/tools/perf/util/thread.h
+++ b/tools/perf/util/thread.h
@@ -2,13 +2,12 @@
2#define __PERF_THREAD_H 2#define __PERF_THREAD_H
3 3
4#include <linux/rbtree.h> 4#include <linux/rbtree.h>
5#include <linux/list.h>
6#include <unistd.h> 5#include <unistd.h>
7#include "symbol.h" 6#include "symbol.h"
8 7
9struct thread { 8struct thread {
10 struct rb_node rb_node; 9 struct rb_node rb_node;
11 struct list_head maps; 10 struct rb_root maps;
12 pid_t pid; 11 pid_t pid;
13 char shortname[3]; 12 char shortname[3];
14 char *comm; 13 char *comm;
@@ -21,7 +20,14 @@ struct thread *
21register_idle_thread(struct rb_root *threads, struct thread **last_match); 20register_idle_thread(struct rb_root *threads, struct thread **last_match);
22void thread__insert_map(struct thread *self, struct map *map); 21void thread__insert_map(struct thread *self, struct map *map);
23int thread__fork(struct thread *self, struct thread *parent); 22int thread__fork(struct thread *self, struct thread *parent);
24struct map *thread__find_map(struct thread *self, u64 ip);
25size_t threads__fprintf(FILE *fp, struct rb_root *threads); 23size_t threads__fprintf(FILE *fp, struct rb_root *threads);
26 24
25void maps__insert(struct rb_root *maps, struct map *map);
26struct map *maps__find(struct rb_root *maps, u64 ip);
27
28static inline struct map *thread__find_map(struct thread *self, u64 ip)
29{
30 return self ? maps__find(&self->maps, ip) : NULL;
31}
32
27#endif /* __PERF_THREAD_H */ 33#endif /* __PERF_THREAD_H */