aboutsummaryrefslogtreecommitdiffstats
path: root/tools/perf
diff options
context:
space:
mode:
authorKirill Smelkov <kirr@landau.phys.spbu.ru>2010-02-07 08:46:15 -0500
committerIngo Molnar <mingo@elte.hu>2010-02-07 11:30:20 -0500
commitee11b90b12eb1ec25e1044bac861e90bfd19ec9e (patch)
tree987838529d9b80246841d63755db48b1e87ce30c /tools/perf
parent5ecaafdbf44b1ba400b746c60c401d54c7ee0863 (diff)
perf top: Fix annotate for userspace
First, for programs and prelinked libraries, annotate code was fooled by objdump output IPs (src->eip in the code) being wrongly converted to absolute IPs. In such a case no conversion was needed, but in src->eip = strtoull(src->line, NULL, 16); src->eip = map->unmap_ip(map, src->eip); // = eip + map->start - map->pgoff we were reading an absolute address from objdump (e.g. 8048604) and then almost doubling it, because eip & map->start are approximately close for small programs. Needless to say, later, in record_precise_ip(), there was no matching with real runtime IPs. And second, like with `perf annotate`, the problem with non-prelinked *.so was that we were doing the rip -> objdump address conversion wrong. Also, because unlike `perf annotate`, `perf top` code does annotation based on absolute IPs for performance reasons(*), a new helper for mapping objdump addresses to IPs is introduced. (*) we get samples info in absolute IPs, and since we do lots of hit-testing on absolute IPs at runtime in record_precise_ip(), it's better to convert objdump addresses to IPs once and do no conversion at runtime. I also had to fix how objdump output is parsed (with hardcoded 8/16 characters format, which was inappropriate for ET_DYN dsos with small addresses like '4ac'). Also note that not all objdump output lines have associated IPs, e.g. look at source lines here: 000004ac <my_strlen>: extern "C" int my_strlen(const char *s) 4ac: 55 push %ebp 4ad: 89 e5 mov %esp,%ebp 4af: 83 ec 10 sub $0x10,%esp { int len = 0; 4b2: c7 45 fc 00 00 00 00 movl $0x0,-0x4(%ebp) 4b9: eb 08 jmp 4c3 <my_strlen+0x17> while (*s) { ++len; 4bb: 83 45 fc 01 addl $0x1,-0x4(%ebp) ++s; 4bf: 83 45 08 01 addl $0x1,0x8(%ebp) So we mark them with eip=0, and ignore such lines in annotate lookup code.
Signed-off-by: Kirill Smelkov <kirr@landau.phys.spbu.ru> [ Note: one hunk of this patch was applied by Mike in 57d8188 ] Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com> Cc: Mike Galbraith <efault@gmx.de> LKML-Reference: <1265550376-12665-1-git-send-email-acme@infradead.org> Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'tools/perf')
-rw-r--r--tools/perf/builtin-top.c18
-rw-r--r--tools/perf/util/map.c8
-rw-r--r--tools/perf/util/map.h4
3 files changed, 19 insertions, 11 deletions
diff --git a/tools/perf/builtin-top.c b/tools/perf/builtin-top.c
index e4156bc4566d..befa57e2284d 100644
--- a/tools/perf/builtin-top.c
+++ b/tools/perf/builtin-top.c
@@ -216,7 +216,7 @@ static void parse_source(struct sym_entry *syme)
216 while (!feof(file)) { 216 while (!feof(file)) {
217 struct source_line *src; 217 struct source_line *src;
218 size_t dummy = 0; 218 size_t dummy = 0;
219 char *c; 219 char *c, *sep;
220 220
221 src = malloc(sizeof(struct source_line)); 221 src = malloc(sizeof(struct source_line));
222 assert(src != NULL); 222 assert(src != NULL);
@@ -235,14 +235,11 @@ static void parse_source(struct sym_entry *syme)
235 *source->lines_tail = src; 235 *source->lines_tail = src;
236 source->lines_tail = &src->next; 236 source->lines_tail = &src->next;
237 237
238 if (strlen(src->line)>8 && src->line[8] == ':') { 238 src->eip = strtoull(src->line, &sep, 16);
239 src->eip = strtoull(src->line, NULL, 16); 239 if (*sep == ':')
240 src->eip = map->unmap_ip(map, src->eip); 240 src->eip = map__objdump_2ip(map, src->eip);
241 } 241 else /* this line has no ip info (e.g. source line) */
242 if (strlen(src->line)>8 && src->line[16] == ':') { 242 src->eip = 0;
243 src->eip = strtoull(src->line, NULL, 16);
244 src->eip = map->unmap_ip(map, src->eip);
245 }
246 } 243 }
247 pclose(file); 244 pclose(file);
248out_assign: 245out_assign:
@@ -277,6 +274,9 @@ static void record_precise_ip(struct sym_entry *syme, int counter, u64 ip)
277 goto out_unlock; 274 goto out_unlock;
278 275
279 for (line = syme->src->lines; line; line = line->next) { 276 for (line = syme->src->lines; line; line = line->next) {
277 /* skip lines without IP info */
278 if (line->eip == 0)
279 continue;
280 if (line->eip == ip) { 280 if (line->eip == ip) {
281 line->count[counter]++; 281 line->count[counter]++;
282 break; 282 break;
diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c
index af5805f51314..138e3cb2b727 100644
--- a/tools/perf/util/map.c
+++ b/tools/perf/util/map.c
@@ -222,3 +222,11 @@ u64 map__rip_2objdump(struct map *map, u64 rip)
222 rip; 222 rip;
223 return addr; 223 return addr;
224} 224}
225
226u64 map__objdump_2ip(struct map *map, u64 addr)
227{
228 u64 ip = map->dso->adjust_symbols ?
229 addr :
230 map->unmap_ip(map, addr); /* RIP -> IP */
231 return ip;
232}
diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h
index 9cee9c788dbf..86f77cb1d060 100644
--- a/tools/perf/util/map.h
+++ b/tools/perf/util/map.h
@@ -61,9 +61,9 @@ static inline u64 identity__map_ip(struct map *map __used, u64 ip)
61} 61}
62 62
63 63
64/* rip -> addr suitable for passing to `objdump --start-address=` */ 64/* rip/ip <-> addr suitable for passing to `objdump --start-address=` */
65u64 map__rip_2objdump(struct map *map, u64 rip); 65u64 map__rip_2objdump(struct map *map, u64 rip);
66 66u64 map__objdump_2ip(struct map *map, u64 addr);
67 67
68struct symbol; 68struct symbol;
69struct mmap_event; 69struct mmap_event;