diff options
author | Kirill Smelkov <kirr@landau.phys.spbu.ru> | 2010-02-07 08:46:15 -0500 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2010-02-07 11:30:20 -0500 |
commit | ee11b90b12eb1ec25e1044bac861e90bfd19ec9e (patch) | |
tree | 987838529d9b80246841d63755db48b1e87ce30c /tools/perf | |
parent | 5ecaafdbf44b1ba400b746c60c401d54c7ee0863 (diff) |
perf top: Fix annotate for userspace
First, for programs and prelinked libraries, annotate code was
fooled by objdump output IPs (src->eip in the code) being
wrongly converted to absolute IPs. In such a case no conversion
was needed, but in
src->eip = strtoull(src->line, NULL, 16);
src->eip = map->unmap_ip(map, src->eip); // = eip + map->start - map->pgoff
we were reading absolute address from objdump (e.g. 8048604) and
then almost doubling it, because eip & map->start are
approximately close for small programs.
Needless to say, later on, in record_precise_ip(), nothing matched
the real runtime IPs.
And second, like with `perf annotate` the problem with
non-prelinked *.so was that we were doing rip -> objdump address
conversion wrong.
Also, because, unlike `perf annotate`, the `perf top` code does
annotation based on absolute IPs for performance reasons(*), a new
helper for mapping objdump addresses to IPs is introduced.
(*) we get samples info in absolute IPs, and since we do lots of
hit-testing on absolute IPs at runtime in record_precise_ip(), it's
better to convert objdump addresses to IPs once and do no conversion
at runtime.
I also had to fix how objdump output is parsed (it assumed a
hardcoded 8/16-character address format, which was inappropriate
for ET_DYN dsos with small addresses like '4ac').
Also note that not all objdump output lines have associated
IPs; e.g. look at the source lines here:
000004ac <my_strlen>:
extern "C"
int my_strlen(const char *s)
4ac: 55 push %ebp
4ad: 89 e5 mov %esp,%ebp
4af: 83 ec 10 sub $0x10,%esp
{
int len = 0;
4b2: c7 45 fc 00 00 00 00 movl $0x0,-0x4(%ebp)
4b9: eb 08 jmp 4c3 <my_strlen+0x17>
while (*s) {
++len;
4bb: 83 45 fc 01 addl $0x1,-0x4(%ebp)
++s;
4bf: 83 45 08 01 addl $0x1,0x8(%ebp)
So we mark them with eip=0, and ignore such lines in annotate
lookup code.
Signed-off-by: Kirill Smelkov <kirr@landau.phys.spbu.ru>
[ Note: one hunk of this patch was applied by Mike in 57d8188 ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Mike Galbraith <efault@gmx.de>
LKML-Reference: <1265550376-12665-1-git-send-email-acme@infradead.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'tools/perf')
-rw-r--r-- | tools/perf/builtin-top.c | 18 | ||||
-rw-r--r-- | tools/perf/util/map.c | 8 | ||||
-rw-r--r-- | tools/perf/util/map.h | 4 |
3 files changed, 19 insertions, 11 deletions
diff --git a/tools/perf/builtin-top.c b/tools/perf/builtin-top.c index e4156bc4566d..befa57e2284d 100644 --- a/tools/perf/builtin-top.c +++ b/tools/perf/builtin-top.c | |||
@@ -216,7 +216,7 @@ static void parse_source(struct sym_entry *syme) | |||
216 | while (!feof(file)) { | 216 | while (!feof(file)) { |
217 | struct source_line *src; | 217 | struct source_line *src; |
218 | size_t dummy = 0; | 218 | size_t dummy = 0; |
219 | char *c; | 219 | char *c, *sep; |
220 | 220 | ||
221 | src = malloc(sizeof(struct source_line)); | 221 | src = malloc(sizeof(struct source_line)); |
222 | assert(src != NULL); | 222 | assert(src != NULL); |
@@ -235,14 +235,11 @@ static void parse_source(struct sym_entry *syme) | |||
235 | *source->lines_tail = src; | 235 | *source->lines_tail = src; |
236 | source->lines_tail = &src->next; | 236 | source->lines_tail = &src->next; |
237 | 237 | ||
238 | if (strlen(src->line)>8 && src->line[8] == ':') { | 238 | src->eip = strtoull(src->line, &sep, 16); |
239 | src->eip = strtoull(src->line, NULL, 16); | 239 | if (*sep == ':') |
240 | src->eip = map->unmap_ip(map, src->eip); | 240 | src->eip = map__objdump_2ip(map, src->eip); |
241 | } | 241 | else /* this line has no ip info (e.g. source line) */ |
242 | if (strlen(src->line)>8 && src->line[16] == ':') { | 242 | src->eip = 0; |
243 | src->eip = strtoull(src->line, NULL, 16); | ||
244 | src->eip = map->unmap_ip(map, src->eip); | ||
245 | } | ||
246 | } | 243 | } |
247 | pclose(file); | 244 | pclose(file); |
248 | out_assign: | 245 | out_assign: |
@@ -277,6 +274,9 @@ static void record_precise_ip(struct sym_entry *syme, int counter, u64 ip) | |||
277 | goto out_unlock; | 274 | goto out_unlock; |
278 | 275 | ||
279 | for (line = syme->src->lines; line; line = line->next) { | 276 | for (line = syme->src->lines; line; line = line->next) { |
277 | /* skip lines without IP info */ | ||
278 | if (line->eip == 0) | ||
279 | continue; | ||
280 | if (line->eip == ip) { | 280 | if (line->eip == ip) { |
281 | line->count[counter]++; | 281 | line->count[counter]++; |
282 | break; | 282 | break; |
diff --git a/tools/perf/util/map.c b/tools/perf/util/map.c index af5805f51314..138e3cb2b727 100644 --- a/tools/perf/util/map.c +++ b/tools/perf/util/map.c | |||
@@ -222,3 +222,11 @@ u64 map__rip_2objdump(struct map *map, u64 rip) | |||
222 | rip; | 222 | rip; |
223 | return addr; | 223 | return addr; |
224 | } | 224 | } |
225 | |||
226 | u64 map__objdump_2ip(struct map *map, u64 addr) | ||
227 | { | ||
228 | u64 ip = map->dso->adjust_symbols ? | ||
229 | addr : | ||
230 | map->unmap_ip(map, addr); /* RIP -> IP */ | ||
231 | return ip; | ||
232 | } | ||
diff --git a/tools/perf/util/map.h b/tools/perf/util/map.h index 9cee9c788dbf..86f77cb1d060 100644 --- a/tools/perf/util/map.h +++ b/tools/perf/util/map.h | |||
@@ -61,9 +61,9 @@ static inline u64 identity__map_ip(struct map *map __used, u64 ip) | |||
61 | } | 61 | } |
62 | 62 | ||
63 | 63 | ||
64 | /* rip -> addr suitable for passing to `objdump --start-address=` */ | 64 | /* rip/ip <-> addr suitable for passing to `objdump --start-address=` */ |
65 | u64 map__rip_2objdump(struct map *map, u64 rip); | 65 | u64 map__rip_2objdump(struct map *map, u64 rip); |
66 | 66 | u64 map__objdump_2ip(struct map *map, u64 addr); | |
67 | 67 | ||
68 | struct symbol; | 68 | struct symbol; |
69 | struct mmap_event; | 69 | struct mmap_event; |