aboutsummaryrefslogtreecommitdiffstats
path: root/tools/perf/builtin-record.c
diff options
context:
space:
mode:
authorIngo Molnar <mingo@elte.hu>2009-09-13 12:15:54 -0400
committerIngo Molnar <mingo@elte.hu>2009-09-14 09:45:11 -0400
commitea57c4f5203d82c7844c54cdef54e972cf4e9d1f (patch)
tree13eb76a07480adbfe1bcabd25cde7cdd12907ddb /tools/perf/builtin-record.c
parentaa1ab9d26ae9fe2566a9036e3cb83e7d555b3987 (diff)
perf tools: Implement counter output multiplexing
Finish the -M/--multiplex option implementation:

 - separate it out from group_fd
 - correctly set it via the ioctl and don't mmap counters that are multiplexed
 - modify the perf record event loop to deal with buffer-less counters.
 - remove the -g option from perf sched record
 - account for unordered events in perf sched latency
 - (add -f to perf sched record to ease measurements)
 - skip idle threads (pid==0) in latency output

The result is better latency output by 'perf sched latency':

 -----------------------------------------------------------------------------------
  Task            | Runtime ms | Switches | Average delay ms | Maximum delay ms |
 -----------------------------------------------------------------------------------
  ksoftirqd/8     | 0.071 ms | 2 | avg: 0.458 ms | max: 0.913 ms |
  at-spi-registry | 0.609 ms | 19 | avg: 0.013 ms | max: 0.023 ms |
  perf            | 3.316 ms | 16 | avg: 0.013 ms | max: 0.054 ms |
  Xorg            | 0.392 ms | 19 | avg: 0.011 ms | max: 0.018 ms |
  sleep           | 0.537 ms | 2 | avg: 0.009 ms | max: 0.009 ms |
 -----------------------------------------------------------------------------------
  TOTAL:          | 4.925 ms | 58 |
 ---------------------------------------------

Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Mike Galbraith <efault@gmx.de>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Frederic Weisbecker <fweisbec@gmail.com>
LKML-Reference: <new-submission>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'tools/perf/builtin-record.c')
-rw-r--r--tools/perf/builtin-record.c43
1 files changed, 26 insertions, 17 deletions
diff --git a/tools/perf/builtin-record.c b/tools/perf/builtin-record.c
index 79f99dba5be0..5f3127e7a615 100644
--- a/tools/perf/builtin-record.c
+++ b/tools/perf/builtin-record.c
@@ -49,6 +49,7 @@ static int inherit_stat = 0;
49static int no_samples = 0; 49static int no_samples = 0;
50static int sample_address = 0; 50static int sample_address = 0;
51static int multiplex = 0; 51static int multiplex = 0;
52static int multiplex_fd = -1;
52 53
53static long samples; 54static long samples;
54static struct timeval last_read; 55static struct timeval last_read;
@@ -471,23 +472,29 @@ try_again:
471 */ 472 */
472 if (group && group_fd == -1) 473 if (group && group_fd == -1)
473 group_fd = fd[nr_cpu][counter]; 474 group_fd = fd[nr_cpu][counter];
475 if (multiplex && multiplex_fd == -1)
476 multiplex_fd = fd[nr_cpu][counter];
474 477
475 event_array[nr_poll].fd = fd[nr_cpu][counter]; 478 if (multiplex && fd[nr_cpu][counter] != multiplex_fd) {
476 event_array[nr_poll].events = POLLIN; 479 int ret;
477 nr_poll++;
478
479 mmap_array[nr_cpu][counter].counter = counter;
480 mmap_array[nr_cpu][counter].prev = 0;
481 mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1;
482 mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size,
483 PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter], 0);
484 if (mmap_array[nr_cpu][counter].base == MAP_FAILED) {
485 error("failed to mmap with %d (%s)\n", errno, strerror(errno));
486 exit(-1);
487 }
488 480
489 if (multiplex && fd[nr_cpu][counter] != group_fd) 481 ret = ioctl(fd[nr_cpu][counter], PERF_COUNTER_IOC_SET_OUTPUT, multiplex_fd);
490 ioctl(fd[nr_cpu][counter], PERF_COUNTER_IOC_SET_OUTPUT, group_fd); 482 assert(ret != -1);
483 } else {
484 event_array[nr_poll].fd = fd[nr_cpu][counter];
485 event_array[nr_poll].events = POLLIN;
486 nr_poll++;
487
488 mmap_array[nr_cpu][counter].counter = counter;
489 mmap_array[nr_cpu][counter].prev = 0;
490 mmap_array[nr_cpu][counter].mask = mmap_pages*page_size - 1;
491 mmap_array[nr_cpu][counter].base = mmap(NULL, (mmap_pages+1)*page_size,
492 PROT_READ|PROT_WRITE, MAP_SHARED, fd[nr_cpu][counter], 0);
493 if (mmap_array[nr_cpu][counter].base == MAP_FAILED) {
494 error("failed to mmap with %d (%s)\n", errno, strerror(errno));
495 exit(-1);
496 }
497 }
491 498
492 ioctl(fd[nr_cpu][counter], PERF_COUNTER_IOC_ENABLE); 499 ioctl(fd[nr_cpu][counter], PERF_COUNTER_IOC_ENABLE);
493} 500}
@@ -618,8 +625,10 @@ static int __cmd_record(int argc, const char **argv)
618 int hits = samples; 625 int hits = samples;
619 626
620 for (i = 0; i < nr_cpu; i++) { 627 for (i = 0; i < nr_cpu; i++) {
621 for (counter = 0; counter < nr_counters; counter++) 628 for (counter = 0; counter < nr_counters; counter++) {
622 mmap_read(&mmap_array[i][counter]); 629 if (mmap_array[i][counter].base)
630 mmap_read(&mmap_array[i][counter]);
631 }
623 } 632 }
624 633
625 if (hits == samples) { 634 if (hits == samples) {