diff options
author | Paul Mackerras <paulus@samba.org> | 2009-03-23 13:22:08 -0400 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2009-04-06 03:30:26 -0400 |
commit | 37d81828385f8ff823caaaf1a83e72d065b6cfa1 (patch) | |
tree | 972900a193a6a5ab1bdc14adcd7ab72bf0a51c13 /arch/powerpc/kernel/perf_counter.c | |
parent | 96f6d4444302bb2ea2cf409529eef816462f6ce0 (diff) |
perf_counter: add an mmap method to allow userspace to read hardware counters
Impact: new feature giving performance improvement
This adds the ability for userspace to do an mmap on a hardware counter
fd and get access to a read-only page that contains the information
needed to translate a hardware counter value to the full 64-bit
counter value that would be returned by a read on the fd. This is
useful on architectures that allow user programs to read the hardware
counters, such as PowerPC.
The mmap will only succeed if the counter is a hardware counter
monitoring the current process.
On my quad 2.5GHz PowerPC 970MP machine, userspace can read a counter
and translate it to the full 64-bit value in about 30ns using the
mmapped page, compared to about 830ns for the read syscall on the
counter, so this does give a significant performance improvement.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Orig-LKML-Reference: <20090323172417.297057964@chello.nl>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'arch/powerpc/kernel/perf_counter.c')
-rw-r--r-- | arch/powerpc/kernel/perf_counter.c | 6 |
1 files changed, 6 insertions, 0 deletions
diff --git a/arch/powerpc/kernel/perf_counter.c b/arch/powerpc/kernel/perf_counter.c index d05651584d43..e4349281b07d 100644 --- a/arch/powerpc/kernel/perf_counter.c +++ b/arch/powerpc/kernel/perf_counter.c | |||
@@ -417,6 +417,8 @@ void hw_perf_restore(u64 disable) | |||
417 | atomic64_set(&counter->hw.prev_count, val); | 417 | atomic64_set(&counter->hw.prev_count, val); |
418 | counter->hw.idx = hwc_index[i] + 1; | 418 | counter->hw.idx = hwc_index[i] + 1; |
419 | write_pmc(counter->hw.idx, val); | 419 | write_pmc(counter->hw.idx, val); |
420 | if (counter->user_page) | ||
421 | perf_counter_update_userpage(counter); | ||
420 | } | 422 | } |
421 | mb(); | 423 | mb(); |
422 | cpuhw->mmcr[0] |= MMCR0_PMXE | MMCR0_FCECE; | 424 | cpuhw->mmcr[0] |= MMCR0_PMXE | MMCR0_FCECE; |
@@ -572,6 +574,8 @@ static void power_perf_disable(struct perf_counter *counter) | |||
572 | ppmu->disable_pmc(counter->hw.idx - 1, cpuhw->mmcr); | 574 | ppmu->disable_pmc(counter->hw.idx - 1, cpuhw->mmcr); |
573 | write_pmc(counter->hw.idx, 0); | 575 | write_pmc(counter->hw.idx, 0); |
574 | counter->hw.idx = 0; | 576 | counter->hw.idx = 0; |
577 | if (counter->user_page) | ||
578 | perf_counter_update_userpage(counter); | ||
575 | break; | 579 | break; |
576 | } | 580 | } |
577 | } | 581 | } |
@@ -698,6 +702,8 @@ static void record_and_restart(struct perf_counter *counter, long val, | |||
698 | write_pmc(counter->hw.idx, val); | 702 | write_pmc(counter->hw.idx, val); |
699 | atomic64_set(&counter->hw.prev_count, val); | 703 | atomic64_set(&counter->hw.prev_count, val); |
700 | atomic64_set(&counter->hw.period_left, left); | 704 | atomic64_set(&counter->hw.period_left, left); |
705 | if (counter->user_page) | ||
706 | perf_counter_update_userpage(counter); | ||
701 | 707 | ||
702 | /* | 708 | /* |
703 | * Finally record data if requested. | 709 | * Finally record data if requested. |