aboutsummaryrefslogtreecommitdiffstats
path: root/arch/powerpc/kernel/perf_counter.c
diff options
context:
space:
mode:
authorPaul Mackerras <paulus@samba.org>2009-03-23 13:22:08 -0400
committerIngo Molnar <mingo@elte.hu>2009-04-06 03:30:26 -0400
commit37d81828385f8ff823caaaf1a83e72d065b6cfa1 (patch)
tree972900a193a6a5ab1bdc14adcd7ab72bf0a51c13 /arch/powerpc/kernel/perf_counter.c
parent96f6d4444302bb2ea2cf409529eef816462f6ce0 (diff)
perf_counter: add an mmap method to allow userspace to read hardware counters
Impact: new feature giving performance improvement This adds the ability for userspace to do an mmap on a hardware counter fd and get access to a read-only page that contains the information needed to translate a hardware counter value to the full 64-bit counter value that would be returned by a read on the fd. This is useful on architectures that allow user programs to read the hardware counters, such as PowerPC. The mmap will only succeed if the counter is a hardware counter monitoring the current process. On my quad 2.5GHz PowerPC 970MP machine, userspace can read a counter and translate it to the full 64-bit value in about 30ns using the mmapped page, compared to about 830ns for the read syscall on the counter, so this does give a significant performance improvement. Signed-off-by: Paul Mackerras <paulus@samba.org> Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl> Orig-LKML-Reference: <20090323172417.297057964@chello.nl> Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'arch/powerpc/kernel/perf_counter.c')
-rw-r--r--arch/powerpc/kernel/perf_counter.c6
1 files changed, 6 insertions, 0 deletions
diff --git a/arch/powerpc/kernel/perf_counter.c b/arch/powerpc/kernel/perf_counter.c
index d05651584d43..e4349281b07d 100644
--- a/arch/powerpc/kernel/perf_counter.c
+++ b/arch/powerpc/kernel/perf_counter.c
@@ -417,6 +417,8 @@ void hw_perf_restore(u64 disable)
417 atomic64_set(&counter->hw.prev_count, val); 417 atomic64_set(&counter->hw.prev_count, val);
418 counter->hw.idx = hwc_index[i] + 1; 418 counter->hw.idx = hwc_index[i] + 1;
419 write_pmc(counter->hw.idx, val); 419 write_pmc(counter->hw.idx, val);
420 if (counter->user_page)
421 perf_counter_update_userpage(counter);
420 } 422 }
421 mb(); 423 mb();
422 cpuhw->mmcr[0] |= MMCR0_PMXE | MMCR0_FCECE; 424 cpuhw->mmcr[0] |= MMCR0_PMXE | MMCR0_FCECE;
@@ -572,6 +574,8 @@ static void power_perf_disable(struct perf_counter *counter)
572 ppmu->disable_pmc(counter->hw.idx - 1, cpuhw->mmcr); 574 ppmu->disable_pmc(counter->hw.idx - 1, cpuhw->mmcr);
573 write_pmc(counter->hw.idx, 0); 575 write_pmc(counter->hw.idx, 0);
574 counter->hw.idx = 0; 576 counter->hw.idx = 0;
577 if (counter->user_page)
578 perf_counter_update_userpage(counter);
575 break; 579 break;
576 } 580 }
577 } 581 }
@@ -698,6 +702,8 @@ static void record_and_restart(struct perf_counter *counter, long val,
698 write_pmc(counter->hw.idx, val); 702 write_pmc(counter->hw.idx, val);
699 atomic64_set(&counter->hw.prev_count, val); 703 atomic64_set(&counter->hw.prev_count, val);
700 atomic64_set(&counter->hw.period_left, left); 704 atomic64_set(&counter->hw.period_left, left);
705 if (counter->user_page)
706 perf_counter_update_userpage(counter);
701 707
702 /* 708 /*
703 * Finally record data if requested. 709 * Finally record data if requested.