diff options
author | sukadev@linux.vnet.ibm.com <sukadev@linux.vnet.ibm.com> | 2012-09-18 16:56:11 -0400 |
---|---|---|
committer | Benjamin Herrenschmidt <benh@kernel.crashing.org> | 2012-09-26 22:51:05 -0400 |
commit | e6878835ac4794f25385522d29c634b7bbb7cca9 (patch) | |
tree | 31abcefb32c9388588b176bbca8709d97c5d3559 /arch/powerpc/perf | |
parent | e8294de53bb788b3a6f7c09d143c7cdc60b65753 (diff) |
powerpc/perf: Sample only if SIAR-Valid bit is set in P7+
powerpc/perf: Sample only if SIAR-Valid bit is set in P7+
On POWER7+ two new bits (mmcra[35] and mmcra[36]) indicate whether the
contents of SIAR and SDAR are valid.
For marked instructions on P7+, we must save the contents of SIAR and
SDAR registers only if these new bits are set.
This code/check for the SIAR-Valid bit is specific to P7+, so rather than
waste a CPU-feature bit use the PVR flag.
Note that Carl Love proposed a similar change for oprofile:
https://lkml.org/lkml/2012/6/22/309
Signed-off-by: Sukadev Bhattiprolu <sukadev@linux.vnet.ibm.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
Diffstat (limited to 'arch/powerpc/perf')
-rw-r--r-- | arch/powerpc/perf/core-book3s.c | 44 | ||||
-rw-r--r-- | arch/powerpc/perf/power7-pmu.c | 3 |
2 files changed, 41 insertions, 6 deletions
diff --git a/arch/powerpc/perf/core-book3s.c b/arch/powerpc/perf/core-book3s.c index fb55da91aa45..0db88f501f91 100644 --- a/arch/powerpc/perf/core-book3s.c +++ b/arch/powerpc/perf/core-book3s.c | |||
@@ -82,6 +82,11 @@ static inline int perf_intr_is_nmi(struct pt_regs *regs) | |||
82 | return 0; | 82 | return 0; |
83 | } | 83 | } |
84 | 84 | ||
85 | static inline int siar_valid(struct pt_regs *regs) | ||
86 | { | ||
87 | return 1; | ||
88 | } | ||
89 | |||
85 | #endif /* CONFIG_PPC32 */ | 90 | #endif /* CONFIG_PPC32 */ |
86 | 91 | ||
87 | /* | 92 | /* |
@@ -106,14 +111,20 @@ static inline unsigned long perf_ip_adjust(struct pt_regs *regs) | |||
106 | * If we're not doing instruction sampling, give them the SDAR | 111 | * If we're not doing instruction sampling, give them the SDAR |
107 | * (sampled data address). If we are doing instruction sampling, then | 112 | * (sampled data address). If we are doing instruction sampling, then |
108 | * only give them the SDAR if it corresponds to the instruction | 113 | * only give them the SDAR if it corresponds to the instruction |
109 | * pointed to by SIAR; this is indicated by the [POWER6_]MMCRA_SDSYNC | 114 | * pointed to by SIAR; this is indicated by the [POWER6_]MMCRA_SDSYNC or |
110 | * bit in MMCRA. | 115 | * the [POWER7P_]MMCRA_SDAR_VALID bit in MMCRA. |
111 | */ | 116 | */ |
112 | static inline void perf_get_data_addr(struct pt_regs *regs, u64 *addrp) | 117 | static inline void perf_get_data_addr(struct pt_regs *regs, u64 *addrp) |
113 | { | 118 | { |
114 | unsigned long mmcra = regs->dsisr; | 119 | unsigned long mmcra = regs->dsisr; |
115 | unsigned long sdsync = (ppmu->flags & PPMU_ALT_SIPR) ? | 120 | unsigned long sdsync; |
116 | POWER6_MMCRA_SDSYNC : MMCRA_SDSYNC; | 121 | |
122 | if (ppmu->flags & PPMU_SIAR_VALID) | ||
123 | sdsync = POWER7P_MMCRA_SDAR_VALID; | ||
124 | else if (ppmu->flags & PPMU_ALT_SIPR) | ||
125 | sdsync = POWER6_MMCRA_SDSYNC; | ||
126 | else | ||
127 | sdsync = MMCRA_SDSYNC; | ||
117 | 128 | ||
118 | if (!(mmcra & MMCRA_SAMPLE_ENABLE) || (mmcra & sdsync)) | 129 | if (!(mmcra & MMCRA_SAMPLE_ENABLE) || (mmcra & sdsync)) |
119 | *addrp = mfspr(SPRN_SDAR); | 130 | *addrp = mfspr(SPRN_SDAR); |
@@ -230,6 +241,24 @@ static inline int perf_intr_is_nmi(struct pt_regs *regs) | |||
230 | return !regs->softe; | 241 | return !regs->softe; |
231 | } | 242 | } |
232 | 243 | ||
244 | /* | ||
245 | * On processors like P7+ that have the SIAR-Valid bit, marked instructions | ||
246 | * must be sampled only if the SIAR-valid bit is set. | ||
247 | * | ||
248 | * For unmarked instructions and for processors that don't have the SIAR-Valid | ||
249 | * bit, assume that SIAR is valid. | ||
250 | */ | ||
251 | static inline int siar_valid(struct pt_regs *regs) | ||
252 | { | ||
253 | unsigned long mmcra = regs->dsisr; | ||
254 | int marked = mmcra & MMCRA_SAMPLE_ENABLE; | ||
255 | |||
256 | if ((ppmu->flags & PPMU_SIAR_VALID) && marked) | ||
257 | return mmcra & POWER7P_MMCRA_SIAR_VALID; | ||
258 | |||
259 | return 1; | ||
260 | } | ||
261 | |||
233 | #endif /* CONFIG_PPC64 */ | 262 | #endif /* CONFIG_PPC64 */ |
234 | 263 | ||
235 | static void perf_event_interrupt(struct pt_regs *regs); | 264 | static void perf_event_interrupt(struct pt_regs *regs); |
@@ -1291,6 +1320,7 @@ struct pmu power_pmu = { | |||
1291 | .event_idx = power_pmu_event_idx, | 1320 | .event_idx = power_pmu_event_idx, |
1292 | }; | 1321 | }; |
1293 | 1322 | ||
1323 | |||
1294 | /* | 1324 | /* |
1295 | * A counter has overflowed; update its count and record | 1325 | * A counter has overflowed; update its count and record |
1296 | * things if requested. Note that interrupts are hard-disabled | 1326 | * things if requested. Note that interrupts are hard-disabled |
@@ -1324,7 +1354,7 @@ static void record_and_restart(struct perf_event *event, unsigned long val, | |||
1324 | left += period; | 1354 | left += period; |
1325 | if (left <= 0) | 1355 | if (left <= 0) |
1326 | left = period; | 1356 | left = period; |
1327 | record = 1; | 1357 | record = siar_valid(regs); |
1328 | event->hw.last_period = event->hw.sample_period; | 1358 | event->hw.last_period = event->hw.sample_period; |
1329 | } | 1359 | } |
1330 | if (left < 0x80000000LL) | 1360 | if (left < 0x80000000LL) |
@@ -1374,8 +1404,10 @@ unsigned long perf_instruction_pointer(struct pt_regs *regs) | |||
1374 | { | 1404 | { |
1375 | unsigned long use_siar = regs->result; | 1405 | unsigned long use_siar = regs->result; |
1376 | 1406 | ||
1377 | if (use_siar) | 1407 | if (use_siar && siar_valid(regs)) |
1378 | return mfspr(SPRN_SIAR) + perf_ip_adjust(regs); | 1408 | return mfspr(SPRN_SIAR) + perf_ip_adjust(regs); |
1409 | else if (use_siar) | ||
1410 | return 0; // no valid instruction pointer | ||
1379 | else | 1411 | else |
1380 | return regs->nip; | 1412 | return regs->nip; |
1381 | } | 1413 | } |
diff --git a/arch/powerpc/perf/power7-pmu.c b/arch/powerpc/perf/power7-pmu.c index 1251e4d7e262..441af08edf43 100644 --- a/arch/powerpc/perf/power7-pmu.c +++ b/arch/powerpc/perf/power7-pmu.c | |||
@@ -373,6 +373,9 @@ static int __init init_power7_pmu(void) | |||
373 | strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc64/power7")) | 373 | strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc64/power7")) |
374 | return -ENODEV; | 374 | return -ENODEV; |
375 | 375 | ||
376 | if (pvr_version_is(PVR_POWER7p)) | ||
377 | power7_pmu.flags |= PPMU_SIAR_VALID; | ||
378 | |||
376 | return register_power_pmu(&power7_pmu); | 379 | return register_power_pmu(&power7_pmu); |
377 | } | 380 | } |
378 | 381 | ||