diff options
-rw-r--r-- | arch/powerpc/include/asm/perf_event.h | 109 | ||||
-rw-r--r-- | arch/powerpc/include/asm/perf_event_fsl_emb.h | 50 | ||||
-rw-r--r-- | arch/powerpc/include/asm/perf_event_server.h | 110 | ||||
-rw-r--r-- | arch/powerpc/include/asm/reg_fsl_emb.h | 2 | ||||
-rw-r--r-- | arch/powerpc/kernel/Makefile | 4 | ||||
-rw-r--r-- | arch/powerpc/kernel/cputable.c | 2 | ||||
-rw-r--r-- | arch/powerpc/kernel/e500-pmu.c | 129 | ||||
-rw-r--r-- | arch/powerpc/kernel/perf_event_fsl_emb.c | 654 | ||||
-rw-r--r-- | arch/powerpc/platforms/Kconfig.cputype | 10 |
9 files changed, 970 insertions, 100 deletions
diff --git a/arch/powerpc/include/asm/perf_event.h b/arch/powerpc/include/asm/perf_event.h index 3288ce3997e0..e6d4ce69b126 100644 --- a/arch/powerpc/include/asm/perf_event.h +++ b/arch/powerpc/include/asm/perf_event.h | |||
@@ -1,110 +1,23 @@ | |||
1 | /* | 1 | /* |
2 | * Performance event support - PowerPC-specific definitions. | 2 | * Performance event support - hardware-specific disambiguation |
3 | * | 3 | * |
4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | 4 | * For now this is a compile-time decision, but eventually it should be |
5 | * runtime. This would allow multiplatform perf event support for e300 (fsl | ||
6 | * embedded perf counters) plus server/classic, and would accommodate | ||
7 | * devices other than the core which provide their own performance counters. | ||
8 | * | ||
9 | * Copyright 2010 Freescale Semiconductor, Inc. | ||
5 | * | 10 | * |
6 | * This program is free software; you can redistribute it and/or | 11 | * This program is free software; you can redistribute it and/or |
7 | * modify it under the terms of the GNU General Public License | 12 | * modify it under the terms of the GNU General Public License |
8 | * as published by the Free Software Foundation; either version | 13 | * as published by the Free Software Foundation; either version |
9 | * 2 of the License, or (at your option) any later version. | 14 | * 2 of the License, or (at your option) any later version. |
10 | */ | 15 | */ |
11 | #include <linux/types.h> | ||
12 | |||
13 | #include <asm/hw_irq.h> | ||
14 | |||
15 | #define MAX_HWEVENTS 8 | ||
16 | #define MAX_EVENT_ALTERNATIVES 8 | ||
17 | #define MAX_LIMITED_HWCOUNTERS 2 | ||
18 | |||
19 | /* | ||
20 | * This struct provides the constants and functions needed to | ||
21 | * describe the PMU on a particular POWER-family CPU. | ||
22 | */ | ||
23 | struct power_pmu { | ||
24 | const char *name; | ||
25 | int n_counter; | ||
26 | int max_alternatives; | ||
27 | unsigned long add_fields; | ||
28 | unsigned long test_adder; | ||
29 | int (*compute_mmcr)(u64 events[], int n_ev, | ||
30 | unsigned int hwc[], unsigned long mmcr[]); | ||
31 | int (*get_constraint)(u64 event_id, unsigned long *mskp, | ||
32 | unsigned long *valp); | ||
33 | int (*get_alternatives)(u64 event_id, unsigned int flags, | ||
34 | u64 alt[]); | ||
35 | void (*disable_pmc)(unsigned int pmc, unsigned long mmcr[]); | ||
36 | int (*limited_pmc_event)(u64 event_id); | ||
37 | u32 flags; | ||
38 | int n_generic; | ||
39 | int *generic_events; | ||
40 | int (*cache_events)[PERF_COUNT_HW_CACHE_MAX] | ||
41 | [PERF_COUNT_HW_CACHE_OP_MAX] | ||
42 | [PERF_COUNT_HW_CACHE_RESULT_MAX]; | ||
43 | }; | ||
44 | |||
45 | /* | ||
46 | * Values for power_pmu.flags | ||
47 | */ | ||
48 | #define PPMU_LIMITED_PMC5_6 1 /* PMC5/6 have limited function */ | ||
49 | #define PPMU_ALT_SIPR 2 /* uses alternate posn for SIPR/HV */ | ||
50 | |||
51 | /* | ||
52 | * Values for flags to get_alternatives() | ||
53 | */ | ||
54 | #define PPMU_LIMITED_PMC_OK 1 /* can put this on a limited PMC */ | ||
55 | #define PPMU_LIMITED_PMC_REQD 2 /* have to put this on a limited PMC */ | ||
56 | #define PPMU_ONLY_COUNT_RUN 4 /* only counting in run state */ | ||
57 | |||
58 | extern int register_power_pmu(struct power_pmu *); | ||
59 | 16 | ||
60 | struct pt_regs; | ||
61 | extern unsigned long perf_misc_flags(struct pt_regs *regs); | ||
62 | extern unsigned long perf_instruction_pointer(struct pt_regs *regs); | ||
63 | |||
64 | #define PERF_EVENT_INDEX_OFFSET 1 | ||
65 | |||
66 | /* | ||
67 | * Only override the default definitions in include/linux/perf_event.h | ||
68 | * if we have hardware PMU support. | ||
69 | */ | ||
70 | #ifdef CONFIG_PPC_PERF_CTRS | 17 | #ifdef CONFIG_PPC_PERF_CTRS |
71 | #define perf_misc_flags(regs) perf_misc_flags(regs) | 18 | #include <asm/perf_event_server.h> |
72 | #endif | 19 | #endif |
73 | 20 | ||
74 | /* | 21 | #ifdef CONFIG_FSL_EMB_PERF_EVENT |
75 | * The power_pmu.get_constraint function returns a 32/64-bit value and | 22 | #include <asm/perf_event_fsl_emb.h> |
76 | * a 32/64-bit mask that express the constraints between this event_id and | 23 | #endif |
77 | * other events. | ||
78 | * | ||
79 | * The value and mask are divided up into (non-overlapping) bitfields | ||
80 | * of three different types: | ||
81 | * | ||
82 | * Select field: this expresses the constraint that some set of bits | ||
83 | * in MMCR* needs to be set to a specific value for this event_id. For a | ||
84 | * select field, the mask contains 1s in every bit of the field, and | ||
85 | * the value contains a unique value for each possible setting of the | ||
86 | * MMCR* bits. The constraint checking code will ensure that two events | ||
87 | * that set the same field in their masks have the same value in their | ||
88 | * value dwords. | ||
89 | * | ||
90 | * Add field: this expresses the constraint that there can be at most | ||
91 | * N events in a particular class. A field of k bits can be used for | ||
92 | * N <= 2^(k-1) - 1. The mask has the most significant bit of the field | ||
93 | * set (and the other bits 0), and the value has only the least significant | ||
94 | * bit of the field set. In addition, the 'add_fields' and 'test_adder' | ||
95 | * in the struct power_pmu for this processor come into play. The | ||
96 | * add_fields value contains 1 in the LSB of the field, and the | ||
97 | * test_adder contains 2^(k-1) - 1 - N in the field. | ||
98 | * | ||
99 | * NAND field: this expresses the constraint that you may not have events | ||
100 | * in all of a set of classes. (For example, on PPC970, you can't select | ||
101 | * events from the FPU, ISU and IDU simultaneously, although any two are | ||
102 | * possible.) For N classes, the field is N+1 bits wide, and each class | ||
103 | * is assigned one bit from the least-significant N bits. The mask has | ||
104 | * only the most-significant bit set, and the value has only the bit | ||
105 | * for the event_id's class set. The test_adder has the least significant | ||
106 | * bit set in the field. | ||
107 | * | ||
108 | * If an event_id is not subject to the constraint expressed by a particular | ||
109 | * field, then it will have 0 in both the mask and value for that field. | ||
110 | */ | ||
diff --git a/arch/powerpc/include/asm/perf_event_fsl_emb.h b/arch/powerpc/include/asm/perf_event_fsl_emb.h new file mode 100644 index 000000000000..718a9fa94e68 --- /dev/null +++ b/arch/powerpc/include/asm/perf_event_fsl_emb.h | |||
@@ -0,0 +1,50 @@ | |||
1 | /* | ||
2 | * Performance event support - Freescale embedded specific definitions. | ||
3 | * | ||
4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | ||
5 | * Copyright 2010 Freescale Semiconductor, Inc. | ||
6 | * | ||
7 | * This program is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU General Public License | ||
9 | * as published by the Free Software Foundation; either version | ||
10 | * 2 of the License, or (at your option) any later version. | ||
11 | */ | ||
12 | |||
13 | #include <linux/types.h> | ||
14 | #include <asm/hw_irq.h> | ||
15 | |||
16 | #define MAX_HWEVENTS 4 | ||
17 | |||
18 | /* event flags */ | ||
19 | #define FSL_EMB_EVENT_VALID 1 | ||
20 | #define FSL_EMB_EVENT_RESTRICTED 2 | ||
21 | |||
22 | /* upper half of event flags is PMLCb */ | ||
23 | #define FSL_EMB_EVENT_THRESHMUL 0x0000070000000000ULL | ||
24 | #define FSL_EMB_EVENT_THRESH 0x0000003f00000000ULL | ||
25 | |||
26 | struct fsl_emb_pmu { | ||
27 | const char *name; | ||
28 | int n_counter; /* total number of counters */ | ||
29 | |||
30 | /* | ||
31 | * The number of contiguous counters starting at zero that | ||
32 | * can hold restricted events, or zero if there are no | ||
33 | * restricted events. | ||
34 | * | ||
35 | * This isn't a very flexible method of expressing constraints, | ||
36 | * but it's very simple and is adequate for existing chips. | ||
37 | */ | ||
38 | int n_restricted; | ||
39 | |||
40 | /* Returns event flags and PMLCb (FSL_EMB_EVENT_*) */ | ||
41 | u64 (*xlate_event)(u64 event_id); | ||
42 | |||
43 | int n_generic; | ||
44 | int *generic_events; | ||
45 | int (*cache_events)[PERF_COUNT_HW_CACHE_MAX] | ||
46 | [PERF_COUNT_HW_CACHE_OP_MAX] | ||
47 | [PERF_COUNT_HW_CACHE_RESULT_MAX]; | ||
48 | }; | ||
49 | |||
50 | int register_fsl_emb_pmu(struct fsl_emb_pmu *); | ||
diff --git a/arch/powerpc/include/asm/perf_event_server.h b/arch/powerpc/include/asm/perf_event_server.h new file mode 100644 index 000000000000..8f1df1208d23 --- /dev/null +++ b/arch/powerpc/include/asm/perf_event_server.h | |||
@@ -0,0 +1,110 @@ | |||
1 | /* | ||
2 | * Performance event support - PowerPC classic/server specific definitions. | ||
3 | * | ||
4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | ||
5 | * | ||
6 | * This program is free software; you can redistribute it and/or | ||
7 | * modify it under the terms of the GNU General Public License | ||
8 | * as published by the Free Software Foundation; either version | ||
9 | * 2 of the License, or (at your option) any later version. | ||
10 | */ | ||
11 | |||
12 | #include <linux/types.h> | ||
13 | #include <asm/hw_irq.h> | ||
14 | |||
15 | #define MAX_HWEVENTS 8 | ||
16 | #define MAX_EVENT_ALTERNATIVES 8 | ||
17 | #define MAX_LIMITED_HWCOUNTERS 2 | ||
18 | |||
19 | /* | ||
20 | * This struct provides the constants and functions needed to | ||
21 | * describe the PMU on a particular POWER-family CPU. | ||
22 | */ | ||
23 | struct power_pmu { | ||
24 | const char *name; | ||
25 | int n_counter; | ||
26 | int max_alternatives; | ||
27 | unsigned long add_fields; | ||
28 | unsigned long test_adder; | ||
29 | int (*compute_mmcr)(u64 events[], int n_ev, | ||
30 | unsigned int hwc[], unsigned long mmcr[]); | ||
31 | int (*get_constraint)(u64 event_id, unsigned long *mskp, | ||
32 | unsigned long *valp); | ||
33 | int (*get_alternatives)(u64 event_id, unsigned int flags, | ||
34 | u64 alt[]); | ||
35 | void (*disable_pmc)(unsigned int pmc, unsigned long mmcr[]); | ||
36 | int (*limited_pmc_event)(u64 event_id); | ||
37 | u32 flags; | ||
38 | int n_generic; | ||
39 | int *generic_events; | ||
40 | int (*cache_events)[PERF_COUNT_HW_CACHE_MAX] | ||
41 | [PERF_COUNT_HW_CACHE_OP_MAX] | ||
42 | [PERF_COUNT_HW_CACHE_RESULT_MAX]; | ||
43 | }; | ||
44 | |||
45 | /* | ||
46 | * Values for power_pmu.flags | ||
47 | */ | ||
48 | #define PPMU_LIMITED_PMC5_6 1 /* PMC5/6 have limited function */ | ||
49 | #define PPMU_ALT_SIPR 2 /* uses alternate posn for SIPR/HV */ | ||
50 | |||
51 | /* | ||
52 | * Values for flags to get_alternatives() | ||
53 | */ | ||
54 | #define PPMU_LIMITED_PMC_OK 1 /* can put this on a limited PMC */ | ||
55 | #define PPMU_LIMITED_PMC_REQD 2 /* have to put this on a limited PMC */ | ||
56 | #define PPMU_ONLY_COUNT_RUN 4 /* only counting in run state */ | ||
57 | |||
58 | extern int register_power_pmu(struct power_pmu *); | ||
59 | |||
60 | struct pt_regs; | ||
61 | extern unsigned long perf_misc_flags(struct pt_regs *regs); | ||
62 | extern unsigned long perf_instruction_pointer(struct pt_regs *regs); | ||
63 | |||
64 | #define PERF_EVENT_INDEX_OFFSET 1 | ||
65 | |||
66 | /* | ||
67 | * Only override the default definitions in include/linux/perf_event.h | ||
68 | * if we have hardware PMU support. | ||
69 | */ | ||
70 | #ifdef CONFIG_PPC_PERF_CTRS | ||
71 | #define perf_misc_flags(regs) perf_misc_flags(regs) | ||
72 | #endif | ||
73 | |||
74 | /* | ||
75 | * The power_pmu.get_constraint function returns a 32/64-bit value and | ||
76 | * a 32/64-bit mask that express the constraints between this event_id and | ||
77 | * other events. | ||
78 | * | ||
79 | * The value and mask are divided up into (non-overlapping) bitfields | ||
80 | * of three different types: | ||
81 | * | ||
82 | * Select field: this expresses the constraint that some set of bits | ||
83 | * in MMCR* needs to be set to a specific value for this event_id. For a | ||
84 | * select field, the mask contains 1s in every bit of the field, and | ||
85 | * the value contains a unique value for each possible setting of the | ||
86 | * MMCR* bits. The constraint checking code will ensure that two events | ||
87 | * that set the same field in their masks have the same value in their | ||
88 | * value dwords. | ||
89 | * | ||
90 | * Add field: this expresses the constraint that there can be at most | ||
91 | * N events in a particular class. A field of k bits can be used for | ||
92 | * N <= 2^(k-1) - 1. The mask has the most significant bit of the field | ||
93 | * set (and the other bits 0), and the value has only the least significant | ||
94 | * bit of the field set. In addition, the 'add_fields' and 'test_adder' | ||
95 | * in the struct power_pmu for this processor come into play. The | ||
96 | * add_fields value contains 1 in the LSB of the field, and the | ||
97 | * test_adder contains 2^(k-1) - 1 - N in the field. | ||
98 | * | ||
99 | * NAND field: this expresses the constraint that you may not have events | ||
100 | * in all of a set of classes. (For example, on PPC970, you can't select | ||
101 | * events from the FPU, ISU and IDU simultaneously, although any two are | ||
102 | * possible.) For N classes, the field is N+1 bits wide, and each class | ||
103 | * is assigned one bit from the least-significant N bits. The mask has | ||
104 | * only the most-significant bit set, and the value has only the bit | ||
105 | * for the event_id's class set. The test_adder has the least significant | ||
106 | * bit set in the field. | ||
107 | * | ||
108 | * If an event_id is not subject to the constraint expressed by a particular | ||
109 | * field, then it will have 0 in both the mask and value for that field. | ||
110 | */ | ||
diff --git a/arch/powerpc/include/asm/reg_fsl_emb.h b/arch/powerpc/include/asm/reg_fsl_emb.h index 0de404dfee8b..77bb71cfd991 100644 --- a/arch/powerpc/include/asm/reg_fsl_emb.h +++ b/arch/powerpc/include/asm/reg_fsl_emb.h | |||
@@ -31,7 +31,7 @@ | |||
31 | #define PMLCA_FCM0 0x08000000 /* Freeze when PMM==0 */ | 31 | #define PMLCA_FCM0 0x08000000 /* Freeze when PMM==0 */ |
32 | #define PMLCA_CE 0x04000000 /* Condition Enable */ | 32 | #define PMLCA_CE 0x04000000 /* Condition Enable */ |
33 | 33 | ||
34 | #define PMLCA_EVENT_MASK 0x007f0000 /* Event field */ | 34 | #define PMLCA_EVENT_MASK 0x00ff0000 /* Event field */ |
35 | #define PMLCA_EVENT_SHIFT 16 | 35 | #define PMLCA_EVENT_SHIFT 16 |
36 | 36 | ||
37 | #define PMRN_PMLCB0 0x110 /* PM Local Control B0 */ | 37 | #define PMRN_PMLCB0 0x110 /* PM Local Control B0 */ |
diff --git a/arch/powerpc/kernel/Makefile b/arch/powerpc/kernel/Makefile index 93fd1629f10e..877326320e74 100644 --- a/arch/powerpc/kernel/Makefile +++ b/arch/powerpc/kernel/Makefile | |||
@@ -99,11 +99,15 @@ obj64-$(CONFIG_AUDIT) += compat_audit.o | |||
99 | obj-$(CONFIG_DYNAMIC_FTRACE) += ftrace.o | 99 | obj-$(CONFIG_DYNAMIC_FTRACE) += ftrace.o |
100 | obj-$(CONFIG_FUNCTION_GRAPH_TRACER) += ftrace.o | 100 | obj-$(CONFIG_FUNCTION_GRAPH_TRACER) += ftrace.o |
101 | obj-$(CONFIG_PERF_EVENTS) += perf_callchain.o | 101 | obj-$(CONFIG_PERF_EVENTS) += perf_callchain.o |
102 | |||
102 | obj-$(CONFIG_PPC_PERF_CTRS) += perf_event.o | 103 | obj-$(CONFIG_PPC_PERF_CTRS) += perf_event.o |
103 | obj64-$(CONFIG_PPC_PERF_CTRS) += power4-pmu.o ppc970-pmu.o power5-pmu.o \ | 104 | obj64-$(CONFIG_PPC_PERF_CTRS) += power4-pmu.o ppc970-pmu.o power5-pmu.o \ |
104 | power5+-pmu.o power6-pmu.o power7-pmu.o | 105 | power5+-pmu.o power6-pmu.o power7-pmu.o |
105 | obj32-$(CONFIG_PPC_PERF_CTRS) += mpc7450-pmu.o | 106 | obj32-$(CONFIG_PPC_PERF_CTRS) += mpc7450-pmu.o |
106 | 107 | ||
108 | obj-$(CONFIG_FSL_EMB_PERF_EVENT) += perf_event_fsl_emb.o | ||
109 | obj-$(CONFIG_FSL_EMB_PERF_EVENT_E500) += e500-pmu.o | ||
110 | |||
107 | obj-$(CONFIG_8XX_MINIMAL_FPEMU) += softemu8xx.o | 111 | obj-$(CONFIG_8XX_MINIMAL_FPEMU) += softemu8xx.o |
108 | 112 | ||
109 | ifneq ($(CONFIG_PPC_INDIRECT_IO),y) | 113 | ifneq ($(CONFIG_PPC_INDIRECT_IO),y) |
diff --git a/arch/powerpc/kernel/cputable.c b/arch/powerpc/kernel/cputable.c index 2fc82bac3bbc..8af4949434b2 100644 --- a/arch/powerpc/kernel/cputable.c +++ b/arch/powerpc/kernel/cputable.c | |||
@@ -1808,7 +1808,7 @@ static struct cpu_spec __initdata cpu_specs[] = { | |||
1808 | .icache_bsize = 64, | 1808 | .icache_bsize = 64, |
1809 | .dcache_bsize = 64, | 1809 | .dcache_bsize = 64, |
1810 | .num_pmcs = 4, | 1810 | .num_pmcs = 4, |
1811 | .oprofile_cpu_type = "ppc/e500", /* xxx - galak, e500mc? */ | 1811 | .oprofile_cpu_type = "ppc/e500mc", |
1812 | .oprofile_type = PPC_OPROFILE_FSL_EMB, | 1812 | .oprofile_type = PPC_OPROFILE_FSL_EMB, |
1813 | .cpu_setup = __setup_cpu_e500mc, | 1813 | .cpu_setup = __setup_cpu_e500mc, |
1814 | .machine_check = machine_check_e500, | 1814 | .machine_check = machine_check_e500, |
diff --git a/arch/powerpc/kernel/e500-pmu.c b/arch/powerpc/kernel/e500-pmu.c new file mode 100644 index 000000000000..7c07de0d8943 --- /dev/null +++ b/arch/powerpc/kernel/e500-pmu.c | |||
@@ -0,0 +1,129 @@ | |||
1 | /* | ||
2 | * Performance counter support for e500 family processors. | ||
3 | * | ||
4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | ||
5 | * Copyright 2010 Freescale Semiconductor, Inc. | ||
6 | * | ||
7 | * This program is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU General Public License | ||
9 | * as published by the Free Software Foundation; either version | ||
10 | * 2 of the License, or (at your option) any later version. | ||
11 | */ | ||
12 | #include <linux/string.h> | ||
13 | #include <linux/perf_event.h> | ||
14 | #include <asm/reg.h> | ||
15 | #include <asm/cputable.h> | ||
16 | |||
17 | /* | ||
18 | * Map of generic hardware event types to hardware events | ||
19 | * Zero if unsupported | ||
20 | */ | ||
21 | static int e500_generic_events[] = { | ||
22 | [PERF_COUNT_HW_CPU_CYCLES] = 1, | ||
23 | [PERF_COUNT_HW_INSTRUCTIONS] = 2, | ||
24 | [PERF_COUNT_HW_CACHE_MISSES] = 41, /* Data L1 cache reloads */ | ||
25 | [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = 12, | ||
26 | [PERF_COUNT_HW_BRANCH_MISSES] = 15, | ||
27 | }; | ||
28 | |||
29 | #define C(x) PERF_COUNT_HW_CACHE_##x | ||
30 | |||
31 | /* | ||
32 | * Table of generalized cache-related events. | ||
33 | * 0 means not supported, -1 means nonsensical, other values | ||
34 | * are event codes. | ||
35 | */ | ||
36 | static int e500_cache_events[C(MAX)][C(OP_MAX)][C(RESULT_MAX)] = { | ||
37 | /* | ||
38 | * D-cache misses are not split into read/write/prefetch; | ||
39 | * use raw event 41. | ||
40 | */ | ||
41 | [C(L1D)] = { /* RESULT_ACCESS RESULT_MISS */ | ||
42 | [C(OP_READ)] = { 27, 0 }, | ||
43 | [C(OP_WRITE)] = { 28, 0 }, | ||
44 | [C(OP_PREFETCH)] = { 29, 0 }, | ||
45 | }, | ||
46 | [C(L1I)] = { /* RESULT_ACCESS RESULT_MISS */ | ||
47 | [C(OP_READ)] = { 2, 60 }, | ||
48 | [C(OP_WRITE)] = { -1, -1 }, | ||
49 | [C(OP_PREFETCH)] = { 0, 0 }, | ||
50 | }, | ||
51 | /* | ||
52 | * Assuming LL means L2, it's not a good match for this model. | ||
53 | * It allocates only on L1 castout or explicit prefetch, and | ||
54 | * does not have separate read/write events (but it does have | ||
55 | * separate instruction/data events). | ||
56 | */ | ||
57 | [C(LL)] = { /* RESULT_ACCESS RESULT_MISS */ | ||
58 | [C(OP_READ)] = { 0, 0 }, | ||
59 | [C(OP_WRITE)] = { 0, 0 }, | ||
60 | [C(OP_PREFETCH)] = { 0, 0 }, | ||
61 | }, | ||
62 | /* | ||
63 | * There are data/instruction MMU misses, but that's a miss on | ||
64 | * the chip's internal level-one TLB which is probably not | ||
65 | * what the user wants. Instead, unified level-two TLB misses | ||
66 | * are reported here. | ||
67 | */ | ||
68 | [C(DTLB)] = { /* RESULT_ACCESS RESULT_MISS */ | ||
69 | [C(OP_READ)] = { 26, 66 }, | ||
70 | [C(OP_WRITE)] = { -1, -1 }, | ||
71 | [C(OP_PREFETCH)] = { -1, -1 }, | ||
72 | }, | ||
73 | [C(BPU)] = { /* RESULT_ACCESS RESULT_MISS */ | ||
74 | [C(OP_READ)] = { 12, 15 }, | ||
75 | [C(OP_WRITE)] = { -1, -1 }, | ||
76 | [C(OP_PREFETCH)] = { -1, -1 }, | ||
77 | }, | ||
78 | }; | ||
79 | |||
80 | static int num_events = 128; | ||
81 | |||
82 | /* Upper half of event id is PMLCb, for threshold events */ | ||
83 | static u64 e500_xlate_event(u64 event_id) | ||
84 | { | ||
85 | u32 event_low = (u32)event_id; | ||
86 | u64 ret; | ||
87 | |||
88 | if (event_low >= num_events) | ||
89 | return 0; | ||
90 | |||
91 | ret = FSL_EMB_EVENT_VALID; | ||
92 | |||
93 | if (event_low >= 76 && event_low <= 81) { | ||
94 | ret |= FSL_EMB_EVENT_RESTRICTED; | ||
95 | ret |= event_id & | ||
96 | (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH); | ||
97 | } else if (event_id & | ||
98 | (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH)) { | ||
99 | /* Threshold requested on non-threshold event */ | ||
100 | return 0; | ||
101 | } | ||
102 | |||
103 | return ret; | ||
104 | } | ||
105 | |||
106 | static struct fsl_emb_pmu e500_pmu = { | ||
107 | .name = "e500 family", | ||
108 | .n_counter = 4, | ||
109 | .n_restricted = 2, | ||
110 | .xlate_event = e500_xlate_event, | ||
111 | .n_generic = ARRAY_SIZE(e500_generic_events), | ||
112 | .generic_events = e500_generic_events, | ||
113 | .cache_events = &e500_cache_events, | ||
114 | }; | ||
115 | |||
116 | static int init_e500_pmu(void) | ||
117 | { | ||
118 | if (!cur_cpu_spec->oprofile_cpu_type) | ||
119 | return -ENODEV; | ||
120 | |||
121 | if (!strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500mc")) | ||
122 | num_events = 256; | ||
123 | else if (strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e500")) | ||
124 | return -ENODEV; | ||
125 | |||
126 | return register_fsl_emb_pmu(&e500_pmu); | ||
127 | } | ||
128 | |||
129 | arch_initcall(init_e500_pmu); | ||
diff --git a/arch/powerpc/kernel/perf_event_fsl_emb.c b/arch/powerpc/kernel/perf_event_fsl_emb.c new file mode 100644 index 000000000000..369872f6cf78 --- /dev/null +++ b/arch/powerpc/kernel/perf_event_fsl_emb.c | |||
@@ -0,0 +1,654 @@ | |||
1 | /* | ||
2 | * Performance event support - Freescale Embedded Performance Monitor | ||
3 | * | ||
4 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | ||
5 | * Copyright 2010 Freescale Semiconductor, Inc. | ||
6 | * | ||
7 | * This program is free software; you can redistribute it and/or | ||
8 | * modify it under the terms of the GNU General Public License | ||
9 | * as published by the Free Software Foundation; either version | ||
10 | * 2 of the License, or (at your option) any later version. | ||
11 | */ | ||
12 | #include <linux/kernel.h> | ||
13 | #include <linux/sched.h> | ||
14 | #include <linux/perf_event.h> | ||
15 | #include <linux/percpu.h> | ||
16 | #include <linux/hardirq.h> | ||
17 | #include <asm/reg_fsl_emb.h> | ||
18 | #include <asm/pmc.h> | ||
19 | #include <asm/machdep.h> | ||
20 | #include <asm/firmware.h> | ||
21 | #include <asm/ptrace.h> | ||
22 | |||
23 | struct cpu_hw_events { | ||
24 | int n_events; | ||
25 | int disabled; | ||
26 | u8 pmcs_enabled; | ||
27 | struct perf_event *event[MAX_HWEVENTS]; | ||
28 | }; | ||
29 | static DEFINE_PER_CPU(struct cpu_hw_events, cpu_hw_events); | ||
30 | |||
31 | static struct fsl_emb_pmu *ppmu; | ||
32 | |||
33 | /* Number of perf_events counting hardware events */ | ||
34 | static atomic_t num_events; | ||
35 | /* Used to avoid races in calling reserve/release_pmc_hardware */ | ||
36 | static DEFINE_MUTEX(pmc_reserve_mutex); | ||
37 | |||
38 | /* | ||
39 | * If interrupts were soft-disabled when a PMU interrupt occurs, treat | ||
40 | * it as an NMI. | ||
41 | */ | ||
42 | static inline int perf_intr_is_nmi(struct pt_regs *regs) | ||
43 | { | ||
44 | #ifdef __powerpc64__ | ||
45 | return !regs->softe; | ||
46 | #else | ||
47 | return 0; | ||
48 | #endif | ||
49 | } | ||
50 | |||
51 | static void perf_event_interrupt(struct pt_regs *regs); | ||
52 | |||
53 | /* | ||
54 | * Read one performance monitor counter (PMC). | ||
55 | */ | ||
56 | static unsigned long read_pmc(int idx) | ||
57 | { | ||
58 | unsigned long val; | ||
59 | |||
60 | switch (idx) { | ||
61 | case 0: | ||
62 | val = mfpmr(PMRN_PMC0); | ||
63 | break; | ||
64 | case 1: | ||
65 | val = mfpmr(PMRN_PMC1); | ||
66 | break; | ||
67 | case 2: | ||
68 | val = mfpmr(PMRN_PMC2); | ||
69 | break; | ||
70 | case 3: | ||
71 | val = mfpmr(PMRN_PMC3); | ||
72 | break; | ||
73 | default: | ||
74 | printk(KERN_ERR "oops trying to read PMC%d\n", idx); | ||
75 | val = 0; | ||
76 | } | ||
77 | return val; | ||
78 | } | ||
79 | |||
80 | /* | ||
81 | * Write one PMC. | ||
82 | */ | ||
83 | static void write_pmc(int idx, unsigned long val) | ||
84 | { | ||
85 | switch (idx) { | ||
86 | case 0: | ||
87 | mtpmr(PMRN_PMC0, val); | ||
88 | break; | ||
89 | case 1: | ||
90 | mtpmr(PMRN_PMC1, val); | ||
91 | break; | ||
92 | case 2: | ||
93 | mtpmr(PMRN_PMC2, val); | ||
94 | break; | ||
95 | case 3: | ||
96 | mtpmr(PMRN_PMC3, val); | ||
97 | break; | ||
98 | default: | ||
99 | printk(KERN_ERR "oops trying to write PMC%d\n", idx); | ||
100 | } | ||
101 | |||
102 | isync(); | ||
103 | } | ||
104 | |||
105 | /* | ||
106 | * Write one local control A register | ||
107 | */ | ||
108 | static void write_pmlca(int idx, unsigned long val) | ||
109 | { | ||
110 | switch (idx) { | ||
111 | case 0: | ||
112 | mtpmr(PMRN_PMLCA0, val); | ||
113 | break; | ||
114 | case 1: | ||
115 | mtpmr(PMRN_PMLCA1, val); | ||
116 | break; | ||
117 | case 2: | ||
118 | mtpmr(PMRN_PMLCA2, val); | ||
119 | break; | ||
120 | case 3: | ||
121 | mtpmr(PMRN_PMLCA3, val); | ||
122 | break; | ||
123 | default: | ||
124 | printk(KERN_ERR "oops trying to write PMLCA%d\n", idx); | ||
125 | } | ||
126 | |||
127 | isync(); | ||
128 | } | ||
129 | |||
130 | /* | ||
131 | * Write one local control B register | ||
132 | */ | ||
133 | static void write_pmlcb(int idx, unsigned long val) | ||
134 | { | ||
135 | switch (idx) { | ||
136 | case 0: | ||
137 | mtpmr(PMRN_PMLCB0, val); | ||
138 | break; | ||
139 | case 1: | ||
140 | mtpmr(PMRN_PMLCB1, val); | ||
141 | break; | ||
142 | case 2: | ||
143 | mtpmr(PMRN_PMLCB2, val); | ||
144 | break; | ||
145 | case 3: | ||
146 | mtpmr(PMRN_PMLCB3, val); | ||
147 | break; | ||
148 | default: | ||
149 | printk(KERN_ERR "oops trying to write PMLCB%d\n", idx); | ||
150 | } | ||
151 | |||
152 | isync(); | ||
153 | } | ||
154 | |||
155 | static void fsl_emb_pmu_read(struct perf_event *event) | ||
156 | { | ||
157 | s64 val, delta, prev; | ||
158 | |||
159 | /* | ||
160 | * Performance monitor interrupts come even when interrupts | ||
161 | * are soft-disabled, as long as interrupts are hard-enabled. | ||
162 | * Therefore we treat them like NMIs. | ||
163 | */ | ||
164 | do { | ||
165 | prev = atomic64_read(&event->hw.prev_count); | ||
166 | barrier(); | ||
167 | val = read_pmc(event->hw.idx); | ||
168 | } while (atomic64_cmpxchg(&event->hw.prev_count, prev, val) != prev); | ||
169 | |||
170 | /* The counters are only 32 bits wide */ | ||
171 | delta = (val - prev) & 0xfffffffful; | ||
172 | atomic64_add(delta, &event->count); | ||
173 | atomic64_sub(delta, &event->hw.period_left); | ||
174 | } | ||
175 | |||
176 | /* | ||
177 | * Disable all events to prevent PMU interrupts and to allow | ||
178 | * events to be added or removed. | ||
179 | */ | ||
180 | void hw_perf_disable(void) | ||
181 | { | ||
182 | struct cpu_hw_events *cpuhw; | ||
183 | unsigned long flags; | ||
184 | |||
185 | local_irq_save(flags); | ||
186 | cpuhw = &__get_cpu_var(cpu_hw_events); | ||
187 | |||
188 | if (!cpuhw->disabled) { | ||
189 | cpuhw->disabled = 1; | ||
190 | |||
191 | /* | ||
192 | * Check if we ever enabled the PMU on this cpu. | ||
193 | */ | ||
194 | if (!cpuhw->pmcs_enabled) { | ||
195 | ppc_enable_pmcs(); | ||
196 | cpuhw->pmcs_enabled = 1; | ||
197 | } | ||
198 | |||
199 | if (atomic_read(&num_events)) { | ||
200 | /* | ||
201 | * Set the 'freeze all counters' bit, and disable | ||
202 | * interrupts. The barrier is to make sure the | ||
203 | * mtpmr has been executed and the PMU has frozen | ||
204 | * the events before we return. | ||
205 | */ | ||
206 | |||
207 | mtpmr(PMRN_PMGC0, PMGC0_FAC); | ||
208 | isync(); | ||
209 | } | ||
210 | } | ||
211 | local_irq_restore(flags); | ||
212 | } | ||
213 | |||
214 | /* | ||
215 | * Re-enable all events if disable == 0. | ||
216 | * If we were previously disabled and events were added, then | ||
217 | * put the new config on the PMU. | ||
218 | */ | ||
219 | void hw_perf_enable(void) | ||
220 | { | ||
221 | struct cpu_hw_events *cpuhw; | ||
222 | unsigned long flags; | ||
223 | |||
224 | local_irq_save(flags); | ||
225 | cpuhw = &__get_cpu_var(cpu_hw_events); | ||
226 | if (!cpuhw->disabled) | ||
227 | goto out; | ||
228 | |||
229 | cpuhw->disabled = 0; | ||
230 | ppc_set_pmu_inuse(cpuhw->n_events != 0); | ||
231 | |||
232 | if (cpuhw->n_events > 0) { | ||
233 | mtpmr(PMRN_PMGC0, PMGC0_PMIE | PMGC0_FCECE); | ||
234 | isync(); | ||
235 | } | ||
236 | |||
237 | out: | ||
238 | local_irq_restore(flags); | ||
239 | } | ||
240 | |||
241 | static int collect_events(struct perf_event *group, int max_count, | ||
242 | struct perf_event *ctrs[]) | ||
243 | { | ||
244 | int n = 0; | ||
245 | struct perf_event *event; | ||
246 | |||
247 | if (!is_software_event(group)) { | ||
248 | if (n >= max_count) | ||
249 | return -1; | ||
250 | ctrs[n] = group; | ||
251 | n++; | ||
252 | } | ||
253 | list_for_each_entry(event, &group->sibling_list, group_entry) { | ||
254 | if (!is_software_event(event) && | ||
255 | event->state != PERF_EVENT_STATE_OFF) { | ||
256 | if (n >= max_count) | ||
257 | return -1; | ||
258 | ctrs[n] = event; | ||
259 | n++; | ||
260 | } | ||
261 | } | ||
262 | return n; | ||
263 | } | ||
264 | |||
265 | /* perf must be disabled, context locked on entry */ | ||
266 | static int fsl_emb_pmu_enable(struct perf_event *event) | ||
267 | { | ||
268 | struct cpu_hw_events *cpuhw; | ||
269 | int ret = -EAGAIN; | ||
270 | int num_counters = ppmu->n_counter; | ||
271 | u64 val; | ||
272 | int i; | ||
273 | |||
274 | cpuhw = &get_cpu_var(cpu_hw_events); | ||
275 | |||
276 | if (event->hw.config & FSL_EMB_EVENT_RESTRICTED) | ||
277 | num_counters = ppmu->n_restricted; | ||
278 | |||
279 | /* | ||
280 | * Allocate counters from top-down, so that restricted-capable | ||
281 | * counters are kept free as long as possible. | ||
282 | */ | ||
283 | for (i = num_counters - 1; i >= 0; i--) { | ||
284 | if (cpuhw->event[i]) | ||
285 | continue; | ||
286 | |||
287 | break; | ||
288 | } | ||
289 | |||
290 | if (i < 0) | ||
291 | goto out; | ||
292 | |||
293 | event->hw.idx = i; | ||
294 | cpuhw->event[i] = event; | ||
295 | ++cpuhw->n_events; | ||
296 | |||
297 | val = 0; | ||
298 | if (event->hw.sample_period) { | ||
299 | s64 left = atomic64_read(&event->hw.period_left); | ||
300 | if (left < 0x80000000L) | ||
301 | val = 0x80000000L - left; | ||
302 | } | ||
303 | atomic64_set(&event->hw.prev_count, val); | ||
304 | write_pmc(i, val); | ||
305 | perf_event_update_userpage(event); | ||
306 | |||
307 | write_pmlcb(i, event->hw.config >> 32); | ||
308 | write_pmlca(i, event->hw.config_base); | ||
309 | |||
310 | ret = 0; | ||
311 | out: | ||
312 | put_cpu_var(cpu_hw_events); | ||
313 | return ret; | ||
314 | } | ||
315 | |||
316 | /* perf must be disabled, context locked on entry */ | ||
317 | static void fsl_emb_pmu_disable(struct perf_event *event) | ||
318 | { | ||
319 | struct cpu_hw_events *cpuhw; | ||
320 | int i = event->hw.idx; | ||
321 | |||
322 | if (i < 0) | ||
323 | goto out; | ||
324 | |||
325 | fsl_emb_pmu_read(event); | ||
326 | |||
327 | cpuhw = &get_cpu_var(cpu_hw_events); | ||
328 | |||
329 | WARN_ON(event != cpuhw->event[event->hw.idx]); | ||
330 | |||
331 | write_pmlca(i, 0); | ||
332 | write_pmlcb(i, 0); | ||
333 | write_pmc(i, 0); | ||
334 | |||
335 | cpuhw->event[i] = NULL; | ||
336 | event->hw.idx = -1; | ||
337 | |||
338 | /* | ||
339 | * TODO: if at least one restricted event exists, and we | ||
340 | * just freed up a non-restricted-capable counter, and | ||
341 | * there is a restricted-capable counter occupied by | ||
342 | * a non-restricted event, migrate that event to the | ||
343 | * vacated counter. | ||
344 | */ | ||
345 | |||
346 | cpuhw->n_events--; | ||
347 | |||
348 | out: | ||
349 | put_cpu_var(cpu_hw_events); | ||
350 | } | ||
351 | |||
352 | /* | ||
353 | * Re-enable interrupts on a event after they were throttled | ||
354 | * because they were coming too fast. | ||
355 | * | ||
356 | * Context is locked on entry, but perf is not disabled. | ||
357 | */ | ||
358 | static void fsl_emb_pmu_unthrottle(struct perf_event *event) | ||
359 | { | ||
360 | s64 val, left; | ||
361 | unsigned long flags; | ||
362 | |||
363 | if (event->hw.idx < 0 || !event->hw.sample_period) | ||
364 | return; | ||
365 | local_irq_save(flags); | ||
366 | perf_disable(); | ||
367 | fsl_emb_pmu_read(event); | ||
368 | left = event->hw.sample_period; | ||
369 | event->hw.last_period = left; | ||
370 | val = 0; | ||
371 | if (left < 0x80000000L) | ||
372 | val = 0x80000000L - left; | ||
373 | write_pmc(event->hw.idx, val); | ||
374 | atomic64_set(&event->hw.prev_count, val); | ||
375 | atomic64_set(&event->hw.period_left, left); | ||
376 | perf_event_update_userpage(event); | ||
377 | perf_enable(); | ||
378 | local_irq_restore(flags); | ||
379 | } | ||
380 | |||
381 | static struct pmu fsl_emb_pmu = { | ||
382 | .enable = fsl_emb_pmu_enable, | ||
383 | .disable = fsl_emb_pmu_disable, | ||
384 | .read = fsl_emb_pmu_read, | ||
385 | .unthrottle = fsl_emb_pmu_unthrottle, | ||
386 | }; | ||
387 | |||
388 | /* | ||
389 | * Release the PMU if this is the last perf_event. | ||
390 | */ | ||
391 | static void hw_perf_event_destroy(struct perf_event *event) | ||
392 | { | ||
393 | if (!atomic_add_unless(&num_events, -1, 1)) { | ||
394 | mutex_lock(&pmc_reserve_mutex); | ||
395 | if (atomic_dec_return(&num_events) == 0) | ||
396 | release_pmc_hardware(); | ||
397 | mutex_unlock(&pmc_reserve_mutex); | ||
398 | } | ||
399 | } | ||
400 | |||
401 | /* | ||
402 | * Translate a generic cache event_id config to a raw event_id code. | ||
403 | */ | ||
404 | static int hw_perf_cache_event(u64 config, u64 *eventp) | ||
405 | { | ||
406 | unsigned long type, op, result; | ||
407 | int ev; | ||
408 | |||
409 | if (!ppmu->cache_events) | ||
410 | return -EINVAL; | ||
411 | |||
412 | /* unpack config */ | ||
413 | type = config & 0xff; | ||
414 | op = (config >> 8) & 0xff; | ||
415 | result = (config >> 16) & 0xff; | ||
416 | |||
417 | if (type >= PERF_COUNT_HW_CACHE_MAX || | ||
418 | op >= PERF_COUNT_HW_CACHE_OP_MAX || | ||
419 | result >= PERF_COUNT_HW_CACHE_RESULT_MAX) | ||
420 | return -EINVAL; | ||
421 | |||
422 | ev = (*ppmu->cache_events)[type][op][result]; | ||
423 | if (ev == 0) | ||
424 | return -EOPNOTSUPP; | ||
425 | if (ev == -1) | ||
426 | return -EINVAL; | ||
427 | *eventp = ev; | ||
428 | return 0; | ||
429 | } | ||
430 | |||
431 | const struct pmu *hw_perf_event_init(struct perf_event *event) | ||
432 | { | ||
433 | u64 ev; | ||
434 | struct perf_event *events[MAX_HWEVENTS]; | ||
435 | int n; | ||
436 | int err; | ||
437 | int num_restricted; | ||
438 | int i; | ||
439 | |||
440 | switch (event->attr.type) { | ||
441 | case PERF_TYPE_HARDWARE: | ||
442 | ev = event->attr.config; | ||
443 | if (ev >= ppmu->n_generic || ppmu->generic_events[ev] == 0) | ||
444 | return ERR_PTR(-EOPNOTSUPP); | ||
445 | ev = ppmu->generic_events[ev]; | ||
446 | break; | ||
447 | |||
448 | case PERF_TYPE_HW_CACHE: | ||
449 | err = hw_perf_cache_event(event->attr.config, &ev); | ||
450 | if (err) | ||
451 | return ERR_PTR(err); | ||
452 | break; | ||
453 | |||
454 | case PERF_TYPE_RAW: | ||
455 | ev = event->attr.config; | ||
456 | break; | ||
457 | |||
458 | default: | ||
459 | return ERR_PTR(-EINVAL); | ||
460 | } | ||
461 | |||
462 | event->hw.config = ppmu->xlate_event(ev); | ||
463 | if (!(event->hw.config & FSL_EMB_EVENT_VALID)) | ||
464 | return ERR_PTR(-EINVAL); | ||
465 | |||
466 | /* | ||
467 | * If this is in a group, check if it can go on with all the | ||
468 | * other hardware events in the group. We assume the event | ||
469 | * hasn't been linked into its leader's sibling list at this point. | ||
470 | */ | ||
471 | n = 0; | ||
472 | if (event->group_leader != event) { | ||
473 | n = collect_events(event->group_leader, | ||
474 | ppmu->n_counter - 1, events); | ||
475 | if (n < 0) | ||
476 | return ERR_PTR(-EINVAL); | ||
477 | } | ||
478 | |||
479 | if (event->hw.config & FSL_EMB_EVENT_RESTRICTED) { | ||
480 | num_restricted = 0; | ||
481 | for (i = 0; i < n; i++) { | ||
482 | if (events[i]->hw.config & FSL_EMB_EVENT_RESTRICTED) | ||
483 | num_restricted++; | ||
484 | } | ||
485 | |||
486 | if (num_restricted >= ppmu->n_restricted) | ||
487 | return ERR_PTR(-EINVAL); | ||
488 | } | ||
489 | |||
490 | event->hw.idx = -1; | ||
491 | |||
492 | event->hw.config_base = PMLCA_CE | PMLCA_FCM1 | | ||
493 | (u32)((ev << 16) & PMLCA_EVENT_MASK); | ||
494 | |||
495 | if (event->attr.exclude_user) | ||
496 | event->hw.config_base |= PMLCA_FCU; | ||
497 | if (event->attr.exclude_kernel) | ||
498 | event->hw.config_base |= PMLCA_FCS; | ||
499 | if (event->attr.exclude_idle) | ||
500 | return ERR_PTR(-ENOTSUPP); | ||
501 | |||
502 | event->hw.last_period = event->hw.sample_period; | ||
503 | atomic64_set(&event->hw.period_left, event->hw.last_period); | ||
504 | |||
505 | /* | ||
506 | * See if we need to reserve the PMU. | ||
507 | * If no events are currently in use, then we have to take a | ||
508 | * mutex to ensure that we don't race with another task doing | ||
509 | * reserve_pmc_hardware or release_pmc_hardware. | ||
510 | */ | ||
511 | err = 0; | ||
512 | if (!atomic_inc_not_zero(&num_events)) { | ||
513 | mutex_lock(&pmc_reserve_mutex); | ||
514 | if (atomic_read(&num_events) == 0 && | ||
515 | reserve_pmc_hardware(perf_event_interrupt)) | ||
516 | err = -EBUSY; | ||
517 | else | ||
518 | atomic_inc(&num_events); | ||
519 | mutex_unlock(&pmc_reserve_mutex); | ||
520 | |||
521 | mtpmr(PMRN_PMGC0, PMGC0_FAC); | ||
522 | isync(); | ||
523 | } | ||
524 | event->destroy = hw_perf_event_destroy; | ||
525 | |||
526 | if (err) | ||
527 | return ERR_PTR(err); | ||
528 | return &fsl_emb_pmu; | ||
529 | } | ||
530 | |||
531 | /* | ||
532 | * A counter has overflowed; update its count and record | ||
533 | * things if requested. Note that interrupts are hard-disabled | ||
534 | * here so there is no possibility of being interrupted. | ||
535 | */ | ||
536 | static void record_and_restart(struct perf_event *event, unsigned long val, | ||
537 | struct pt_regs *regs, int nmi) | ||
538 | { | ||
539 | u64 period = event->hw.sample_period; | ||
540 | s64 prev, delta, left; | ||
541 | int record = 0; | ||
542 | |||
543 | /* we don't have to worry about interrupts here */ | ||
544 | prev = atomic64_read(&event->hw.prev_count); | ||
545 | delta = (val - prev) & 0xfffffffful; | ||
546 | atomic64_add(delta, &event->count); | ||
547 | |||
548 | /* | ||
549 | * See if the total period for this event has expired, | ||
550 | * and update for the next period. | ||
551 | */ | ||
552 | val = 0; | ||
553 | left = atomic64_read(&event->hw.period_left) - delta; | ||
554 | if (period) { | ||
555 | if (left <= 0) { | ||
556 | left += period; | ||
557 | if (left <= 0) | ||
558 | left = period; | ||
559 | record = 1; | ||
560 | } | ||
561 | if (left < 0x80000000LL) | ||
562 | val = 0x80000000LL - left; | ||
563 | } | ||
564 | |||
565 | /* | ||
566 | * Finally record data if requested. | ||
567 | */ | ||
568 | if (record) { | ||
569 | struct perf_sample_data data = { | ||
570 | .period = event->hw.last_period, | ||
571 | }; | ||
572 | |||
573 | if (perf_event_overflow(event, nmi, &data, regs)) { | ||
574 | /* | ||
575 | * Interrupts are coming too fast - throttle them | ||
576 | * by setting the event to 0, so it will be | ||
577 | * at least 2^30 cycles until the next interrupt | ||
578 | * (assuming each event counts at most 2 counts | ||
579 | * per cycle). | ||
580 | */ | ||
581 | val = 0; | ||
582 | left = ~0ULL >> 1; | ||
583 | } | ||
584 | } | ||
585 | |||
586 | write_pmc(event->hw.idx, val); | ||
587 | atomic64_set(&event->hw.prev_count, val); | ||
588 | atomic64_set(&event->hw.period_left, left); | ||
589 | perf_event_update_userpage(event); | ||
590 | } | ||
591 | |||
592 | static void perf_event_interrupt(struct pt_regs *regs) | ||
593 | { | ||
594 | int i; | ||
595 | struct cpu_hw_events *cpuhw = &__get_cpu_var(cpu_hw_events); | ||
596 | struct perf_event *event; | ||
597 | unsigned long val; | ||
598 | int found = 0; | ||
599 | int nmi; | ||
600 | |||
601 | nmi = perf_intr_is_nmi(regs); | ||
602 | if (nmi) | ||
603 | nmi_enter(); | ||
604 | else | ||
605 | irq_enter(); | ||
606 | |||
607 | for (i = 0; i < ppmu->n_counter; ++i) { | ||
608 | event = cpuhw->event[i]; | ||
609 | |||
610 | val = read_pmc(i); | ||
611 | if ((int)val < 0) { | ||
612 | if (event) { | ||
613 | /* event has overflowed */ | ||
614 | found = 1; | ||
615 | record_and_restart(event, val, regs, nmi); | ||
616 | } else { | ||
617 | /* | ||
618 | * Disabled counter is negative, | ||
619 | * reset it just in case. | ||
620 | */ | ||
621 | write_pmc(i, 0); | ||
622 | } | ||
623 | } | ||
624 | } | ||
625 | |||
626 | /* PMM will keep counters frozen until we return from the interrupt. */ | ||
627 | mtmsr(mfmsr() | MSR_PMM); | ||
628 | mtpmr(PMRN_PMGC0, PMGC0_PMIE | PMGC0_FCECE); | ||
629 | isync(); | ||
630 | |||
631 | if (nmi) | ||
632 | nmi_exit(); | ||
633 | else | ||
634 | irq_exit(); | ||
635 | } | ||
636 | |||
637 | void hw_perf_event_setup(int cpu) | ||
638 | { | ||
639 | struct cpu_hw_events *cpuhw = &per_cpu(cpu_hw_events, cpu); | ||
640 | |||
641 | memset(cpuhw, 0, sizeof(*cpuhw)); | ||
642 | } | ||
643 | |||
644 | int register_fsl_emb_pmu(struct fsl_emb_pmu *pmu) | ||
645 | { | ||
646 | if (ppmu) | ||
647 | return -EBUSY; /* something's already registered */ | ||
648 | |||
649 | ppmu = pmu; | ||
650 | pr_info("%s performance monitor hardware support registered\n", | ||
651 | pmu->name); | ||
652 | |||
653 | return 0; | ||
654 | } | ||
diff --git a/arch/powerpc/platforms/Kconfig.cputype b/arch/powerpc/platforms/Kconfig.cputype index fa0f690d3867..a8aae0b54579 100644 --- a/arch/powerpc/platforms/Kconfig.cputype +++ b/arch/powerpc/platforms/Kconfig.cputype | |||
@@ -144,6 +144,16 @@ config FSL_EMB_PERFMON | |||
144 | and some e300 cores (c3 and c4). Select this only if your | 144 | and some e300 cores (c3 and c4). Select this only if your |
145 | core supports the Embedded Performance Monitor APU | 145 | core supports the Embedded Performance Monitor APU |
146 | 146 | ||
147 | config FSL_EMB_PERF_EVENT | ||
148 | bool | ||
149 | depends on FSL_EMB_PERFMON && PERF_EVENTS && !PPC_PERF_CTRS | ||
150 | default y | ||
151 | |||
152 | config FSL_EMB_PERF_EVENT_E500 | ||
153 | bool | ||
154 | depends on FSL_EMB_PERF_EVENT && E500 | ||
155 | default y | ||
156 | |||
147 | config 4xx | 157 | config 4xx |
148 | bool | 158 | bool |
149 | depends on 40x || 44x | 159 | depends on 40x || 44x |