diff options
author | Linus Torvalds <torvalds@linux-foundation.org> | 2013-09-06 13:49:42 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2013-09-06 13:49:42 -0400 |
commit | 39eda2aba6be642b71f2e0ad623dcb09fd9d79cf (patch) | |
tree | cd0c8f547847641af73e38aab2478f3119dee490 /arch/powerpc/perf | |
parent | 2e515bf096c245ba87f20ab4b4ea20f911afaeda (diff) | |
parent | 9f24b0c9ef9b6b1292579c9e2cd7ff07ddc372b7 (diff) |
Merge branch 'next' of git://git.kernel.org/pub/scm/linux/kernel/git/benh/powerpc
Pull powerpc updates from Ben Herrenschmidt:
"Here's the powerpc batch for this merge window. Some of the
highlights are:
- A bunch of endian fixes ! We don't have full LE support yet in that
release but this contains a lot of fixes all over arch/powerpc to
use the proper accessors, call the firmware with the right endian
mode, etc...
- A few updates to our "powernv" platform (non-virtualized, the one
to run KVM on), among other, support for bridging the P8 LPC bus
for UARTs, support and some EEH fixes.
- Some mpc51xx clock API cleanups in preparation for a clock API
overhaul
- A pile of cleanups of our old math emulation code, including better
support for using it to emulate optional FP instructions on
embedded chips that otherwise have a HW FPU.
- Some infrastructure in selftest, for powerpc now, but could be
generalized, initially used by some tests for our perf instruction
counting code.
- A pile of fixes for hotplug on pseries (that was seriously
bitrotting)
- The usual slew of freescale embedded updates, new boards, 64-bit
hiberation support, e6500 core PMU support, etc..."
* 'next' of git://git.kernel.org/pub/scm/linux/kernel/git/benh/powerpc: (146 commits)
powerpc: Correct FSCR bit definitions
powerpc/xmon: Fix printing of set of CPUs in xmon
powerpc/pseries: Move lparcfg.c to platforms/pseries
powerpc/powernv: Return secondary CPUs to firmware on kexec
powerpc/btext: Fix CONFIG_PPC_EARLY_DEBUG_BOOTX on ppc32
powerpc: Cleanup handling of the DSCR bit in the FSCR register
powerpc/pseries: Child nodes are not detached by dlpar_detach_node
powerpc/pseries: Add mising of_node_put in delete_dt_node
powerpc/pseries: Make dlpar_configure_connector parent node aware
powerpc/pseries: Do all node initialization in dlpar_parse_cc_node
powerpc/pseries: Fix parsing of initial node path in update_dt_node
powerpc/pseries: Pack update_props_workarea to map correctly to rtas buffer header
powerpc/pseries: Fix over writing of rtas return code in update_dt_node
powerpc/pseries: Fix creation of loop in device node property list
powerpc: Skip emulating & leave interrupts off for kernel program checks
powerpc: Add more exception trampolines for hypervisor exceptions
powerpc: Fix location and rename exception trampolines
powerpc: Add more trap names to xmon
powerpc/pseries: Add a warning in the case of cross-cpu VPA registration
powerpc: Update the 00-Index in Documentation/powerpc
...
Diffstat (limited to 'arch/powerpc/perf')
-rw-r--r-- | arch/powerpc/perf/Makefile | 2 | ||||
-rw-r--r-- | arch/powerpc/perf/core-book3s.c | 2 | ||||
-rw-r--r-- | arch/powerpc/perf/core-fsl-emb.c | 30 | ||||
-rw-r--r-- | arch/powerpc/perf/e6500-pmu.c | 121 |
4 files changed, 153 insertions, 2 deletions
diff --git a/arch/powerpc/perf/Makefile b/arch/powerpc/perf/Makefile index 510fae10513d..60d71eea919c 100644 --- a/arch/powerpc/perf/Makefile +++ b/arch/powerpc/perf/Makefile | |||
@@ -9,7 +9,7 @@ obj64-$(CONFIG_PPC_PERF_CTRS) += power4-pmu.o ppc970-pmu.o power5-pmu.o \ | |||
9 | obj32-$(CONFIG_PPC_PERF_CTRS) += mpc7450-pmu.o | 9 | obj32-$(CONFIG_PPC_PERF_CTRS) += mpc7450-pmu.o |
10 | 10 | ||
11 | obj-$(CONFIG_FSL_EMB_PERF_EVENT) += core-fsl-emb.o | 11 | obj-$(CONFIG_FSL_EMB_PERF_EVENT) += core-fsl-emb.o |
12 | obj-$(CONFIG_FSL_EMB_PERF_EVENT_E500) += e500-pmu.o | 12 | obj-$(CONFIG_FSL_EMB_PERF_EVENT_E500) += e500-pmu.o e6500-pmu.o |
13 | 13 | ||
14 | obj-$(CONFIG_PPC64) += $(obj64-y) | 14 | obj-$(CONFIG_PPC64) += $(obj64-y) |
15 | obj-$(CONFIG_PPC32) += $(obj32-y) | 15 | obj-$(CONFIG_PPC32) += $(obj32-y) |
diff --git a/arch/powerpc/perf/core-book3s.c b/arch/powerpc/perf/core-book3s.c index eeae308cf982..29b89e863d7c 100644 --- a/arch/powerpc/perf/core-book3s.c +++ b/arch/powerpc/perf/core-book3s.c | |||
@@ -24,7 +24,7 @@ | |||
24 | #define BHRB_MAX_ENTRIES 32 | 24 | #define BHRB_MAX_ENTRIES 32 |
25 | #define BHRB_TARGET 0x0000000000000002 | 25 | #define BHRB_TARGET 0x0000000000000002 |
26 | #define BHRB_PREDICTION 0x0000000000000001 | 26 | #define BHRB_PREDICTION 0x0000000000000001 |
27 | #define BHRB_EA 0xFFFFFFFFFFFFFFFC | 27 | #define BHRB_EA 0xFFFFFFFFFFFFFFFCUL |
28 | 28 | ||
29 | struct cpu_hw_events { | 29 | struct cpu_hw_events { |
30 | int n_events; | 30 | int n_events; |
diff --git a/arch/powerpc/perf/core-fsl-emb.c b/arch/powerpc/perf/core-fsl-emb.c index 106c53354675..d35ae52c69dc 100644 --- a/arch/powerpc/perf/core-fsl-emb.c +++ b/arch/powerpc/perf/core-fsl-emb.c | |||
@@ -70,6 +70,12 @@ static unsigned long read_pmc(int idx) | |||
70 | case 3: | 70 | case 3: |
71 | val = mfpmr(PMRN_PMC3); | 71 | val = mfpmr(PMRN_PMC3); |
72 | break; | 72 | break; |
73 | case 4: | ||
74 | val = mfpmr(PMRN_PMC4); | ||
75 | break; | ||
76 | case 5: | ||
77 | val = mfpmr(PMRN_PMC5); | ||
78 | break; | ||
73 | default: | 79 | default: |
74 | printk(KERN_ERR "oops trying to read PMC%d\n", idx); | 80 | printk(KERN_ERR "oops trying to read PMC%d\n", idx); |
75 | val = 0; | 81 | val = 0; |
@@ -95,6 +101,12 @@ static void write_pmc(int idx, unsigned long val) | |||
95 | case 3: | 101 | case 3: |
96 | mtpmr(PMRN_PMC3, val); | 102 | mtpmr(PMRN_PMC3, val); |
97 | break; | 103 | break; |
104 | case 4: | ||
105 | mtpmr(PMRN_PMC4, val); | ||
106 | break; | ||
107 | case 5: | ||
108 | mtpmr(PMRN_PMC5, val); | ||
109 | break; | ||
98 | default: | 110 | default: |
99 | printk(KERN_ERR "oops trying to write PMC%d\n", idx); | 111 | printk(KERN_ERR "oops trying to write PMC%d\n", idx); |
100 | } | 112 | } |
@@ -120,6 +132,12 @@ static void write_pmlca(int idx, unsigned long val) | |||
120 | case 3: | 132 | case 3: |
121 | mtpmr(PMRN_PMLCA3, val); | 133 | mtpmr(PMRN_PMLCA3, val); |
122 | break; | 134 | break; |
135 | case 4: | ||
136 | mtpmr(PMRN_PMLCA4, val); | ||
137 | break; | ||
138 | case 5: | ||
139 | mtpmr(PMRN_PMLCA5, val); | ||
140 | break; | ||
123 | default: | 141 | default: |
124 | printk(KERN_ERR "oops trying to write PMLCA%d\n", idx); | 142 | printk(KERN_ERR "oops trying to write PMLCA%d\n", idx); |
125 | } | 143 | } |
@@ -145,6 +163,12 @@ static void write_pmlcb(int idx, unsigned long val) | |||
145 | case 3: | 163 | case 3: |
146 | mtpmr(PMRN_PMLCB3, val); | 164 | mtpmr(PMRN_PMLCB3, val); |
147 | break; | 165 | break; |
166 | case 4: | ||
167 | mtpmr(PMRN_PMLCB4, val); | ||
168 | break; | ||
169 | case 5: | ||
170 | mtpmr(PMRN_PMLCB5, val); | ||
171 | break; | ||
148 | default: | 172 | default: |
149 | printk(KERN_ERR "oops trying to write PMLCB%d\n", idx); | 173 | printk(KERN_ERR "oops trying to write PMLCB%d\n", idx); |
150 | } | 174 | } |
@@ -462,6 +486,12 @@ static int fsl_emb_pmu_event_init(struct perf_event *event) | |||
462 | int num_restricted; | 486 | int num_restricted; |
463 | int i; | 487 | int i; |
464 | 488 | ||
489 | if (ppmu->n_counter > MAX_HWEVENTS) { | ||
490 | WARN(1, "No. of perf counters (%d) is higher than max array size(%d)\n", | ||
491 | ppmu->n_counter, MAX_HWEVENTS); | ||
492 | ppmu->n_counter = MAX_HWEVENTS; | ||
493 | } | ||
494 | |||
465 | switch (event->attr.type) { | 495 | switch (event->attr.type) { |
466 | case PERF_TYPE_HARDWARE: | 496 | case PERF_TYPE_HARDWARE: |
467 | ev = event->attr.config; | 497 | ev = event->attr.config; |
diff --git a/arch/powerpc/perf/e6500-pmu.c b/arch/powerpc/perf/e6500-pmu.c new file mode 100644 index 000000000000..3d877aa777b5 --- /dev/null +++ b/arch/powerpc/perf/e6500-pmu.c | |||
@@ -0,0 +1,121 @@ | |||
1 | /* | ||
2 | * Performance counter support for e6500 family processors. | ||
3 | * | ||
4 | * Author: Priyanka Jain, Priyanka.Jain@freescale.com | ||
5 | * Based on e500-pmu.c | ||
6 | * Copyright 2013 Freescale Semiconductor, Inc. | ||
7 | * Copyright 2008-2009 Paul Mackerras, IBM Corporation. | ||
8 | * | ||
9 | * This program is free software; you can redistribute it and/or | ||
10 | * modify it under the terms of the GNU General Public License | ||
11 | * as published by the Free Software Foundation; either version | ||
12 | * 2 of the License, or (at your option) any later version. | ||
13 | */ | ||
14 | |||
15 | #include <linux/string.h> | ||
16 | #include <linux/perf_event.h> | ||
17 | #include <asm/reg.h> | ||
18 | #include <asm/cputable.h> | ||
19 | |||
20 | /* | ||
21 | * Map of generic hardware event types to hardware events | ||
22 | * Zero if unsupported | ||
23 | */ | ||
24 | static int e6500_generic_events[] = { | ||
25 | [PERF_COUNT_HW_CPU_CYCLES] = 1, | ||
26 | [PERF_COUNT_HW_INSTRUCTIONS] = 2, | ||
27 | [PERF_COUNT_HW_CACHE_MISSES] = 221, | ||
28 | [PERF_COUNT_HW_BRANCH_INSTRUCTIONS] = 12, | ||
29 | [PERF_COUNT_HW_BRANCH_MISSES] = 15, | ||
30 | }; | ||
31 | |||
32 | #define C(x) PERF_COUNT_HW_CACHE_##x | ||
33 | |||
34 | /* | ||
35 | * Table of generalized cache-related events. | ||
36 | * 0 means not supported, -1 means nonsensical, other values | ||
37 | * are event codes. | ||
38 | */ | ||
39 | static int e6500_cache_events[C(MAX)][C(OP_MAX)][C(RESULT_MAX)] = { | ||
40 | [C(L1D)] = { | ||
41 | /*RESULT_ACCESS RESULT_MISS */ | ||
42 | [C(OP_READ)] = { 27, 222 }, | ||
43 | [C(OP_WRITE)] = { 28, 223 }, | ||
44 | [C(OP_PREFETCH)] = { 29, 0 }, | ||
45 | }, | ||
46 | [C(L1I)] = { | ||
47 | /*RESULT_ACCESS RESULT_MISS */ | ||
48 | [C(OP_READ)] = { 2, 254 }, | ||
49 | [C(OP_WRITE)] = { -1, -1 }, | ||
50 | [C(OP_PREFETCH)] = { 37, 0 }, | ||
51 | }, | ||
52 | /* | ||
53 | * Assuming LL means L2, it's not a good match for this model. | ||
54 | * It does not have separate read/write events (but it does have | ||
55 | * separate instruction/data events). | ||
56 | */ | ||
57 | [C(LL)] = { | ||
58 | /*RESULT_ACCESS RESULT_MISS */ | ||
59 | [C(OP_READ)] = { 0, 0 }, | ||
60 | [C(OP_WRITE)] = { 0, 0 }, | ||
61 | [C(OP_PREFETCH)] = { 0, 0 }, | ||
62 | }, | ||
63 | /* | ||
64 | * There are data/instruction MMU misses, but that's a miss on | ||
65 | * the chip's internal level-one TLB which is probably not | ||
66 | * what the user wants. Instead, unified level-two TLB misses | ||
67 | * are reported here. | ||
68 | */ | ||
69 | [C(DTLB)] = { | ||
70 | /*RESULT_ACCESS RESULT_MISS */ | ||
71 | [C(OP_READ)] = { 26, 66 }, | ||
72 | [C(OP_WRITE)] = { -1, -1 }, | ||
73 | [C(OP_PREFETCH)] = { -1, -1 }, | ||
74 | }, | ||
75 | [C(BPU)] = { | ||
76 | /*RESULT_ACCESS RESULT_MISS */ | ||
77 | [C(OP_READ)] = { 12, 15 }, | ||
78 | [C(OP_WRITE)] = { -1, -1 }, | ||
79 | [C(OP_PREFETCH)] = { -1, -1 }, | ||
80 | }, | ||
81 | [C(NODE)] = { | ||
82 | /* RESULT_ACCESS RESULT_MISS */ | ||
83 | [C(OP_READ)] = { -1, -1 }, | ||
84 | [C(OP_WRITE)] = { -1, -1 }, | ||
85 | [C(OP_PREFETCH)] = { -1, -1 }, | ||
86 | }, | ||
87 | }; | ||
88 | |||
89 | static int num_events = 512; | ||
90 | |||
91 | /* Upper half of event id is PMLCb, for threshold events */ | ||
92 | static u64 e6500_xlate_event(u64 event_id) | ||
93 | { | ||
94 | u32 event_low = (u32)event_id; | ||
95 | if (event_low >= num_events || | ||
96 | (event_id & (FSL_EMB_EVENT_THRESHMUL | FSL_EMB_EVENT_THRESH))) | ||
97 | return 0; | ||
98 | |||
99 | return FSL_EMB_EVENT_VALID; | ||
100 | } | ||
101 | |||
102 | static struct fsl_emb_pmu e6500_pmu = { | ||
103 | .name = "e6500 family", | ||
104 | .n_counter = 6, | ||
105 | .n_restricted = 0, | ||
106 | .xlate_event = e6500_xlate_event, | ||
107 | .n_generic = ARRAY_SIZE(e6500_generic_events), | ||
108 | .generic_events = e6500_generic_events, | ||
109 | .cache_events = &e6500_cache_events, | ||
110 | }; | ||
111 | |||
112 | static int init_e6500_pmu(void) | ||
113 | { | ||
114 | if (!cur_cpu_spec->oprofile_cpu_type || | ||
115 | strcmp(cur_cpu_spec->oprofile_cpu_type, "ppc/e6500")) | ||
116 | return -ENODEV; | ||
117 | |||
118 | return register_fsl_emb_pmu(&e6500_pmu); | ||
119 | } | ||
120 | |||
121 | early_initcall(init_e6500_pmu); | ||