diff options
author | Fenghua Yu <fenghua.yu@intel.com> | 2010-07-29 20:13:45 -0400 |
---|---|---|
committer | H. Peter Anvin <hpa@linux.intel.com> | 2010-08-03 18:58:56 -0400 |
commit | 0199114c31798af5b83841b21759b64171060d9b (patch) | |
tree | a50a9eb0b1f2a43fb92d6143931fb0f688d766e8 /arch/x86/kernel | |
parent | 55d435a227bd28c77afab326de44dfacc0b15059 (diff) |
x86, hwmon: Package Level Thermal/Power: power limit
Power limit notification feature is published in Intel 64 and IA-32
Architectures SDMV Vol 3A 14.5.6 Power Limit Notification.
It is implemented first on Intel Sandy Bridge platform.
The patch handles notification interrupt. Interrupt handler dumps power limit
information in log_buf, logs the event in mce log, and increases the event
counters (core_power_limit and package_power_limit). Upper level applications
could use the data to detect system health or diagnose functionality/performance
issues.
In the future, the event could be handled in a more fancy way.
Signed-off-by: Fenghua Yu <fenghua.yu@intel.com>
LKML-Reference: <1280448826-12004-5-git-send-email-fenghua.yu@intel.com>
Reviewed-by: Len Brown <len.brown@intel.com>
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Diffstat (limited to 'arch/x86/kernel')
-rw-r--r-- | arch/x86/kernel/cpu/mcheck/therm_throt.c | 183 |
1 files changed, 129 insertions, 54 deletions
diff --git a/arch/x86/kernel/cpu/mcheck/therm_throt.c b/arch/x86/kernel/cpu/mcheck/therm_throt.c index d307f9f64c23..c2a8b26d4fea 100644 --- a/arch/x86/kernel/cpu/mcheck/therm_throt.c +++ b/arch/x86/kernel/cpu/mcheck/therm_throt.c | |||
@@ -34,20 +34,25 @@ | |||
34 | /* How long to wait between reporting thermal events */ | 34 | /* How long to wait between reporting thermal events */ |
35 | #define CHECK_INTERVAL (300 * HZ) | 35 | #define CHECK_INTERVAL (300 * HZ) |
36 | 36 | ||
37 | #define THERMAL_THROTTLING_EVENT 0 | ||
38 | #define POWER_LIMIT_EVENT 1 | ||
39 | |||
37 | /* | 40 | /* |
38 | * Current thermal throttling state: | 41 | * Current thermal event state: |
39 | */ | 42 | */ |
40 | struct _thermal_state { | 43 | struct _thermal_state { |
41 | bool is_throttled; | 44 | bool new_event; |
42 | 45 | int event; | |
43 | u64 next_check; | 46 | u64 next_check; |
44 | unsigned long throttle_count; | 47 | unsigned long count; |
45 | unsigned long last_throttle_count; | 48 | unsigned long last_count; |
46 | }; | 49 | }; |
47 | 50 | ||
48 | struct thermal_state { | 51 | struct thermal_state { |
49 | struct _thermal_state core; | 52 | struct _thermal_state core_throttle; |
50 | struct _thermal_state package; | 53 | struct _thermal_state core_power_limit; |
54 | struct _thermal_state package_throttle; | ||
55 | struct _thermal_state package_power_limit; | ||
51 | }; | 56 | }; |
52 | 57 | ||
53 | static DEFINE_PER_CPU(struct thermal_state, thermal_state); | 58 | static DEFINE_PER_CPU(struct thermal_state, thermal_state); |
@@ -62,9 +67,9 @@ static u32 lvtthmr_init __read_mostly; | |||
62 | therm_throt_sysdev_show_##_name, \ | 67 | therm_throt_sysdev_show_##_name, \ |
63 | NULL) \ | 68 | NULL) \ |
64 | 69 | ||
65 | #define define_therm_throt_sysdev_show_func(level, name) \ | 70 | #define define_therm_throt_sysdev_show_func(event, name) \ |
66 | \ | 71 | \ |
67 | static ssize_t therm_throt_sysdev_show_##level##_##name( \ | 72 | static ssize_t therm_throt_sysdev_show_##event##_##name( \ |
68 | struct sys_device *dev, \ | 73 | struct sys_device *dev, \ |
69 | struct sysdev_attribute *attr, \ | 74 | struct sysdev_attribute *attr, \ |
70 | char *buf) \ | 75 | char *buf) \ |
@@ -75,7 +80,7 @@ static ssize_t therm_throt_sysdev_show_##level##_##name( \ | |||
75 | preempt_disable(); /* CPU hotplug */ \ | 80 | preempt_disable(); /* CPU hotplug */ \ |
76 | if (cpu_online(cpu)) { \ | 81 | if (cpu_online(cpu)) { \ |
77 | ret = sprintf(buf, "%lu\n", \ | 82 | ret = sprintf(buf, "%lu\n", \ |
78 | per_cpu(thermal_state, cpu).level.name); \ | 83 | per_cpu(thermal_state, cpu).event.name); \ |
79 | } else \ | 84 | } else \ |
80 | ret = 0; \ | 85 | ret = 0; \ |
81 | preempt_enable(); \ | 86 | preempt_enable(); \ |
@@ -83,23 +88,32 @@ static ssize_t therm_throt_sysdev_show_##level##_##name( \ | |||
83 | return ret; \ | 88 | return ret; \ |
84 | } | 89 | } |
85 | 90 | ||
86 | define_therm_throt_sysdev_show_func(core, throttle_count); | 91 | define_therm_throt_sysdev_show_func(core_throttle, count); |
87 | define_therm_throt_sysdev_one_ro(core_throttle_count); | 92 | define_therm_throt_sysdev_one_ro(core_throttle_count); |
88 | 93 | ||
89 | define_therm_throt_sysdev_show_func(package, throttle_count); | 94 | define_therm_throt_sysdev_show_func(core_power_limit, count); |
95 | define_therm_throt_sysdev_one_ro(core_power_limit_count); | ||
96 | |||
97 | define_therm_throt_sysdev_show_func(package_throttle, count); | ||
90 | define_therm_throt_sysdev_one_ro(package_throttle_count); | 98 | define_therm_throt_sysdev_one_ro(package_throttle_count); |
91 | 99 | ||
100 | define_therm_throt_sysdev_show_func(package_power_limit, count); | ||
101 | define_therm_throt_sysdev_one_ro(package_power_limit_count); | ||
102 | |||
92 | static struct attribute *thermal_throttle_attrs[] = { | 103 | static struct attribute *thermal_throttle_attrs[] = { |
93 | &attr_core_throttle_count.attr, | 104 | &attr_core_throttle_count.attr, |
94 | NULL | 105 | NULL |
95 | }; | 106 | }; |
96 | 107 | ||
97 | static struct attribute_group thermal_throttle_attr_group = { | 108 | static struct attribute_group thermal_attr_group = { |
98 | .attrs = thermal_throttle_attrs, | 109 | .attrs = thermal_throttle_attrs, |
99 | .name = "thermal_throttle" | 110 | .name = "thermal_throttle" |
100 | }; | 111 | }; |
101 | #endif /* CONFIG_SYSFS */ | 112 | #endif /* CONFIG_SYSFS */ |
102 | 113 | ||
114 | #define CORE_LEVEL 0 | ||
115 | #define PACKAGE_LEVEL 1 | ||
116 | |||
103 | /*** | 117 | /*** |
104 | * therm_throt_process - Process thermal throttling event from interrupt | 118 | * therm_throt_process - Process thermal throttling event from interrupt |
105 | * @curr: Whether the condition is current or not (boolean), since the | 119 | * @curr: Whether the condition is current or not (boolean), since the |
@@ -116,49 +130,70 @@ static struct attribute_group thermal_throttle_attr_group = { | |||
116 | * 1 : Event should be logged further, and a message has been | 130 | * 1 : Event should be logged further, and a message has been |
117 | * printed to the syslog. | 131 | * printed to the syslog. |
118 | */ | 132 | */ |
119 | #define CORE_LEVEL 0 | 133 | static int therm_throt_process(bool new_event, int event, int level) |
120 | #define PACKAGE_LEVEL 1 | ||
121 | static int therm_throt_process(bool is_throttled, int level) | ||
122 | { | 134 | { |
123 | struct _thermal_state *state; | 135 | struct _thermal_state *state; |
124 | unsigned int this_cpu; | 136 | unsigned int this_cpu = smp_processor_id(); |
125 | bool was_throttled; | 137 | bool old_event; |
126 | u64 now; | 138 | u64 now; |
139 | struct thermal_state *pstate = &per_cpu(thermal_state, this_cpu); | ||
127 | 140 | ||
128 | this_cpu = smp_processor_id(); | ||
129 | now = get_jiffies_64(); | 141 | now = get_jiffies_64(); |
130 | if (level == CORE_LEVEL) | 142 | if (level == CORE_LEVEL) { |
131 | state = &per_cpu(thermal_state, this_cpu).core; | 143 | if (event == THERMAL_THROTTLING_EVENT) |
132 | else | 144 | state = &pstate->core_throttle; |
133 | state = &per_cpu(thermal_state, this_cpu).package; | 145 | else if (event == POWER_LIMIT_EVENT) |
146 | state = &pstate->core_power_limit; | ||
147 | else | ||
148 | return 0; | ||
149 | } else if (level == PACKAGE_LEVEL) { | ||
150 | if (event == THERMAL_THROTTLING_EVENT) | ||
151 | state = &pstate->package_throttle; | ||
152 | else if (event == POWER_LIMIT_EVENT) | ||
153 | state = &pstate->package_power_limit; | ||
154 | else | ||
155 | return 0; | ||
156 | } else | ||
157 | return 0; | ||
134 | 158 | ||
135 | was_throttled = state->is_throttled; | 159 | old_event = state->new_event; |
136 | state->is_throttled = is_throttled; | 160 | state->new_event = new_event; |
137 | 161 | ||
138 | if (is_throttled) | 162 | if (new_event) |
139 | state->throttle_count++; | 163 | state->count++; |
140 | 164 | ||
141 | if (time_before64(now, state->next_check) && | 165 | if (time_before64(now, state->next_check) && |
142 | state->throttle_count != state->last_throttle_count) | 166 | state->count != state->last_count) |
143 | return 0; | 167 | return 0; |
144 | 168 | ||
145 | state->next_check = now + CHECK_INTERVAL; | 169 | state->next_check = now + CHECK_INTERVAL; |
146 | state->last_throttle_count = state->throttle_count; | 170 | state->last_count = state->count; |
147 | 171 | ||
148 | /* if we just entered the thermal event */ | 172 | /* if we just entered the thermal event */ |
149 | if (is_throttled) { | 173 | if (new_event) { |
150 | printk(KERN_CRIT "CPU%d: %s temperature above threshold, cpu clock throttled (total events = %lu)\n", | 174 | if (event == THERMAL_THROTTLING_EVENT) |
151 | this_cpu, | 175 | printk(KERN_CRIT "CPU%d: %s temperature above threshold, cpu clock throttled (total events = %lu)\n", |
152 | level == CORE_LEVEL ? "Core" : "Package", | 176 | this_cpu, |
153 | state->throttle_count); | 177 | level == CORE_LEVEL ? "Core" : "Package", |
178 | state->count); | ||
179 | else | ||
180 | printk(KERN_CRIT "CPU%d: %s power limit notification (total events = %lu)\n", | ||
181 | this_cpu, | ||
182 | level == CORE_LEVEL ? "Core" : "Package", | ||
183 | state->count); | ||
154 | 184 | ||
155 | add_taint(TAINT_MACHINE_CHECK); | 185 | add_taint(TAINT_MACHINE_CHECK); |
156 | return 1; | 186 | return 1; |
157 | } | 187 | } |
158 | if (was_throttled) { | 188 | if (old_event) { |
159 | printk(KERN_INFO "CPU%d: %s temperature/speed normal\n", | 189 | if (event == THERMAL_THROTTLING_EVENT) |
160 | this_cpu, | 190 | printk(KERN_INFO "CPU%d: %s temperature/speed normal\n", |
161 | level == CORE_LEVEL ? "Core" : "Package"); | 191 | this_cpu, |
192 | level == CORE_LEVEL ? "Core" : "Package"); | ||
193 | else | ||
194 | printk(KERN_INFO "CPU%d: %s power limit normal\n", | ||
195 | this_cpu, | ||
196 | level == CORE_LEVEL ? "Core" : "Package"); | ||
162 | return 1; | 197 | return 1; |
163 | } | 198 | } |
164 | 199 | ||
@@ -172,21 +207,29 @@ static __cpuinit int thermal_throttle_add_dev(struct sys_device *sys_dev) | |||
172 | int err; | 207 | int err; |
173 | struct cpuinfo_x86 *c = &cpu_data(smp_processor_id()); | 208 | struct cpuinfo_x86 *c = &cpu_data(smp_processor_id()); |
174 | 209 | ||
175 | err = sysfs_create_group(&sys_dev->kobj, &thermal_throttle_attr_group); | 210 | err = sysfs_create_group(&sys_dev->kobj, &thermal_attr_group); |
176 | if (err) | 211 | if (err) |
177 | return err; | 212 | return err; |
178 | 213 | ||
214 | if (cpu_has(c, X86_FEATURE_PLN)) | ||
215 | err = sysfs_add_file_to_group(&sys_dev->kobj, | ||
216 | &attr_core_power_limit_count.attr, | ||
217 | thermal_attr_group.name); | ||
179 | if (cpu_has(c, X86_FEATURE_PTS)) | 218 | if (cpu_has(c, X86_FEATURE_PTS)) |
180 | err = sysfs_add_file_to_group(&sys_dev->kobj, | 219 | err = sysfs_add_file_to_group(&sys_dev->kobj, |
181 | &attr_package_throttle_count.attr, | 220 | &attr_package_throttle_count.attr, |
182 | thermal_throttle_attr_group.name); | 221 | thermal_attr_group.name); |
222 | if (cpu_has(c, X86_FEATURE_PLN)) | ||
223 | err = sysfs_add_file_to_group(&sys_dev->kobj, | ||
224 | &attr_package_power_limit_count.attr, | ||
225 | thermal_attr_group.name); | ||
183 | 226 | ||
184 | return err; | 227 | return err; |
185 | } | 228 | } |
186 | 229 | ||
187 | static __cpuinit void thermal_throttle_remove_dev(struct sys_device *sys_dev) | 230 | static __cpuinit void thermal_throttle_remove_dev(struct sys_device *sys_dev) |
188 | { | 231 | { |
189 | sysfs_remove_group(&sys_dev->kobj, &thermal_throttle_attr_group); | 232 | sysfs_remove_group(&sys_dev->kobj, &thermal_attr_group); |
190 | } | 233 | } |
191 | 234 | ||
192 | /* Mutex protecting device creation against CPU hotplug: */ | 235 | /* Mutex protecting device creation against CPU hotplug: */ |
@@ -257,6 +300,17 @@ device_initcall(thermal_throttle_init_device); | |||
257 | 300 | ||
258 | #endif /* CONFIG_SYSFS */ | 301 | #endif /* CONFIG_SYSFS */ |
259 | 302 | ||
303 | /* | ||
304 | * Set up the most two significant bit to notify mce log that this thermal | ||
305 | * event type. | ||
306 | * This is a temp solution. May be changed in the future with mce log | ||
307 | * infrasture. | ||
308 | */ | ||
309 | #define CORE_THROTTLED (0) | ||
310 | #define CORE_POWER_LIMIT ((__u64)1 << 62) | ||
311 | #define PACKAGE_THROTTLED ((__u64)2 << 62) | ||
312 | #define PACKAGE_POWER_LIMIT ((__u64)3 << 62) | ||
313 | |||
260 | /* Thermal transition interrupt handler */ | 314 | /* Thermal transition interrupt handler */ |
261 | static void intel_thermal_interrupt(void) | 315 | static void intel_thermal_interrupt(void) |
262 | { | 316 | { |
@@ -264,21 +318,31 @@ static void intel_thermal_interrupt(void) | |||
264 | struct cpuinfo_x86 *c = &cpu_data(smp_processor_id()); | 318 | struct cpuinfo_x86 *c = &cpu_data(smp_processor_id()); |
265 | 319 | ||
266 | rdmsrl(MSR_IA32_THERM_STATUS, msr_val); | 320 | rdmsrl(MSR_IA32_THERM_STATUS, msr_val); |
321 | |||
267 | if (therm_throt_process(msr_val & THERM_STATUS_PROCHOT, | 322 | if (therm_throt_process(msr_val & THERM_STATUS_PROCHOT, |
323 | THERMAL_THROTTLING_EVENT, | ||
268 | CORE_LEVEL) != 0) | 324 | CORE_LEVEL) != 0) |
269 | mce_log_therm_throt_event(msr_val); | 325 | mce_log_therm_throt_event(CORE_THROTTLED | msr_val); |
326 | |||
327 | if (cpu_has(c, X86_FEATURE_PLN)) | ||
328 | if (therm_throt_process(msr_val & THERM_STATUS_POWER_LIMIT, | ||
329 | POWER_LIMIT_EVENT, | ||
330 | CORE_LEVEL) != 0) | ||
331 | mce_log_therm_throt_event(CORE_POWER_LIMIT | msr_val); | ||
270 | 332 | ||
271 | if (cpu_has(c, X86_FEATURE_PTS)) { | 333 | if (cpu_has(c, X86_FEATURE_PTS)) { |
272 | rdmsrl(MSR_IA32_PACKAGE_THERM_STATUS, msr_val); | 334 | rdmsrl(MSR_IA32_PACKAGE_THERM_STATUS, msr_val); |
273 | if (therm_throt_process(msr_val & PACKAGE_THERM_STATUS_PROCHOT, | 335 | if (therm_throt_process(msr_val & PACKAGE_THERM_STATUS_PROCHOT, |
336 | THERMAL_THROTTLING_EVENT, | ||
274 | PACKAGE_LEVEL) != 0) | 337 | PACKAGE_LEVEL) != 0) |
275 | /* | 338 | mce_log_therm_throt_event(PACKAGE_THROTTLED | msr_val); |
276 | * Set up the most significant bit to notify mce log | 339 | if (cpu_has(c, X86_FEATURE_PLN)) |
277 | * that this thermal event is a package level event. | 340 | if (therm_throt_process(msr_val & |
278 | * This is a temp solution. May be changed in the future | 341 | PACKAGE_THERM_STATUS_POWER_LIMIT, |
279 | * with mce log infrasture. | 342 | POWER_LIMIT_EVENT, |
280 | */ | 343 | PACKAGE_LEVEL) != 0) |
281 | mce_log_therm_throt_event(((__u64)1 << 63) | msr_val); | 344 | mce_log_therm_throt_event(PACKAGE_POWER_LIMIT |
345 | | msr_val); | ||
282 | } | 346 | } |
283 | } | 347 | } |
284 | 348 | ||
@@ -381,14 +445,25 @@ void intel_init_thermal(struct cpuinfo_x86 *c) | |||
381 | apic_write(APIC_LVTTHMR, h); | 445 | apic_write(APIC_LVTTHMR, h); |
382 | 446 | ||
383 | rdmsr(MSR_IA32_THERM_INTERRUPT, l, h); | 447 | rdmsr(MSR_IA32_THERM_INTERRUPT, l, h); |
384 | wrmsr(MSR_IA32_THERM_INTERRUPT, | 448 | if (cpu_has(c, X86_FEATURE_PLN)) |
385 | l | (THERM_INT_LOW_ENABLE | THERM_INT_HIGH_ENABLE), h); | 449 | wrmsr(MSR_IA32_THERM_INTERRUPT, |
450 | l | (THERM_INT_LOW_ENABLE | ||
451 | | THERM_INT_HIGH_ENABLE | THERM_INT_PLN_ENABLE), h); | ||
452 | else | ||
453 | wrmsr(MSR_IA32_THERM_INTERRUPT, | ||
454 | l | (THERM_INT_LOW_ENABLE | THERM_INT_HIGH_ENABLE), h); | ||
386 | 455 | ||
387 | if (cpu_has(c, X86_FEATURE_PTS)) { | 456 | if (cpu_has(c, X86_FEATURE_PTS)) { |
388 | rdmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, l, h); | 457 | rdmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, l, h); |
389 | wrmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, | 458 | if (cpu_has(c, X86_FEATURE_PLN)) |
390 | l | (PACKAGE_THERM_INT_LOW_ENABLE | 459 | wrmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, |
391 | | PACKAGE_THERM_INT_HIGH_ENABLE), h); | 460 | l | (PACKAGE_THERM_INT_LOW_ENABLE |
461 | | PACKAGE_THERM_INT_HIGH_ENABLE | ||
462 | | PACKAGE_THERM_INT_PLN_ENABLE), h); | ||
463 | else | ||
464 | wrmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, | ||
465 | l | (PACKAGE_THERM_INT_LOW_ENABLE | ||
466 | | PACKAGE_THERM_INT_HIGH_ENABLE), h); | ||
392 | } | 467 | } |
393 | 468 | ||
394 | smp_thermal_vector = intel_thermal_interrupt; | 469 | smp_thermal_vector = intel_thermal_interrupt; |