diff options
author | Chen, Kenneth W <kenneth.w.chen@intel.com> | 2005-11-15 17:37:05 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@g5.osdl.org> | 2005-11-15 18:50:51 -0500 |
commit | 1e185b97b4364063f1135604b87f8d8469944233 (patch) | |
tree | 0184e24ae1e9247b7dee62838b981c2d2a741d2e | |
parent | 47227d50c4ba7d2308b30c19b14e6edf133d5aa8 (diff) |
[PATCH] ia64: cpu_idle performance bug fix
Our performance validation on 2.6.15-rc1 caught a disastrous performance
regression on ia64 with netperf (-98%) and volanomark (-58%) compared to
the previous kernel version, 2.6.14-git7. See the following chart (result
groups 1 & 2).
http://kernel-perf.sourceforge.net/results.machine_id=26.html
We have root-caused it to commit 64c7c8f88559624abdbe12b5da6502e8879f8d28.
This changeset broke the ia64 task resched notification. In
sched.c:resched_task(), a reschedule IPI is sent only when the target
task does not have TIF_POLLING_NRFLAG set. However, the above changeset
unconditionally sets the polling thread flag for idle tasks, regardless of
whether pal_halt_light is in use or not. As a result, the resched IPI is
not sent from resched_task(). And since the default behavior on ia64 is to
use pal_halt_light, we end up delaying the reschedule of the task until the
next timer tick, which causes the performance regression.
This fixes the performance bug. I'm glad our performance suite is
turning up bad performance bugs like this in time.
Signed-off-by: Ken Chen <kenneth.w.chen@intel.com>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
-rw-r--r-- | arch/ia64/kernel/process.c | 15 |
1 files changed, 8 insertions, 7 deletions
diff --git a/arch/ia64/kernel/process.c b/arch/ia64/kernel/process.c index e92ea64d8040..4305d2ba76f6 100644 --- a/arch/ia64/kernel/process.c +++ b/arch/ia64/kernel/process.c | |||
@@ -202,12 +202,9 @@ default_idle (void) | |||
202 | { | 202 | { |
203 | local_irq_enable(); | 203 | local_irq_enable(); |
204 | while (!need_resched()) { | 204 | while (!need_resched()) { |
205 | if (can_do_pal_halt) { | 205 | if (can_do_pal_halt) |
206 | local_irq_disable(); | 206 | safe_halt(); |
207 | if (!need_resched()) | 207 | else |
208 | safe_halt(); | ||
209 | local_irq_enable(); | ||
210 | } else | ||
211 | cpu_relax(); | 208 | cpu_relax(); |
212 | } | 209 | } |
213 | } | 210 | } |
@@ -272,10 +269,14 @@ cpu_idle (void) | |||
272 | { | 269 | { |
273 | void (*mark_idle)(int) = ia64_mark_idle; | 270 | void (*mark_idle)(int) = ia64_mark_idle; |
274 | int cpu = smp_processor_id(); | 271 | int cpu = smp_processor_id(); |
275 | set_thread_flag(TIF_POLLING_NRFLAG); | ||
276 | 272 | ||
277 | /* endless idle loop with no priority at all */ | 273 | /* endless idle loop with no priority at all */ |
278 | while (1) { | 274 | while (1) { |
275 | if (can_do_pal_halt) | ||
276 | clear_thread_flag(TIF_POLLING_NRFLAG); | ||
277 | else | ||
278 | set_thread_flag(TIF_POLLING_NRFLAG); | ||
279 | |||
279 | if (!need_resched()) { | 280 | if (!need_resched()) { |
280 | void (*idle)(void); | 281 | void (*idle)(void); |
281 | #ifdef CONFIG_SMP | 282 | #ifdef CONFIG_SMP |