aboutsummaryrefslogtreecommitdiffstats
path: root/arch
diff options
context:
space:
mode:
author: Chen, Kenneth W <kenneth.w.chen@intel.com> 2005-11-15 17:37:05 -0500
committer: Linus Torvalds <torvalds@g5.osdl.org> 2005-11-15 18:50:51 -0500
commit: 1e185b97b4364063f1135604b87f8d8469944233 (patch)
tree: 0184e24ae1e9247b7dee62838b981c2d2a741d2e /arch
parent: 47227d50c4ba7d2308b30c19b14e6edf133d5aa8 (diff)
[PATCH] ia64: cpu_idle performance bug fix
Our performance validation on 2.6.15-rc1 caught a disastrous performance regression on ia64 with netperf (-98%) and volanomark (-58%) compared to the previous kernel version, 2.6.14-git7. See the following chart (result groups 1 & 2): http://kernel-perf.sourceforge.net/results.machine_id=26.html We have root-caused it to commit 64c7c8f88559624abdbe12b5da6502e8879f8d28. This changeset broke the ia64 task resched notification. In sched.c:resched_task(), a reschedule IPI is conditioned upon TIF_POLLING_NRFLAG. However, the above changeset unconditionally sets the polling thread flag for idle tasks, regardless of whether pal_halt_light is in use or not. As a result, the resched IPI is not sent from resched_task(). And since the default behavior on ia64 is to use pal_halt_light, we end up delaying the rescheduling of the task until the next timer tick, which causes the performance regression. This fixes the performance bug. I'm glad our performance suite is turning up bad performance bugs like this in time. Signed-off-by: Ken Chen <kenneth.w.chen@intel.com> Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Diffstat (limited to 'arch')
-rw-r--r-- arch/ia64/kernel/process.c | 15
1 files changed, 8 insertions, 7 deletions
diff --git a/arch/ia64/kernel/process.c b/arch/ia64/kernel/process.c
index e92ea64d8040..4305d2ba76f6 100644
--- a/arch/ia64/kernel/process.c
+++ b/arch/ia64/kernel/process.c
@@ -202,12 +202,9 @@ default_idle (void)
202{ 202{
203 local_irq_enable(); 203 local_irq_enable();
204 while (!need_resched()) { 204 while (!need_resched()) {
205 if (can_do_pal_halt) { 205 if (can_do_pal_halt)
206 local_irq_disable(); 206 safe_halt();
207 if (!need_resched()) 207 else
208 safe_halt();
209 local_irq_enable();
210 } else
211 cpu_relax(); 208 cpu_relax();
212 } 209 }
213} 210}
@@ -272,10 +269,14 @@ cpu_idle (void)
272{ 269{
273 void (*mark_idle)(int) = ia64_mark_idle; 270 void (*mark_idle)(int) = ia64_mark_idle;
274 int cpu = smp_processor_id(); 271 int cpu = smp_processor_id();
275 set_thread_flag(TIF_POLLING_NRFLAG);
276 272
277 /* endless idle loop with no priority at all */ 273 /* endless idle loop with no priority at all */
278 while (1) { 274 while (1) {
275 if (can_do_pal_halt)
276 clear_thread_flag(TIF_POLLING_NRFLAG);
277 else
278 set_thread_flag(TIF_POLLING_NRFLAG);
279
279 if (!need_resched()) { 280 if (!need_resched()) {
280 void (*idle)(void); 281 void (*idle)(void);
281#ifdef CONFIG_SMP 282#ifdef CONFIG_SMP