aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Ravikiran G Thirumalai <kiran@scalex86.org> 2007-10-17 02:26:09 -0400
committer Linus Torvalds <torvalds@woody.linux-foundation.org> 2007-10-17 11:42:47 -0400
commit c4f3b63fe15b4629aa1ec163c95ab30423d0f76a (patch)
tree 432723f1c7ac2fcff0aa57377c31187140d69145
parent a5f2ce3c6024a5bb895647b6bd88ecae5001020a (diff)
softlockup: add a /proc tuning parameter
Control the trigger limit for softlockup warnings. This is useful for
debugging softlockups, by lowering the softlockup_thresh to identify
possible softlockups earlier.

This patch:
1. Adds a sysctl softlockup_thresh with valid values of 1-60s
   (Higher value to disable false positives)
2. Changes the softlockup printk to print the cpu softlockup time

[akpm@linux-foundation.org: Fix various warnings and add definition of "two"]
Signed-off-by: Ravikiran Thirumalai <kiran@scalex86.org>
Signed-off-by: Shai Fultheim <shai@scalex86.org>
Acked-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
-rw-r--r-- Documentation/sysctl/kernel.txt 8
-rw-r--r-- include/linux/sched.h 1
-rw-r--r-- kernel/softlockup.c 7
-rw-r--r-- kernel/sysctl.c 33
4 files changed, 40 insertions, 9 deletions
diff --git a/Documentation/sysctl/kernel.txt b/Documentation/sysctl/kernel.txt
index 111fd28727ec..8984a5396271 100644
--- a/Documentation/sysctl/kernel.txt
+++ b/Documentation/sysctl/kernel.txt
@@ -320,6 +320,14 @@ kernel. This value defaults to SHMMAX.
320 320
321============================================================== 321==============================================================
322 322
323softlockup_thresh:
324
325This value can be used to lower or raise the softlockup tolerance
326threshold. The default threshold is 10s. If a cpu is locked up for
327longer than the threshold, the kernel complains. Valid values are 1-60s.
328
329==============================================================
330
323tainted: 331tainted:
324 332
325Non-zero if the kernel has been tainted. Numeric values, which 333Non-zero if the kernel has been tainted. Numeric values, which
diff --git a/include/linux/sched.h b/include/linux/sched.h
index 59738efff8ad..e643357eda05 100644
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -261,6 +261,7 @@ extern void softlockup_tick(void);
261extern void spawn_softlockup_task(void); 261extern void spawn_softlockup_task(void);
262extern void touch_softlockup_watchdog(void); 262extern void touch_softlockup_watchdog(void);
263extern void touch_all_softlockup_watchdogs(void); 263extern void touch_all_softlockup_watchdogs(void);
264extern int softlockup_thresh;
264#else 265#else
265static inline void softlockup_tick(void) 266static inline void softlockup_tick(void)
266{ 267{
diff --git a/kernel/softlockup.c b/kernel/softlockup.c
index 72c2561ff5f8..edeeef3a6a32 100644
--- a/kernel/softlockup.c
+++ b/kernel/softlockup.c
@@ -24,6 +24,7 @@ static DEFINE_PER_CPU(unsigned long, print_timestamp);
24static DEFINE_PER_CPU(struct task_struct *, watchdog_task); 24static DEFINE_PER_CPU(struct task_struct *, watchdog_task);
25 25
26static int did_panic; 26static int did_panic;
27int softlockup_thresh = 10;
27 28
28static int 29static int
29softlock_panic(struct notifier_block *this, unsigned long event, void *ptr) 30softlock_panic(struct notifier_block *this, unsigned long event, void *ptr)
@@ -104,13 +105,15 @@ void softlockup_tick(void)
104 wake_up_process(per_cpu(watchdog_task, this_cpu)); 105 wake_up_process(per_cpu(watchdog_task, this_cpu));
105 106
106 /* Warn about unreasonable 10+ seconds delays: */ 107 /* Warn about unreasonable 10+ seconds delays: */
107 if (now <= (touch_timestamp + 10)) 108 if (now <= (touch_timestamp + softlockup_thresh))
108 return; 109 return;
109 110
110 per_cpu(print_timestamp, this_cpu) = touch_timestamp; 111 per_cpu(print_timestamp, this_cpu) = touch_timestamp;
111 112
112 spin_lock(&print_lock); 113 spin_lock(&print_lock);
113 printk(KERN_ERR "BUG: soft lockup detected on CPU#%d!\n", this_cpu); 114 printk(KERN_ERR "BUG: soft lockup - CPU#%d stuck for %lus! [%s:%d]\n",
115 this_cpu, now - touch_timestamp,
116 current->comm, current->pid);
114 if (regs) 117 if (regs)
115 show_regs(regs); 118 show_regs(regs);
116 else 119 else
diff --git a/kernel/sysctl.c b/kernel/sysctl.c
index 5e63de0f9ee2..dde3d53e8adc 100644
--- a/kernel/sysctl.c
+++ b/kernel/sysctl.c
@@ -80,6 +80,19 @@ extern int maps_protect;
80extern int sysctl_stat_interval; 80extern int sysctl_stat_interval;
81extern int audit_argv_kb; 81extern int audit_argv_kb;
82 82
83/* Constants used for minimum and maximum */
84#ifdef CONFIG_DETECT_SOFTLOCKUP
85static int one = 1;
86static int sixty = 60;
87#endif
88
89#ifdef CONFIG_MMU
90static int two = 2;
91#endif
92
93static int zero;
94static int one_hundred = 100;
95
83/* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */ 96/* this is needed for the proc_dointvec_minmax for [fs_]overflow UID and GID */
84static int maxolduid = 65535; 97static int maxolduid = 65535;
85static int minolduid; 98static int minolduid;
@@ -711,6 +724,19 @@ static ctl_table kern_table[] = {
711 .proc_handler = &proc_dointvec, 724 .proc_handler = &proc_dointvec,
712 }, 725 },
713#endif 726#endif
727#ifdef CONFIG_DETECT_SOFTLOCKUP
728 {
729 .ctl_name = CTL_UNNUMBERED,
730 .procname = "softlockup_thresh",
731 .data = &softlockup_thresh,
732 .maxlen = sizeof(int),
733 .mode = 0644,
734 .proc_handler = &proc_dointvec_minmax,
735 .strategy = &sysctl_intvec,
736 .extra1 = &one,
737 .extra2 = &sixty,
738 },
739#endif
714#ifdef CONFIG_COMPAT 740#ifdef CONFIG_COMPAT
715 { 741 {
716 .ctl_name = KERN_COMPAT_LOG, 742 .ctl_name = KERN_COMPAT_LOG,
@@ -757,13 +783,6 @@ static ctl_table kern_table[] = {
757 { .ctl_name = 0 } 783 { .ctl_name = 0 }
758}; 784};
759 785
760/* Constants for minimum and maximum testing in vm_table.
761 We use these as one-element integer vectors. */
762static int zero;
763static int two = 2;
764static int one_hundred = 100;
765
766
767static ctl_table vm_table[] = { 786static ctl_table vm_table[] = {
768 { 787 {
769 .ctl_name = VM_OVERCOMMIT_MEMORY, 788 .ctl_name = VM_OVERCOMMIT_MEMORY,