diff options
author | Ingo Molnar <mingo@elte.hu> | 2005-09-10 03:25:56 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@g5.osdl.org> | 2005-09-10 13:06:21 -0400 |
commit | fb1c8f93d869b34cacb8b8932e2b83d96a19d720 (patch) | |
tree | a006d078aa02e421a7dc4793c335308204859d36 /lib | |
parent | 4327edf6b8a7ac7dce144313947995538842d8fd (diff) |
[PATCH] spinlock consolidation
This patch (written by me and also containing many suggestions of Arjan van
de Ven) does a major cleanup of the spinlock code. It does the following
things:
- consolidates and enhances the spinlock/rwlock debugging code
- simplifies the asm/spinlock.h files
- encapsulates the raw spinlock type and moves generic spinlock
features (such as ->break_lock) into the generic code.
- cleans up the spinlock code hierarchy to get rid of the spaghetti.
Most notably there's now only a single variant of the debugging code,
located in lib/spinlock_debug.c. (previously we had one SMP debugging
variant per architecture, plus a separate generic one for UP builds)
Also, I've enhanced the rwlock debugging facility; it will now track
write-owners. There is new spinlock-owner/CPU-tracking on SMP builds too.
All locks have lockup detection now, which will work for both soft and hard
spin/rwlock lockups.
The arch-level include files now only contain the minimally necessary
subset of the spinlock code - all the rest that can be generalized now
lives in the generic headers:
include/asm-i386/spinlock_types.h | 16
include/asm-x86_64/spinlock_types.h | 16
I have also split up the various spinlock variants into separate files,
making it easier to see which does what. The new layout is:
SMP | UP
----------------------------|-----------------------------------
asm/spinlock_types.h | linux/spinlock_types_up.h
linux/spinlock_types.h | linux/spinlock_types.h
asm/spinlock.h | linux/spinlock_up.h
linux/spinlock_api_smp.h | linux/spinlock_api_up.h
linux/spinlock.h | linux/spinlock.h
/*
* here's the role of the various spinlock/rwlock related include files:
*
* on SMP builds:
*
* asm/spinlock_types.h: contains the raw_spinlock_t/raw_rwlock_t and the
* initializers
*
* linux/spinlock_types.h:
* defines the generic type and initializers
*
* asm/spinlock.h: contains the __raw_spin_*()/etc. lowlevel
* implementations, mostly inline assembly code
*
* (also included on UP-debug builds:)
*
* linux/spinlock_api_smp.h:
* contains the prototypes for the _spin_*() APIs.
*
* linux/spinlock.h: builds the final spin_*() APIs.
*
* on UP builds:
*
* linux/spinlock_types_up.h:
* contains the generic, simplified UP spinlock type.
* (which is an empty structure on non-debug builds)
*
* linux/spinlock_types.h:
* defines the generic type and initializers
*
* linux/spinlock_up.h:
* contains the __raw_spin_*()/etc. version of UP
* builds. (which are NOPs on non-debug, non-preempt
* builds)
*
* (included on UP-non-debug builds:)
*
* linux/spinlock_api_up.h:
* builds the _spin_*() APIs.
*
* linux/spinlock.h: builds the final spin_*() APIs.
*/
All SMP and UP architectures are converted by this patch.
arm, i386, ia64, ppc, ppc64, s390/s390x and x86_64 were build-tested via
cross-compilers. m32r, mips, sh and sparc have not been tested yet, but should
be mostly fine.
From: Grant Grundler <grundler@parisc-linux.org>
Booted and lightly tested on a500-44 (64-bit, SMP kernel, dual CPU).
Builds 32-bit SMP kernel (not booted or tested). I did not try to build
non-SMP kernels. That should be trivial to fix up later if necessary.
I converted bit ops atomic_hash lock to raw_spinlock_t. Doing so avoids
some ugly nesting of linux/*.h and asm/*.h files. Those particular locks
are well tested and contained entirely inside arch specific code. I do NOT
expect any new issues to arise with them.
If someone does ever need to use debug/metrics with them, then they will
need to unravel this hairball between spinlocks, atomic ops, and bit ops
that exist only because parisc has exactly one atomic instruction: LDCW
(load and clear word).
From: "Luck, Tony" <tony.luck@intel.com>
ia64 fix
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Arjan van de Ven <arjanv@infradead.org>
Signed-off-by: Grant Grundler <grundler@parisc-linux.org>
Cc: Matthew Wilcox <willy@debian.org>
Signed-off-by: Hirokazu Takata <takata@linux-m32r.org>
Signed-off-by: Mikael Pettersson <mikpe@csd.uu.se>
Signed-off-by: Benoit Boissinot <benoit.boissinot@ens-lyon.org>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Diffstat (limited to 'lib')
-rw-r--r-- | lib/Makefile | 1 | ||||
-rw-r--r-- | lib/dec_and_lock.c | 3 | ||||
-rw-r--r-- | lib/kernel_lock.c | 3 | ||||
-rw-r--r-- | lib/spinlock_debug.c | 257 |
4 files changed, 259 insertions, 5 deletions
diff --git a/lib/Makefile b/lib/Makefile index d9c38ba05e7b..44a46750690a 100644 --- a/lib/Makefile +++ b/lib/Makefile | |||
@@ -16,6 +16,7 @@ CFLAGS_kobject.o += -DDEBUG | |||
16 | CFLAGS_kobject_uevent.o += -DDEBUG | 16 | CFLAGS_kobject_uevent.o += -DDEBUG |
17 | endif | 17 | endif |
18 | 18 | ||
19 | obj-$(CONFIG_DEBUG_SPINLOCK) += spinlock_debug.o | ||
19 | lib-$(CONFIG_RWSEM_GENERIC_SPINLOCK) += rwsem-spinlock.o | 20 | lib-$(CONFIG_RWSEM_GENERIC_SPINLOCK) += rwsem-spinlock.o |
20 | lib-$(CONFIG_RWSEM_XCHGADD_ALGORITHM) += rwsem.o | 21 | lib-$(CONFIG_RWSEM_XCHGADD_ALGORITHM) += rwsem.o |
21 | lib-$(CONFIG_SEMAPHORE_SLEEPERS) += semaphore-sleepers.o | 22 | lib-$(CONFIG_SEMAPHORE_SLEEPERS) += semaphore-sleepers.o |
diff --git a/lib/dec_and_lock.c b/lib/dec_and_lock.c index 6658d81e1836..2377af057d09 100644 --- a/lib/dec_and_lock.c +++ b/lib/dec_and_lock.c | |||
@@ -25,8 +25,6 @@ | |||
25 | * this is trivially done efficiently using a load-locked | 25 | * this is trivially done efficiently using a load-locked |
26 | * store-conditional approach, for example. | 26 | * store-conditional approach, for example. |
27 | */ | 27 | */ |
28 | |||
29 | #ifndef ATOMIC_DEC_AND_LOCK | ||
30 | int _atomic_dec_and_lock(atomic_t *atomic, spinlock_t *lock) | 28 | int _atomic_dec_and_lock(atomic_t *atomic, spinlock_t *lock) |
31 | { | 29 | { |
32 | spin_lock(lock); | 30 | spin_lock(lock); |
@@ -37,4 +35,3 @@ int _atomic_dec_and_lock(atomic_t *atomic, spinlock_t *lock) | |||
37 | } | 35 | } |
38 | 36 | ||
39 | EXPORT_SYMBOL(_atomic_dec_and_lock); | 37 | EXPORT_SYMBOL(_atomic_dec_and_lock); |
40 | #endif | ||
diff --git a/lib/kernel_lock.c b/lib/kernel_lock.c index bd2bc5d887b8..cb5490ec00f2 100644 --- a/lib/kernel_lock.c +++ b/lib/kernel_lock.c | |||
@@ -177,8 +177,7 @@ static inline void __lock_kernel(void) | |||
177 | 177 | ||
178 | static inline void __unlock_kernel(void) | 178 | static inline void __unlock_kernel(void) |
179 | { | 179 | { |
180 | _raw_spin_unlock(&kernel_flag); | 180 | spin_unlock(&kernel_flag); |
181 | preempt_enable(); | ||
182 | } | 181 | } |
183 | 182 | ||
184 | /* | 183 | /* |
diff --git a/lib/spinlock_debug.c b/lib/spinlock_debug.c new file mode 100644 index 000000000000..906ad101eab3 --- /dev/null +++ b/lib/spinlock_debug.c | |||
@@ -0,0 +1,257 @@ | |||
1 | /* | ||
2 | * Copyright 2005, Red Hat, Inc., Ingo Molnar | ||
3 | * Released under the General Public License (GPL). | ||
4 | * | ||
5 | * This file contains the spinlock/rwlock implementations for | ||
6 | * DEBUG_SPINLOCK. | ||
7 | */ | ||
8 | |||
9 | #include <linux/config.h> | ||
10 | #include <linux/spinlock.h> | ||
11 | #include <linux/interrupt.h> | ||
12 | #include <linux/delay.h> | ||
13 | |||
14 | static void spin_bug(spinlock_t *lock, const char *msg) | ||
15 | { | ||
16 | static long print_once = 1; | ||
17 | struct task_struct *owner = NULL; | ||
18 | |||
19 | if (xchg(&print_once, 0)) { | ||
20 | if (lock->owner && lock->owner != SPINLOCK_OWNER_INIT) | ||
21 | owner = lock->owner; | ||
22 | printk("BUG: spinlock %s on CPU#%d, %s/%d\n", | ||
23 | msg, smp_processor_id(), current->comm, current->pid); | ||
24 | printk(" lock: %p, .magic: %08x, .owner: %s/%d, .owner_cpu: %d\n", | ||
25 | lock, lock->magic, | ||
26 | owner ? owner->comm : "<none>", | ||
27 | owner ? owner->pid : -1, | ||
28 | lock->owner_cpu); | ||
29 | dump_stack(); | ||
30 | #ifdef CONFIG_SMP | ||
31 | /* | ||
32 | * We cannot continue on SMP: | ||
33 | */ | ||
34 | // panic("bad locking"); | ||
35 | #endif | ||
36 | } | ||
37 | } | ||
38 | |||
39 | #define SPIN_BUG_ON(cond, lock, msg) if (unlikely(cond)) spin_bug(lock, msg) | ||
40 | |||
41 | static inline void debug_spin_lock_before(spinlock_t *lock) | ||
42 | { | ||
43 | SPIN_BUG_ON(lock->magic != SPINLOCK_MAGIC, lock, "bad magic"); | ||
44 | SPIN_BUG_ON(lock->owner == current, lock, "recursion"); | ||
45 | SPIN_BUG_ON(lock->owner_cpu == raw_smp_processor_id(), | ||
46 | lock, "cpu recursion"); | ||
47 | } | ||
48 | |||
49 | static inline void debug_spin_lock_after(spinlock_t *lock) | ||
50 | { | ||
51 | lock->owner_cpu = raw_smp_processor_id(); | ||
52 | lock->owner = current; | ||
53 | } | ||
54 | |||
55 | static inline void debug_spin_unlock(spinlock_t *lock) | ||
56 | { | ||
57 | SPIN_BUG_ON(lock->magic != SPINLOCK_MAGIC, lock, "bad magic"); | ||
58 | SPIN_BUG_ON(!spin_is_locked(lock), lock, "already unlocked"); | ||
59 | SPIN_BUG_ON(lock->owner != current, lock, "wrong owner"); | ||
60 | SPIN_BUG_ON(lock->owner_cpu != raw_smp_processor_id(), | ||
61 | lock, "wrong CPU"); | ||
62 | lock->owner = SPINLOCK_OWNER_INIT; | ||
63 | lock->owner_cpu = -1; | ||
64 | } | ||
65 | |||
66 | static void __spin_lock_debug(spinlock_t *lock) | ||
67 | { | ||
68 | int print_once = 1; | ||
69 | u64 i; | ||
70 | |||
71 | for (;;) { | ||
72 | for (i = 0; i < loops_per_jiffy * HZ; i++) { | ||
73 | cpu_relax(); | ||
74 | if (__raw_spin_trylock(&lock->raw_lock)) | ||
75 | return; | ||
76 | } | ||
77 | /* lockup suspected: */ | ||
78 | if (print_once) { | ||
79 | print_once = 0; | ||
80 | printk("BUG: spinlock lockup on CPU#%d, %s/%d, %p\n", | ||
81 | smp_processor_id(), current->comm, current->pid, | ||
82 | lock); | ||
83 | dump_stack(); | ||
84 | } | ||
85 | } | ||
86 | } | ||
87 | |||
88 | void _raw_spin_lock(spinlock_t *lock) | ||
89 | { | ||
90 | debug_spin_lock_before(lock); | ||
91 | if (unlikely(!__raw_spin_trylock(&lock->raw_lock))) | ||
92 | __spin_lock_debug(lock); | ||
93 | debug_spin_lock_after(lock); | ||
94 | } | ||
95 | |||
96 | int _raw_spin_trylock(spinlock_t *lock) | ||
97 | { | ||
98 | int ret = __raw_spin_trylock(&lock->raw_lock); | ||
99 | |||
100 | if (ret) | ||
101 | debug_spin_lock_after(lock); | ||
102 | #ifndef CONFIG_SMP | ||
103 | /* | ||
104 | * Must not happen on UP: | ||
105 | */ | ||
106 | SPIN_BUG_ON(!ret, lock, "trylock failure on UP"); | ||
107 | #endif | ||
108 | return ret; | ||
109 | } | ||
110 | |||
111 | void _raw_spin_unlock(spinlock_t *lock) | ||
112 | { | ||
113 | debug_spin_unlock(lock); | ||
114 | __raw_spin_unlock(&lock->raw_lock); | ||
115 | } | ||
116 | |||
117 | static void rwlock_bug(rwlock_t *lock, const char *msg) | ||
118 | { | ||
119 | static long print_once = 1; | ||
120 | |||
121 | if (xchg(&print_once, 0)) { | ||
122 | printk("BUG: rwlock %s on CPU#%d, %s/%d, %p\n", msg, | ||
123 | smp_processor_id(), current->comm, current->pid, lock); | ||
124 | dump_stack(); | ||
125 | #ifdef CONFIG_SMP | ||
126 | /* | ||
127 | * We cannot continue on SMP: | ||
128 | */ | ||
129 | panic("bad locking"); | ||
130 | #endif | ||
131 | } | ||
132 | } | ||
133 | |||
134 | #define RWLOCK_BUG_ON(cond, lock, msg) if (unlikely(cond)) rwlock_bug(lock, msg) | ||
135 | |||
136 | static void __read_lock_debug(rwlock_t *lock) | ||
137 | { | ||
138 | int print_once = 1; | ||
139 | u64 i; | ||
140 | |||
141 | for (;;) { | ||
142 | for (i = 0; i < loops_per_jiffy * HZ; i++) { | ||
143 | cpu_relax(); | ||
144 | if (__raw_read_trylock(&lock->raw_lock)) | ||
145 | return; | ||
146 | } | ||
147 | /* lockup suspected: */ | ||
148 | if (print_once) { | ||
149 | print_once = 0; | ||
150 | printk("BUG: read-lock lockup on CPU#%d, %s/%d, %p\n", | ||
151 | smp_processor_id(), current->comm, current->pid, | ||
152 | lock); | ||
153 | dump_stack(); | ||
154 | } | ||
155 | } | ||
156 | } | ||
157 | |||
158 | void _raw_read_lock(rwlock_t *lock) | ||
159 | { | ||
160 | RWLOCK_BUG_ON(lock->magic != RWLOCK_MAGIC, lock, "bad magic"); | ||
161 | if (unlikely(!__raw_read_trylock(&lock->raw_lock))) | ||
162 | __read_lock_debug(lock); | ||
163 | } | ||
164 | |||
165 | int _raw_read_trylock(rwlock_t *lock) | ||
166 | { | ||
167 | int ret = __raw_read_trylock(&lock->raw_lock); | ||
168 | |||
169 | #ifndef CONFIG_SMP | ||
170 | /* | ||
171 | * Must not happen on UP: | ||
172 | */ | ||
173 | RWLOCK_BUG_ON(!ret, lock, "trylock failure on UP"); | ||
174 | #endif | ||
175 | return ret; | ||
176 | } | ||
177 | |||
178 | void _raw_read_unlock(rwlock_t *lock) | ||
179 | { | ||
180 | RWLOCK_BUG_ON(lock->magic != RWLOCK_MAGIC, lock, "bad magic"); | ||
181 | __raw_read_unlock(&lock->raw_lock); | ||
182 | } | ||
183 | |||
184 | static inline void debug_write_lock_before(rwlock_t *lock) | ||
185 | { | ||
186 | RWLOCK_BUG_ON(lock->magic != RWLOCK_MAGIC, lock, "bad magic"); | ||
187 | RWLOCK_BUG_ON(lock->owner == current, lock, "recursion"); | ||
188 | RWLOCK_BUG_ON(lock->owner_cpu == raw_smp_processor_id(), | ||
189 | lock, "cpu recursion"); | ||
190 | } | ||
191 | |||
192 | static inline void debug_write_lock_after(rwlock_t *lock) | ||
193 | { | ||
194 | lock->owner_cpu = raw_smp_processor_id(); | ||
195 | lock->owner = current; | ||
196 | } | ||
197 | |||
198 | static inline void debug_write_unlock(rwlock_t *lock) | ||
199 | { | ||
200 | RWLOCK_BUG_ON(lock->magic != RWLOCK_MAGIC, lock, "bad magic"); | ||
201 | RWLOCK_BUG_ON(lock->owner != current, lock, "wrong owner"); | ||
202 | RWLOCK_BUG_ON(lock->owner_cpu != raw_smp_processor_id(), | ||
203 | lock, "wrong CPU"); | ||
204 | lock->owner = SPINLOCK_OWNER_INIT; | ||
205 | lock->owner_cpu = -1; | ||
206 | } | ||
207 | |||
208 | static void __write_lock_debug(rwlock_t *lock) | ||
209 | { | ||
210 | int print_once = 1; | ||
211 | u64 i; | ||
212 | |||
213 | for (;;) { | ||
214 | for (i = 0; i < loops_per_jiffy * HZ; i++) { | ||
215 | cpu_relax(); | ||
216 | if (__raw_write_trylock(&lock->raw_lock)) | ||
217 | return; | ||
218 | } | ||
219 | /* lockup suspected: */ | ||
220 | if (print_once) { | ||
221 | print_once = 0; | ||
222 | printk("BUG: write-lock lockup on CPU#%d, %s/%d, %p\n", | ||
223 | smp_processor_id(), current->comm, current->pid, | ||
224 | lock); | ||
225 | dump_stack(); | ||
226 | } | ||
227 | } | ||
228 | } | ||
229 | |||
230 | void _raw_write_lock(rwlock_t *lock) | ||
231 | { | ||
232 | debug_write_lock_before(lock); | ||
233 | if (unlikely(!__raw_write_trylock(&lock->raw_lock))) | ||
234 | __write_lock_debug(lock); | ||
235 | debug_write_lock_after(lock); | ||
236 | } | ||
237 | |||
238 | int _raw_write_trylock(rwlock_t *lock) | ||
239 | { | ||
240 | int ret = __raw_write_trylock(&lock->raw_lock); | ||
241 | |||
242 | if (ret) | ||
243 | debug_write_lock_after(lock); | ||
244 | #ifndef CONFIG_SMP | ||
245 | /* | ||
246 | * Must not happen on UP: | ||
247 | */ | ||
248 | RWLOCK_BUG_ON(!ret, lock, "trylock failure on UP"); | ||
249 | #endif | ||
250 | return ret; | ||
251 | } | ||
252 | |||
253 | void _raw_write_unlock(rwlock_t *lock) | ||
254 | { | ||
255 | debug_write_unlock(lock); | ||
256 | __raw_write_unlock(&lock->raw_lock); | ||
257 | } | ||