aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorMartin Peschke <mpeschke@linux.vnet.ibm.com>2013-08-22 11:45:36 -0400
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>2013-08-29 12:47:39 -0400
commitbda5d1efa09527e443a6990f81459779a313e24d (patch)
tree87ba9935d1d07394feec2b36f52d4a5a58abb8c2
parent67bdd3c0dc4dc00fc1e708fc9f326304d88cc8be (diff)
SCSI: zfcp: fix lock imbalance by reworking request queue locking
commit d79ff142624e1be080ad8d09101f7004d79c36e1 upstream. This patch adds wait_event_interruptible_lock_irq_timeout(), which is a straight-forward descendant of wait_event_interruptible_timeout() and wait_event_interruptible_lock_irq(). The zfcp driver used to call wait_event_interruptible_timeout() in combination with some intricate and error-prone locking. Using wait_event_interruptible_lock_irq_timeout() as a replacement nicely cleans up that locking. This rework removes a situation that resulted in a locking imbalance in zfcp_qdio_sbal_get(): BUG: workqueue leaked lock or atomic: events/1/0xffffff00/10 last function: zfcp_fc_wka_port_offline+0x0/0xa0 [zfcp] It was introduced by commit c2af7545aaff3495d9bf9a7608c52f0af86fb194 "[SCSI] zfcp: Do not wait for SBALs on stopped queue", which had a new code path related to ZFCP_STATUS_ADAPTER_QDIOUP that took an early exit without a required lock being held. The problem occured when a special, non-SCSI I/O request was being submitted in process context, when the adapter's queues had been torn down. In this case the bug surfaced when the Fibre Channel port connection for a well-known address was closed during a concurrent adapter shut-down procedure, which is a rare constellation. This patch also fixes these warnings from the sparse tool (make C=1): drivers/s390/scsi/zfcp_qdio.c:224:12: warning: context imbalance in 'zfcp_qdio_sbal_check' - wrong count at exit drivers/s390/scsi/zfcp_qdio.c:244:5: warning: context imbalance in 'zfcp_qdio_sbal_get' - unexpected unlock Last but not least, we get rid of that crappy lock-unlock-lock sequence at the beginning of the critical section. It is okay to call zfcp_erp_adapter_reopen() with req_q_lock held. Reported-by: Mikulas Patocka <mpatocka@redhat.com> Reported-by: Heiko Carstens <heiko.carstens@de.ibm.com> Signed-off-by: Martin Peschke <mpeschke@linux.vnet.ibm.com> Signed-off-by: Steffen Maier <maier@linux.vnet.ibm.com> Signed-off-by: James Bottomley <JBottomley@Parallels.com> Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
-rw-r--r--drivers/s390/scsi/zfcp_qdio.c8
-rw-r--r--include/linux/wait.h57
2 files changed, 59 insertions, 6 deletions
diff --git a/drivers/s390/scsi/zfcp_qdio.c b/drivers/s390/scsi/zfcp_qdio.c
index 665e3cfaaf85..de0598eaacd2 100644
--- a/drivers/s390/scsi/zfcp_qdio.c
+++ b/drivers/s390/scsi/zfcp_qdio.c
@@ -224,11 +224,9 @@ int zfcp_qdio_sbals_from_sg(struct zfcp_qdio *qdio, struct zfcp_qdio_req *q_req,
224 224
225static int zfcp_qdio_sbal_check(struct zfcp_qdio *qdio) 225static int zfcp_qdio_sbal_check(struct zfcp_qdio *qdio)
226{ 226{
227 spin_lock_irq(&qdio->req_q_lock);
228 if (atomic_read(&qdio->req_q_free) || 227 if (atomic_read(&qdio->req_q_free) ||
229 !(atomic_read(&qdio->adapter->status) & ZFCP_STATUS_ADAPTER_QDIOUP)) 228 !(atomic_read(&qdio->adapter->status) & ZFCP_STATUS_ADAPTER_QDIOUP))
230 return 1; 229 return 1;
231 spin_unlock_irq(&qdio->req_q_lock);
232 return 0; 230 return 0;
233} 231}
234 232
@@ -246,9 +244,8 @@ int zfcp_qdio_sbal_get(struct zfcp_qdio *qdio)
246{ 244{
247 long ret; 245 long ret;
248 246
249 spin_unlock_irq(&qdio->req_q_lock); 247 ret = wait_event_interruptible_lock_irq_timeout(qdio->req_q_wq,
250 ret = wait_event_interruptible_timeout(qdio->req_q_wq, 248 zfcp_qdio_sbal_check(qdio), qdio->req_q_lock, 5 * HZ);
251 zfcp_qdio_sbal_check(qdio), 5 * HZ);
252 249
253 if (!(atomic_read(&qdio->adapter->status) & ZFCP_STATUS_ADAPTER_QDIOUP)) 250 if (!(atomic_read(&qdio->adapter->status) & ZFCP_STATUS_ADAPTER_QDIOUP))
254 return -EIO; 251 return -EIO;
@@ -262,7 +259,6 @@ int zfcp_qdio_sbal_get(struct zfcp_qdio *qdio)
262 zfcp_erp_adapter_reopen(qdio->adapter, 0, "qdsbg_1"); 259 zfcp_erp_adapter_reopen(qdio->adapter, 0, "qdsbg_1");
263 } 260 }
264 261
265 spin_lock_irq(&qdio->req_q_lock);
266 return -EIO; 262 return -EIO;
267} 263}
268 264
diff --git a/include/linux/wait.h b/include/linux/wait.h
index 1133695eb067..c8e576022234 100644
--- a/include/linux/wait.h
+++ b/include/linux/wait.h
@@ -805,6 +805,63 @@ do { \
805 __ret; \ 805 __ret; \
806}) 806})
807 807
808#define __wait_event_interruptible_lock_irq_timeout(wq, condition, \
809 lock, ret) \
810do { \
811 DEFINE_WAIT(__wait); \
812 \
813 for (;;) { \
814 prepare_to_wait(&wq, &__wait, TASK_INTERRUPTIBLE); \
815 if (condition) \
816 break; \
817 if (signal_pending(current)) { \
818 ret = -ERESTARTSYS; \
819 break; \
820 } \
821 spin_unlock_irq(&lock); \
822 ret = schedule_timeout(ret); \
823 spin_lock_irq(&lock); \
824 if (!ret) \
825 break; \
826 } \
827 finish_wait(&wq, &__wait); \
828} while (0)
829
830/**
831 * wait_event_interruptible_lock_irq_timeout - sleep until a condition gets true or a timeout elapses.
832 * The condition is checked under the lock. This is expected
833 * to be called with the lock taken.
834 * @wq: the waitqueue to wait on
835 * @condition: a C expression for the event to wait for
836 * @lock: a locked spinlock_t, which will be released before schedule()
837 * and reacquired afterwards.
838 * @timeout: timeout, in jiffies
839 *
840 * The process is put to sleep (TASK_INTERRUPTIBLE) until the
841 * @condition evaluates to true or signal is received. The @condition is
842 * checked each time the waitqueue @wq is woken up.
843 *
844 * wake_up() has to be called after changing any variable that could
845 * change the result of the wait condition.
846 *
847 * This is supposed to be called while holding the lock. The lock is
848 * dropped before going to sleep and is reacquired afterwards.
849 *
850 * The function returns 0 if the @timeout elapsed, -ERESTARTSYS if it
851 * was interrupted by a signal, and the remaining jiffies otherwise
852 * if the condition evaluated to true before the timeout elapsed.
853 */
854#define wait_event_interruptible_lock_irq_timeout(wq, condition, lock, \
855 timeout) \
856({ \
857 int __ret = timeout; \
858 \
859 if (!(condition)) \
860 __wait_event_interruptible_lock_irq_timeout( \
861 wq, condition, lock, __ret); \
862 __ret; \
863})
864
808 865
809/* 866/*
810 * These are the old interfaces to sleep waiting for an event. 867 * These are the old interfaces to sleep waiting for an event.