diff options
author | Jeff Layton <jlayton@redhat.com> | 2009-09-21 06:47:50 -0400 |
---|---|---|
committer | Steve French <sfrench@us.ibm.com> | 2009-09-24 14:33:18 -0400 |
commit | 3bc303c254335dbd7c7012cc1760b12f1d5514d3 (patch) | |
tree | 7da17fbfd697216d9ed0ccd64ea9c03aaf3d52c1 /fs/cifs/cifsfs.c | |
parent | 48541bd3dd4739b4d574b44ea47660c88d833677 (diff) |
cifs: convert oplock breaks to use slow_work facility (try #4)
This is the fourth respin of the patch to convert oplock breaks to
use the slow_work facility.
A customer of ours was testing a backport of one of the earlier
patchsets, and hit a "Busy inodes after umount..." problem. An oplock
break job had raced with a umount, and the superblock got torn down and
its memory reused. When the oplock break job tried to dereference the
inode->i_sb, the kernel oopsed.
This patchset has the oplock break job hold an inode and vfsmount
reference until the oplock break completes. With this, there should be
no need to take a tcon reference (the vfsmount implicitly holds one
already).
Currently, when an oplock break comes in there's a chance that the
oplock break job won't occur if the allocation of the oplock_q_entry
fails. There are also some rather nasty races in the allocation and
handling these structs.
Rather than allocating oplock queue entries when an oplock break comes
in, add a few extra fields to the cifsFileInfo struct. Get rid of the
dedicated cifs_oplock_thread as well and queue the oplock break job to
the slow_work thread pool.
This approach also has the advantage that the oplock break jobs can
potentially run in parallel rather than be serialized like they are
today.
Signed-off-by: Jeff Layton <jlayton@redhat.com>
Signed-off-by: Steve French <sfrench@us.ibm.com>
Diffstat (limited to 'fs/cifs/cifsfs.c')
-rw-r--r-- | fs/cifs/cifsfs.c | 95 |
1 files changed, 5 insertions, 90 deletions
diff --git a/fs/cifs/cifsfs.c b/fs/cifs/cifsfs.c index 3610e9958b4c..89142b39fec1 100644 --- a/fs/cifs/cifsfs.c +++ b/fs/cifs/cifsfs.c | |||
@@ -64,9 +64,6 @@ unsigned int multiuser_mount = 0; | |||
64 | unsigned int extended_security = CIFSSEC_DEF; | 64 | unsigned int extended_security = CIFSSEC_DEF; |
65 | /* unsigned int ntlmv2_support = 0; */ | 65 | /* unsigned int ntlmv2_support = 0; */ |
66 | unsigned int sign_CIFS_PDUs = 1; | 66 | unsigned int sign_CIFS_PDUs = 1; |
67 | extern struct task_struct *oplockThread; /* remove sparse warning */ | ||
68 | struct task_struct *oplockThread = NULL; | ||
69 | /* extern struct task_struct * dnotifyThread; remove sparse warning */ | ||
70 | static const struct super_operations cifs_super_ops; | 67 | static const struct super_operations cifs_super_ops; |
71 | unsigned int CIFSMaxBufSize = CIFS_MAX_MSGSIZE; | 68 | unsigned int CIFSMaxBufSize = CIFS_MAX_MSGSIZE; |
72 | module_param(CIFSMaxBufSize, int, 0); | 69 | module_param(CIFSMaxBufSize, int, 0); |
@@ -973,89 +970,12 @@ cifs_destroy_mids(void) | |||
973 | kmem_cache_destroy(cifs_oplock_cachep); | 970 | kmem_cache_destroy(cifs_oplock_cachep); |
974 | } | 971 | } |
975 | 972 | ||
976 | static int cifs_oplock_thread(void *dummyarg) | ||
977 | { | ||
978 | struct oplock_q_entry *oplock_item; | ||
979 | struct cifsTconInfo *pTcon; | ||
980 | struct inode *inode; | ||
981 | __u16 netfid; | ||
982 | int rc, waitrc = 0; | ||
983 | |||
984 | set_freezable(); | ||
985 | do { | ||
986 | if (try_to_freeze()) | ||
987 | continue; | ||
988 | |||
989 | spin_lock(&cifs_oplock_lock); | ||
990 | if (list_empty(&cifs_oplock_list)) { | ||
991 | spin_unlock(&cifs_oplock_lock); | ||
992 | set_current_state(TASK_INTERRUPTIBLE); | ||
993 | schedule_timeout(39*HZ); | ||
994 | } else { | ||
995 | oplock_item = list_entry(cifs_oplock_list.next, | ||
996 | struct oplock_q_entry, qhead); | ||
997 | cFYI(1, ("found oplock item to write out")); | ||
998 | pTcon = oplock_item->tcon; | ||
999 | inode = oplock_item->pinode; | ||
1000 | netfid = oplock_item->netfid; | ||
1001 | spin_unlock(&cifs_oplock_lock); | ||
1002 | DeleteOplockQEntry(oplock_item); | ||
1003 | /* can not grab inode sem here since it would | ||
1004 | deadlock when oplock received on delete | ||
1005 | since vfs_unlink holds the i_mutex across | ||
1006 | the call */ | ||
1007 | /* mutex_lock(&inode->i_mutex);*/ | ||
1008 | if (S_ISREG(inode->i_mode)) { | ||
1009 | #ifdef CONFIG_CIFS_EXPERIMENTAL | ||
1010 | if (CIFS_I(inode)->clientCanCacheAll == 0) | ||
1011 | break_lease(inode, FMODE_READ); | ||
1012 | else if (CIFS_I(inode)->clientCanCacheRead == 0) | ||
1013 | break_lease(inode, FMODE_WRITE); | ||
1014 | #endif | ||
1015 | rc = filemap_fdatawrite(inode->i_mapping); | ||
1016 | if (CIFS_I(inode)->clientCanCacheRead == 0) { | ||
1017 | waitrc = filemap_fdatawait( | ||
1018 | inode->i_mapping); | ||
1019 | invalidate_remote_inode(inode); | ||
1020 | } | ||
1021 | if (rc == 0) | ||
1022 | rc = waitrc; | ||
1023 | } else | ||
1024 | rc = 0; | ||
1025 | /* mutex_unlock(&inode->i_mutex);*/ | ||
1026 | if (rc) | ||
1027 | CIFS_I(inode)->write_behind_rc = rc; | ||
1028 | cFYI(1, ("Oplock flush inode %p rc %d", | ||
1029 | inode, rc)); | ||
1030 | |||
1031 | /* releasing stale oplock after recent reconnect | ||
1032 | of smb session using a now incorrect file | ||
1033 | handle is not a data integrity issue but do | ||
1034 | not bother sending an oplock release if session | ||
1035 | to server still is disconnected since oplock | ||
1036 | already released by the server in that case */ | ||
1037 | if (!pTcon->need_reconnect) { | ||
1038 | rc = CIFSSMBLock(0, pTcon, netfid, | ||
1039 | 0 /* len */ , 0 /* offset */, 0, | ||
1040 | 0, LOCKING_ANDX_OPLOCK_RELEASE, | ||
1041 | false /* wait flag */); | ||
1042 | cFYI(1, ("Oplock release rc = %d", rc)); | ||
1043 | } | ||
1044 | set_current_state(TASK_INTERRUPTIBLE); | ||
1045 | schedule_timeout(1); /* yield in case q were corrupt */ | ||
1046 | } | ||
1047 | } while (!kthread_should_stop()); | ||
1048 | |||
1049 | return 0; | ||
1050 | } | ||
1051 | |||
1052 | static int __init | 973 | static int __init |
1053 | init_cifs(void) | 974 | init_cifs(void) |
1054 | { | 975 | { |
1055 | int rc = 0; | 976 | int rc = 0; |
1056 | cifs_proc_init(); | 977 | cifs_proc_init(); |
1057 | INIT_LIST_HEAD(&cifs_tcp_ses_list); | 978 | INIT_LIST_HEAD(&cifs_tcp_ses_list); |
1058 | INIT_LIST_HEAD(&cifs_oplock_list); | ||
1059 | #ifdef CONFIG_CIFS_EXPERIMENTAL | 979 | #ifdef CONFIG_CIFS_EXPERIMENTAL |
1060 | INIT_LIST_HEAD(&GlobalDnotifyReqList); | 980 | INIT_LIST_HEAD(&GlobalDnotifyReqList); |
1061 | INIT_LIST_HEAD(&GlobalDnotifyRsp_Q); | 981 | INIT_LIST_HEAD(&GlobalDnotifyRsp_Q); |
@@ -1084,7 +1004,6 @@ init_cifs(void) | |||
1084 | rwlock_init(&GlobalSMBSeslock); | 1004 | rwlock_init(&GlobalSMBSeslock); |
1085 | rwlock_init(&cifs_tcp_ses_lock); | 1005 | rwlock_init(&cifs_tcp_ses_lock); |
1086 | spin_lock_init(&GlobalMid_Lock); | 1006 | spin_lock_init(&GlobalMid_Lock); |
1087 | spin_lock_init(&cifs_oplock_lock); | ||
1088 | 1007 | ||
1089 | if (cifs_max_pending < 2) { | 1008 | if (cifs_max_pending < 2) { |
1090 | cifs_max_pending = 2; | 1009 | cifs_max_pending = 2; |
@@ -1119,18 +1038,15 @@ init_cifs(void) | |||
1119 | if (rc) | 1038 | if (rc) |
1120 | goto out_unregister_key_type; | 1039 | goto out_unregister_key_type; |
1121 | #endif | 1040 | #endif |
1122 | oplockThread = kthread_run(cifs_oplock_thread, NULL, "cifsoplockd"); | 1041 | rc = slow_work_register_user(); |
1123 | if (IS_ERR(oplockThread)) { | 1042 | if (rc) |
1124 | rc = PTR_ERR(oplockThread); | 1043 | goto out_unregister_resolver_key; |
1125 | cERROR(1, ("error %d create oplock thread", rc)); | ||
1126 | goto out_unregister_dfs_key_type; | ||
1127 | } | ||
1128 | 1044 | ||
1129 | return 0; | 1045 | return 0; |
1130 | 1046 | ||
1131 | out_unregister_dfs_key_type: | 1047 | out_unregister_resolver_key: |
1132 | #ifdef CONFIG_CIFS_DFS_UPCALL | ||
1133 | unregister_key_type(&key_type_dns_resolver); | 1048 | unregister_key_type(&key_type_dns_resolver); |
1049 | #ifdef CONFIG_CIFS_DFS_UPCALL | ||
1134 | out_unregister_key_type: | 1050 | out_unregister_key_type: |
1135 | #endif | 1051 | #endif |
1136 | #ifdef CONFIG_CIFS_UPCALL | 1052 | #ifdef CONFIG_CIFS_UPCALL |
@@ -1165,7 +1081,6 @@ exit_cifs(void) | |||
1165 | cifs_destroy_inodecache(); | 1081 | cifs_destroy_inodecache(); |
1166 | cifs_destroy_mids(); | 1082 | cifs_destroy_mids(); |
1167 | cifs_destroy_request_bufs(); | 1083 | cifs_destroy_request_bufs(); |
1168 | kthread_stop(oplockThread); | ||
1169 | } | 1084 | } |
1170 | 1085 | ||
1171 | MODULE_AUTHOR("Steve French <sfrench@us.ibm.com>"); | 1086 | MODULE_AUTHOR("Steve French <sfrench@us.ibm.com>"); |