diff options
author | Nick Piggin <npiggin@kernel.dk> | 2011-01-07 01:49:37 -0500 |
---|---|---|
committer | Nick Piggin <npiggin@kernel.dk> | 2011-01-07 01:50:22 -0500 |
commit | 949854d02455080d20cd3e1db28a3a18daf7599d (patch) | |
tree | 9b13a6f86c1d0b91e462a471e53b0e717036b18e | |
parent | 9abca36087288fe28de4749c71ca003d4b9e3ed0 (diff) |
fs: Use rename lock and RCU for multi-step operations
The remaining usages for dcache_lock is to allow atomic, multi-step read-side
operations over the directory tree by excluding modifications to the tree.
Also, to walk in the leaf->root direction in the tree where we don't have
a natural d_lock ordering.
This could be accomplished by taking every d_lock, but this would mean a
huge number of locks and actually gets very tricky.
Solve this instead by using the rename seqlock for multi-step read-side
operations, retry in case of a rename so we don't walk up the wrong parent.
Concurrent dentry insertions are not serialised against. Concurrent deletes
are tricky when walking up the directory: our parent might have been deleted
when dropping locks so also need to check and retry for that.
We can also use the rename lock in cases where livelock is a worry (and it
is introduced in subsequent patch).
Signed-off-by: Nick Piggin <npiggin@kernel.dk>
-rw-r--r-- | drivers/staging/pohmelfs/path_entry.c | 15 | ||||
-rw-r--r-- | fs/autofs4/waitq.c | 18 | ||||
-rw-r--r-- | fs/dcache.c | 134 | ||||
-rw-r--r-- | fs/nfs/namespace.c | 14 | ||||
-rw-r--r-- | include/linux/dcache.h | 1 |
5 files changed, 152 insertions, 30 deletions
diff --git a/drivers/staging/pohmelfs/path_entry.c b/drivers/staging/pohmelfs/path_entry.c index 8ec83d2dffb7..bbe42f42ca8f 100644 --- a/drivers/staging/pohmelfs/path_entry.c +++ b/drivers/staging/pohmelfs/path_entry.c | |||
@@ -83,10 +83,11 @@ out: | |||
83 | int pohmelfs_path_length(struct pohmelfs_inode *pi) | 83 | int pohmelfs_path_length(struct pohmelfs_inode *pi) |
84 | { | 84 | { |
85 | struct dentry *d, *root, *first; | 85 | struct dentry *d, *root, *first; |
86 | int len = 1; /* Root slash */ | 86 | int len; |
87 | unsigned seq; | ||
87 | 88 | ||
88 | first = d = d_find_alias(&pi->vfs_inode); | 89 | first = d_find_alias(&pi->vfs_inode); |
89 | if (!d) { | 90 | if (!first) { |
90 | dprintk("%s: ino: %llu, mode: %o.\n", __func__, pi->ino, pi->vfs_inode.i_mode); | 91 | dprintk("%s: ino: %llu, mode: %o.\n", __func__, pi->ino, pi->vfs_inode.i_mode); |
91 | return -ENOENT; | 92 | return -ENOENT; |
92 | } | 93 | } |
@@ -95,6 +96,11 @@ int pohmelfs_path_length(struct pohmelfs_inode *pi) | |||
95 | root = dget(current->fs->root.dentry); | 96 | root = dget(current->fs->root.dentry); |
96 | spin_unlock(¤t->fs->lock); | 97 | spin_unlock(¤t->fs->lock); |
97 | 98 | ||
99 | rename_retry: | ||
100 | len = 1; /* Root slash */ | ||
101 | d = first; | ||
102 | seq = read_seqbegin(&rename_lock); | ||
103 | rcu_read_lock(); | ||
98 | spin_lock(&dcache_lock); | 104 | spin_lock(&dcache_lock); |
99 | 105 | ||
100 | if (!IS_ROOT(d) && d_unhashed(d)) | 106 | if (!IS_ROOT(d) && d_unhashed(d)) |
@@ -105,6 +111,9 @@ int pohmelfs_path_length(struct pohmelfs_inode *pi) | |||
105 | d = d->d_parent; | 111 | d = d->d_parent; |
106 | } | 112 | } |
107 | spin_unlock(&dcache_lock); | 113 | spin_unlock(&dcache_lock); |
114 | rcu_read_unlock(); | ||
115 | if (read_seqretry(&rename_lock, seq)) | ||
116 | goto rename_retry; | ||
108 | 117 | ||
109 | dput(root); | 118 | dput(root); |
110 | dput(first); | 119 | dput(first); |
diff --git a/fs/autofs4/waitq.c b/fs/autofs4/waitq.c index 2341375386f8..4be8f778a418 100644 --- a/fs/autofs4/waitq.c +++ b/fs/autofs4/waitq.c | |||
@@ -186,16 +186,25 @@ static int autofs4_getpath(struct autofs_sb_info *sbi, | |||
186 | { | 186 | { |
187 | struct dentry *root = sbi->sb->s_root; | 187 | struct dentry *root = sbi->sb->s_root; |
188 | struct dentry *tmp; | 188 | struct dentry *tmp; |
189 | char *buf = *name; | 189 | char *buf; |
190 | char *p; | 190 | char *p; |
191 | int len = 0; | 191 | int len; |
192 | 192 | unsigned seq; | |
193 | |||
194 | rename_retry: | ||
195 | buf = *name; | ||
196 | len = 0; | ||
197 | seq = read_seqbegin(&rename_lock); | ||
198 | rcu_read_lock(); | ||
193 | spin_lock(&dcache_lock); | 199 | spin_lock(&dcache_lock); |
194 | for (tmp = dentry ; tmp != root ; tmp = tmp->d_parent) | 200 | for (tmp = dentry ; tmp != root ; tmp = tmp->d_parent) |
195 | len += tmp->d_name.len + 1; | 201 | len += tmp->d_name.len + 1; |
196 | 202 | ||
197 | if (!len || --len > NAME_MAX) { | 203 | if (!len || --len > NAME_MAX) { |
198 | spin_unlock(&dcache_lock); | 204 | spin_unlock(&dcache_lock); |
205 | rcu_read_unlock(); | ||
206 | if (read_seqretry(&rename_lock, seq)) | ||
207 | goto rename_retry; | ||
199 | return 0; | 208 | return 0; |
200 | } | 209 | } |
201 | 210 | ||
@@ -209,6 +218,9 @@ static int autofs4_getpath(struct autofs_sb_info *sbi, | |||
209 | strncpy(p, tmp->d_name.name, tmp->d_name.len); | 218 | strncpy(p, tmp->d_name.name, tmp->d_name.len); |
210 | } | 219 | } |
211 | spin_unlock(&dcache_lock); | 220 | spin_unlock(&dcache_lock); |
221 | rcu_read_unlock(); | ||
222 | if (read_seqretry(&rename_lock, seq)) | ||
223 | goto rename_retry; | ||
212 | 224 | ||
213 | return len; | 225 | return len; |
214 | } | 226 | } |
diff --git a/fs/dcache.c b/fs/dcache.c index a09f0771fd27..a9bc4ecc21e1 100644 --- a/fs/dcache.c +++ b/fs/dcache.c | |||
@@ -80,6 +80,7 @@ static __cacheline_aligned_in_smp DEFINE_SPINLOCK(dcache_lru_lock); | |||
80 | __cacheline_aligned_in_smp DEFINE_SPINLOCK(dcache_lock); | 80 | __cacheline_aligned_in_smp DEFINE_SPINLOCK(dcache_lock); |
81 | __cacheline_aligned_in_smp DEFINE_SEQLOCK(rename_lock); | 81 | __cacheline_aligned_in_smp DEFINE_SEQLOCK(rename_lock); |
82 | 82 | ||
83 | EXPORT_SYMBOL(rename_lock); | ||
83 | EXPORT_SYMBOL(dcache_inode_lock); | 84 | EXPORT_SYMBOL(dcache_inode_lock); |
84 | EXPORT_SYMBOL(dcache_lock); | 85 | EXPORT_SYMBOL(dcache_lock); |
85 | 86 | ||
@@ -243,6 +244,7 @@ static struct dentry *d_kill(struct dentry *dentry, struct dentry *parent) | |||
243 | __releases(dcache_inode_lock) | 244 | __releases(dcache_inode_lock) |
244 | __releases(dcache_lock) | 245 | __releases(dcache_lock) |
245 | { | 246 | { |
247 | dentry->d_parent = NULL; | ||
246 | list_del(&dentry->d_u.d_child); | 248 | list_del(&dentry->d_u.d_child); |
247 | if (parent) | 249 | if (parent) |
248 | spin_unlock(&parent->d_lock); | 250 | spin_unlock(&parent->d_lock); |
@@ -1017,11 +1019,15 @@ void shrink_dcache_for_umount(struct super_block *sb) | |||
1017 | * Return true if the parent or its subdirectories contain | 1019 | * Return true if the parent or its subdirectories contain |
1018 | * a mount point | 1020 | * a mount point |
1019 | */ | 1021 | */ |
1020 | |||
1021 | int have_submounts(struct dentry *parent) | 1022 | int have_submounts(struct dentry *parent) |
1022 | { | 1023 | { |
1023 | struct dentry *this_parent = parent; | 1024 | struct dentry *this_parent; |
1024 | struct list_head *next; | 1025 | struct list_head *next; |
1026 | unsigned seq; | ||
1027 | |||
1028 | rename_retry: | ||
1029 | this_parent = parent; | ||
1030 | seq = read_seqbegin(&rename_lock); | ||
1025 | 1031 | ||
1026 | spin_lock(&dcache_lock); | 1032 | spin_lock(&dcache_lock); |
1027 | if (d_mountpoint(parent)) | 1033 | if (d_mountpoint(parent)) |
@@ -1055,17 +1061,37 @@ resume: | |||
1055 | * All done at this level ... ascend and resume the search. | 1061 | * All done at this level ... ascend and resume the search. |
1056 | */ | 1062 | */ |
1057 | if (this_parent != parent) { | 1063 | if (this_parent != parent) { |
1058 | next = this_parent->d_u.d_child.next; | 1064 | struct dentry *tmp; |
1065 | struct dentry *child; | ||
1066 | |||
1067 | tmp = this_parent->d_parent; | ||
1068 | rcu_read_lock(); | ||
1059 | spin_unlock(&this_parent->d_lock); | 1069 | spin_unlock(&this_parent->d_lock); |
1060 | this_parent = this_parent->d_parent; | 1070 | child = this_parent; |
1071 | this_parent = tmp; | ||
1061 | spin_lock(&this_parent->d_lock); | 1072 | spin_lock(&this_parent->d_lock); |
1073 | /* might go back up the wrong parent if we have had a rename | ||
1074 | * or deletion */ | ||
1075 | if (this_parent != child->d_parent || | ||
1076 | read_seqretry(&rename_lock, seq)) { | ||
1077 | spin_unlock(&this_parent->d_lock); | ||
1078 | spin_unlock(&dcache_lock); | ||
1079 | rcu_read_unlock(); | ||
1080 | goto rename_retry; | ||
1081 | } | ||
1082 | rcu_read_unlock(); | ||
1083 | next = child->d_u.d_child.next; | ||
1062 | goto resume; | 1084 | goto resume; |
1063 | } | 1085 | } |
1064 | spin_unlock(&this_parent->d_lock); | 1086 | spin_unlock(&this_parent->d_lock); |
1065 | spin_unlock(&dcache_lock); | 1087 | spin_unlock(&dcache_lock); |
1088 | if (read_seqretry(&rename_lock, seq)) | ||
1089 | goto rename_retry; | ||
1066 | return 0; /* No mount points found in tree */ | 1090 | return 0; /* No mount points found in tree */ |
1067 | positive: | 1091 | positive: |
1068 | spin_unlock(&dcache_lock); | 1092 | spin_unlock(&dcache_lock); |
1093 | if (read_seqretry(&rename_lock, seq)) | ||
1094 | goto rename_retry; | ||
1069 | return 1; | 1095 | return 1; |
1070 | } | 1096 | } |
1071 | EXPORT_SYMBOL(have_submounts); | 1097 | EXPORT_SYMBOL(have_submounts); |
@@ -1086,10 +1112,15 @@ EXPORT_SYMBOL(have_submounts); | |||
1086 | */ | 1112 | */ |
1087 | static int select_parent(struct dentry * parent) | 1113 | static int select_parent(struct dentry * parent) |
1088 | { | 1114 | { |
1089 | struct dentry *this_parent = parent; | 1115 | struct dentry *this_parent; |
1090 | struct list_head *next; | 1116 | struct list_head *next; |
1117 | unsigned seq; | ||
1091 | int found = 0; | 1118 | int found = 0; |
1092 | 1119 | ||
1120 | rename_retry: | ||
1121 | this_parent = parent; | ||
1122 | seq = read_seqbegin(&rename_lock); | ||
1123 | |||
1093 | spin_lock(&dcache_lock); | 1124 | spin_lock(&dcache_lock); |
1094 | spin_lock(&this_parent->d_lock); | 1125 | spin_lock(&this_parent->d_lock); |
1095 | repeat: | 1126 | repeat: |
@@ -1099,7 +1130,6 @@ resume: | |||
1099 | struct list_head *tmp = next; | 1130 | struct list_head *tmp = next; |
1100 | struct dentry *dentry = list_entry(tmp, struct dentry, d_u.d_child); | 1131 | struct dentry *dentry = list_entry(tmp, struct dentry, d_u.d_child); |
1101 | next = tmp->next; | 1132 | next = tmp->next; |
1102 | BUG_ON(this_parent == dentry); | ||
1103 | 1133 | ||
1104 | spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED); | 1134 | spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED); |
1105 | 1135 | ||
@@ -1142,17 +1172,32 @@ resume: | |||
1142 | */ | 1172 | */ |
1143 | if (this_parent != parent) { | 1173 | if (this_parent != parent) { |
1144 | struct dentry *tmp; | 1174 | struct dentry *tmp; |
1145 | next = this_parent->d_u.d_child.next; | 1175 | struct dentry *child; |
1176 | |||
1146 | tmp = this_parent->d_parent; | 1177 | tmp = this_parent->d_parent; |
1178 | rcu_read_lock(); | ||
1147 | spin_unlock(&this_parent->d_lock); | 1179 | spin_unlock(&this_parent->d_lock); |
1148 | BUG_ON(tmp == this_parent); | 1180 | child = this_parent; |
1149 | this_parent = tmp; | 1181 | this_parent = tmp; |
1150 | spin_lock(&this_parent->d_lock); | 1182 | spin_lock(&this_parent->d_lock); |
1183 | /* might go back up the wrong parent if we have had a rename | ||
1184 | * or deletion */ | ||
1185 | if (this_parent != child->d_parent || | ||
1186 | read_seqretry(&rename_lock, seq)) { | ||
1187 | spin_unlock(&this_parent->d_lock); | ||
1188 | spin_unlock(&dcache_lock); | ||
1189 | rcu_read_unlock(); | ||
1190 | goto rename_retry; | ||
1191 | } | ||
1192 | rcu_read_unlock(); | ||
1193 | next = child->d_u.d_child.next; | ||
1151 | goto resume; | 1194 | goto resume; |
1152 | } | 1195 | } |
1153 | out: | 1196 | out: |
1154 | spin_unlock(&this_parent->d_lock); | 1197 | spin_unlock(&this_parent->d_lock); |
1155 | spin_unlock(&dcache_lock); | 1198 | spin_unlock(&dcache_lock); |
1199 | if (read_seqretry(&rename_lock, seq)) | ||
1200 | goto rename_retry; | ||
1156 | return found; | 1201 | return found; |
1157 | } | 1202 | } |
1158 | 1203 | ||
@@ -1654,7 +1699,7 @@ EXPORT_SYMBOL(d_add_ci); | |||
1654 | struct dentry * d_lookup(struct dentry * parent, struct qstr * name) | 1699 | struct dentry * d_lookup(struct dentry * parent, struct qstr * name) |
1655 | { | 1700 | { |
1656 | struct dentry * dentry = NULL; | 1701 | struct dentry * dentry = NULL; |
1657 | unsigned long seq; | 1702 | unsigned seq; |
1658 | 1703 | ||
1659 | do { | 1704 | do { |
1660 | seq = read_seqbegin(&rename_lock); | 1705 | seq = read_seqbegin(&rename_lock); |
@@ -2290,7 +2335,7 @@ static int prepend_name(char **buffer, int *buflen, struct qstr *name) | |||
2290 | * @buffer: pointer to the end of the buffer | 2335 | * @buffer: pointer to the end of the buffer |
2291 | * @buflen: pointer to buffer length | 2336 | * @buflen: pointer to buffer length |
2292 | * | 2337 | * |
2293 | * Caller holds the dcache_lock. | 2338 | * Caller holds the rename_lock. |
2294 | * | 2339 | * |
2295 | * If path is not reachable from the supplied root, then the value of | 2340 | * If path is not reachable from the supplied root, then the value of |
2296 | * root is changed (without modifying refcounts). | 2341 | * root is changed (without modifying refcounts). |
@@ -2377,7 +2422,9 @@ char *__d_path(const struct path *path, struct path *root, | |||
2377 | 2422 | ||
2378 | prepend(&res, &buflen, "\0", 1); | 2423 | prepend(&res, &buflen, "\0", 1); |
2379 | spin_lock(&dcache_lock); | 2424 | spin_lock(&dcache_lock); |
2425 | write_seqlock(&rename_lock); | ||
2380 | error = prepend_path(path, root, &res, &buflen); | 2426 | error = prepend_path(path, root, &res, &buflen); |
2427 | write_sequnlock(&rename_lock); | ||
2381 | spin_unlock(&dcache_lock); | 2428 | spin_unlock(&dcache_lock); |
2382 | 2429 | ||
2383 | if (error) | 2430 | if (error) |
@@ -2441,10 +2488,12 @@ char *d_path(const struct path *path, char *buf, int buflen) | |||
2441 | 2488 | ||
2442 | get_fs_root(current->fs, &root); | 2489 | get_fs_root(current->fs, &root); |
2443 | spin_lock(&dcache_lock); | 2490 | spin_lock(&dcache_lock); |
2491 | write_seqlock(&rename_lock); | ||
2444 | tmp = root; | 2492 | tmp = root; |
2445 | error = path_with_deleted(path, &tmp, &res, &buflen); | 2493 | error = path_with_deleted(path, &tmp, &res, &buflen); |
2446 | if (error) | 2494 | if (error) |
2447 | res = ERR_PTR(error); | 2495 | res = ERR_PTR(error); |
2496 | write_sequnlock(&rename_lock); | ||
2448 | spin_unlock(&dcache_lock); | 2497 | spin_unlock(&dcache_lock); |
2449 | path_put(&root); | 2498 | path_put(&root); |
2450 | return res; | 2499 | return res; |
@@ -2472,10 +2521,12 @@ char *d_path_with_unreachable(const struct path *path, char *buf, int buflen) | |||
2472 | 2521 | ||
2473 | get_fs_root(current->fs, &root); | 2522 | get_fs_root(current->fs, &root); |
2474 | spin_lock(&dcache_lock); | 2523 | spin_lock(&dcache_lock); |
2524 | write_seqlock(&rename_lock); | ||
2475 | tmp = root; | 2525 | tmp = root; |
2476 | error = path_with_deleted(path, &tmp, &res, &buflen); | 2526 | error = path_with_deleted(path, &tmp, &res, &buflen); |
2477 | if (!error && !path_equal(&tmp, &root)) | 2527 | if (!error && !path_equal(&tmp, &root)) |
2478 | error = prepend_unreachable(&res, &buflen); | 2528 | error = prepend_unreachable(&res, &buflen); |
2529 | write_sequnlock(&rename_lock); | ||
2479 | spin_unlock(&dcache_lock); | 2530 | spin_unlock(&dcache_lock); |
2480 | path_put(&root); | 2531 | path_put(&root); |
2481 | if (error) | 2532 | if (error) |
@@ -2544,7 +2595,9 @@ char *dentry_path_raw(struct dentry *dentry, char *buf, int buflen) | |||
2544 | char *retval; | 2595 | char *retval; |
2545 | 2596 | ||
2546 | spin_lock(&dcache_lock); | 2597 | spin_lock(&dcache_lock); |
2598 | write_seqlock(&rename_lock); | ||
2547 | retval = __dentry_path(dentry, buf, buflen); | 2599 | retval = __dentry_path(dentry, buf, buflen); |
2600 | write_sequnlock(&rename_lock); | ||
2548 | spin_unlock(&dcache_lock); | 2601 | spin_unlock(&dcache_lock); |
2549 | 2602 | ||
2550 | return retval; | 2603 | return retval; |
@@ -2557,6 +2610,7 @@ char *dentry_path(struct dentry *dentry, char *buf, int buflen) | |||
2557 | char *retval; | 2610 | char *retval; |
2558 | 2611 | ||
2559 | spin_lock(&dcache_lock); | 2612 | spin_lock(&dcache_lock); |
2613 | write_seqlock(&rename_lock); | ||
2560 | if (d_unlinked(dentry)) { | 2614 | if (d_unlinked(dentry)) { |
2561 | p = buf + buflen; | 2615 | p = buf + buflen; |
2562 | if (prepend(&p, &buflen, "//deleted", 10) != 0) | 2616 | if (prepend(&p, &buflen, "//deleted", 10) != 0) |
@@ -2564,6 +2618,7 @@ char *dentry_path(struct dentry *dentry, char *buf, int buflen) | |||
2564 | buflen++; | 2618 | buflen++; |
2565 | } | 2619 | } |
2566 | retval = __dentry_path(dentry, buf, buflen); | 2620 | retval = __dentry_path(dentry, buf, buflen); |
2621 | write_sequnlock(&rename_lock); | ||
2567 | spin_unlock(&dcache_lock); | 2622 | spin_unlock(&dcache_lock); |
2568 | if (!IS_ERR(retval) && p) | 2623 | if (!IS_ERR(retval) && p) |
2569 | *p = '/'; /* restore '/' overriden with '\0' */ | 2624 | *p = '/'; /* restore '/' overriden with '\0' */ |
@@ -2604,6 +2659,7 @@ SYSCALL_DEFINE2(getcwd, char __user *, buf, unsigned long, size) | |||
2604 | 2659 | ||
2605 | error = -ENOENT; | 2660 | error = -ENOENT; |
2606 | spin_lock(&dcache_lock); | 2661 | spin_lock(&dcache_lock); |
2662 | write_seqlock(&rename_lock); | ||
2607 | if (!d_unlinked(pwd.dentry)) { | 2663 | if (!d_unlinked(pwd.dentry)) { |
2608 | unsigned long len; | 2664 | unsigned long len; |
2609 | struct path tmp = root; | 2665 | struct path tmp = root; |
@@ -2612,6 +2668,7 @@ SYSCALL_DEFINE2(getcwd, char __user *, buf, unsigned long, size) | |||
2612 | 2668 | ||
2613 | prepend(&cwd, &buflen, "\0", 1); | 2669 | prepend(&cwd, &buflen, "\0", 1); |
2614 | error = prepend_path(&pwd, &tmp, &cwd, &buflen); | 2670 | error = prepend_path(&pwd, &tmp, &cwd, &buflen); |
2671 | write_sequnlock(&rename_lock); | ||
2615 | spin_unlock(&dcache_lock); | 2672 | spin_unlock(&dcache_lock); |
2616 | 2673 | ||
2617 | if (error) | 2674 | if (error) |
@@ -2631,8 +2688,10 @@ SYSCALL_DEFINE2(getcwd, char __user *, buf, unsigned long, size) | |||
2631 | if (copy_to_user(buf, cwd, len)) | 2688 | if (copy_to_user(buf, cwd, len)) |
2632 | error = -EFAULT; | 2689 | error = -EFAULT; |
2633 | } | 2690 | } |
2634 | } else | 2691 | } else { |
2692 | write_sequnlock(&rename_lock); | ||
2635 | spin_unlock(&dcache_lock); | 2693 | spin_unlock(&dcache_lock); |
2694 | } | ||
2636 | 2695 | ||
2637 | out: | 2696 | out: |
2638 | path_put(&pwd); | 2697 | path_put(&pwd); |
@@ -2660,25 +2719,25 @@ out: | |||
2660 | int is_subdir(struct dentry *new_dentry, struct dentry *old_dentry) | 2719 | int is_subdir(struct dentry *new_dentry, struct dentry *old_dentry) |
2661 | { | 2720 | { |
2662 | int result; | 2721 | int result; |
2663 | unsigned long seq; | 2722 | unsigned seq; |
2664 | 2723 | ||
2665 | if (new_dentry == old_dentry) | 2724 | if (new_dentry == old_dentry) |
2666 | return 1; | 2725 | return 1; |
2667 | 2726 | ||
2668 | /* | ||
2669 | * Need rcu_readlock to protect against the d_parent trashing | ||
2670 | * due to d_move | ||
2671 | */ | ||
2672 | rcu_read_lock(); | ||
2673 | do { | 2727 | do { |
2674 | /* for restarting inner loop in case of seq retry */ | 2728 | /* for restarting inner loop in case of seq retry */ |
2675 | seq = read_seqbegin(&rename_lock); | 2729 | seq = read_seqbegin(&rename_lock); |
2730 | /* | ||
2731 | * Need rcu_readlock to protect against the d_parent trashing | ||
2732 | * due to d_move | ||
2733 | */ | ||
2734 | rcu_read_lock(); | ||
2676 | if (d_ancestor(old_dentry, new_dentry)) | 2735 | if (d_ancestor(old_dentry, new_dentry)) |
2677 | result = 1; | 2736 | result = 1; |
2678 | else | 2737 | else |
2679 | result = 0; | 2738 | result = 0; |
2739 | rcu_read_unlock(); | ||
2680 | } while (read_seqretry(&rename_lock, seq)); | 2740 | } while (read_seqretry(&rename_lock, seq)); |
2681 | rcu_read_unlock(); | ||
2682 | 2741 | ||
2683 | return result; | 2742 | return result; |
2684 | } | 2743 | } |
@@ -2710,9 +2769,13 @@ EXPORT_SYMBOL(path_is_under); | |||
2710 | 2769 | ||
2711 | void d_genocide(struct dentry *root) | 2770 | void d_genocide(struct dentry *root) |
2712 | { | 2771 | { |
2713 | struct dentry *this_parent = root; | 2772 | struct dentry *this_parent; |
2714 | struct list_head *next; | 2773 | struct list_head *next; |
2774 | unsigned seq; | ||
2715 | 2775 | ||
2776 | rename_retry: | ||
2777 | this_parent = root; | ||
2778 | seq = read_seqbegin(&rename_lock); | ||
2716 | spin_lock(&dcache_lock); | 2779 | spin_lock(&dcache_lock); |
2717 | spin_lock(&this_parent->d_lock); | 2780 | spin_lock(&this_parent->d_lock); |
2718 | repeat: | 2781 | repeat: |
@@ -2722,6 +2785,7 @@ resume: | |||
2722 | struct list_head *tmp = next; | 2785 | struct list_head *tmp = next; |
2723 | struct dentry *dentry = list_entry(tmp, struct dentry, d_u.d_child); | 2786 | struct dentry *dentry = list_entry(tmp, struct dentry, d_u.d_child); |
2724 | next = tmp->next; | 2787 | next = tmp->next; |
2788 | |||
2725 | spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED); | 2789 | spin_lock_nested(&dentry->d_lock, DENTRY_D_LOCK_NESTED); |
2726 | if (d_unhashed(dentry) || !dentry->d_inode) { | 2790 | if (d_unhashed(dentry) || !dentry->d_inode) { |
2727 | spin_unlock(&dentry->d_lock); | 2791 | spin_unlock(&dentry->d_lock); |
@@ -2734,19 +2798,43 @@ resume: | |||
2734 | spin_acquire(&this_parent->d_lock.dep_map, 0, 1, _RET_IP_); | 2798 | spin_acquire(&this_parent->d_lock.dep_map, 0, 1, _RET_IP_); |
2735 | goto repeat; | 2799 | goto repeat; |
2736 | } | 2800 | } |
2737 | dentry->d_count--; | 2801 | if (!(dentry->d_flags & DCACHE_GENOCIDE)) { |
2802 | dentry->d_flags |= DCACHE_GENOCIDE; | ||
2803 | dentry->d_count--; | ||
2804 | } | ||
2738 | spin_unlock(&dentry->d_lock); | 2805 | spin_unlock(&dentry->d_lock); |
2739 | } | 2806 | } |
2740 | if (this_parent != root) { | 2807 | if (this_parent != root) { |
2741 | next = this_parent->d_u.d_child.next; | 2808 | struct dentry *tmp; |
2742 | this_parent->d_count--; | 2809 | struct dentry *child; |
2810 | |||
2811 | tmp = this_parent->d_parent; | ||
2812 | if (!(this_parent->d_flags & DCACHE_GENOCIDE)) { | ||
2813 | this_parent->d_flags |= DCACHE_GENOCIDE; | ||
2814 | this_parent->d_count--; | ||
2815 | } | ||
2816 | rcu_read_lock(); | ||
2743 | spin_unlock(&this_parent->d_lock); | 2817 | spin_unlock(&this_parent->d_lock); |
2744 | this_parent = this_parent->d_parent; | 2818 | child = this_parent; |
2819 | this_parent = tmp; | ||
2745 | spin_lock(&this_parent->d_lock); | 2820 | spin_lock(&this_parent->d_lock); |
2821 | /* might go back up the wrong parent if we have had a rename | ||
2822 | * or deletion */ | ||
2823 | if (this_parent != child->d_parent || | ||
2824 | read_seqretry(&rename_lock, seq)) { | ||
2825 | spin_unlock(&this_parent->d_lock); | ||
2826 | spin_unlock(&dcache_lock); | ||
2827 | rcu_read_unlock(); | ||
2828 | goto rename_retry; | ||
2829 | } | ||
2830 | rcu_read_unlock(); | ||
2831 | next = child->d_u.d_child.next; | ||
2746 | goto resume; | 2832 | goto resume; |
2747 | } | 2833 | } |
2748 | spin_unlock(&this_parent->d_lock); | 2834 | spin_unlock(&this_parent->d_lock); |
2749 | spin_unlock(&dcache_lock); | 2835 | spin_unlock(&dcache_lock); |
2836 | if (read_seqretry(&rename_lock, seq)) | ||
2837 | goto rename_retry; | ||
2750 | } | 2838 | } |
2751 | 2839 | ||
2752 | /** | 2840 | /** |
diff --git a/fs/nfs/namespace.c b/fs/nfs/namespace.c index db6aa3673cf3..78c0ebb0b07c 100644 --- a/fs/nfs/namespace.c +++ b/fs/nfs/namespace.c | |||
@@ -49,11 +49,17 @@ char *nfs_path(const char *base, | |||
49 | const struct dentry *dentry, | 49 | const struct dentry *dentry, |
50 | char *buffer, ssize_t buflen) | 50 | char *buffer, ssize_t buflen) |
51 | { | 51 | { |
52 | char *end = buffer+buflen; | 52 | char *end; |
53 | int namelen; | 53 | int namelen; |
54 | unsigned seq; | ||
54 | 55 | ||
56 | rename_retry: | ||
57 | end = buffer+buflen; | ||
55 | *--end = '\0'; | 58 | *--end = '\0'; |
56 | buflen--; | 59 | buflen--; |
60 | |||
61 | seq = read_seqbegin(&rename_lock); | ||
62 | rcu_read_lock(); | ||
57 | spin_lock(&dcache_lock); | 63 | spin_lock(&dcache_lock); |
58 | while (!IS_ROOT(dentry) && dentry != droot) { | 64 | while (!IS_ROOT(dentry) && dentry != droot) { |
59 | namelen = dentry->d_name.len; | 65 | namelen = dentry->d_name.len; |
@@ -66,6 +72,9 @@ char *nfs_path(const char *base, | |||
66 | dentry = dentry->d_parent; | 72 | dentry = dentry->d_parent; |
67 | } | 73 | } |
68 | spin_unlock(&dcache_lock); | 74 | spin_unlock(&dcache_lock); |
75 | rcu_read_unlock(); | ||
76 | if (read_seqretry(&rename_lock, seq)) | ||
77 | goto rename_retry; | ||
69 | if (*end != '/') { | 78 | if (*end != '/') { |
70 | if (--buflen < 0) | 79 | if (--buflen < 0) |
71 | goto Elong; | 80 | goto Elong; |
@@ -83,6 +92,9 @@ char *nfs_path(const char *base, | |||
83 | return end; | 92 | return end; |
84 | Elong_unlock: | 93 | Elong_unlock: |
85 | spin_unlock(&dcache_lock); | 94 | spin_unlock(&dcache_lock); |
95 | rcu_read_unlock(); | ||
96 | if (read_seqretry(&rename_lock, seq)) | ||
97 | goto rename_retry; | ||
86 | Elong: | 98 | Elong: |
87 | return ERR_PTR(-ENAMETOOLONG); | 99 | return ERR_PTR(-ENAMETOOLONG); |
88 | } | 100 | } |
diff --git a/include/linux/dcache.h b/include/linux/dcache.h index bda5ec0b077d..c963ebada922 100644 --- a/include/linux/dcache.h +++ b/include/linux/dcache.h | |||
@@ -180,6 +180,7 @@ struct dentry_operations { | |||
180 | #define DCACHE_FSNOTIFY_PARENT_WATCHED 0x0080 /* Parent inode is watched by some fsnotify listener */ | 180 | #define DCACHE_FSNOTIFY_PARENT_WATCHED 0x0080 /* Parent inode is watched by some fsnotify listener */ |
181 | 181 | ||
182 | #define DCACHE_CANT_MOUNT 0x0100 | 182 | #define DCACHE_CANT_MOUNT 0x0100 |
183 | #define DCACHE_GENOCIDE 0x0200 | ||
183 | 184 | ||
184 | extern spinlock_t dcache_inode_lock; | 185 | extern spinlock_t dcache_inode_lock; |
185 | extern spinlock_t dcache_lock; | 186 | extern spinlock_t dcache_lock; |