diff options
author | Tejun Heo <tj@kernel.org> | 2013-11-28 14:54:33 -0500 |
---|---|---|
committer | Greg Kroah-Hartman <gregkh@linuxfoundation.org> | 2013-11-29 21:08:39 -0500 |
commit | fd7b9f7b9776b11df629e9dd3865320bf57ce588 (patch) | |
tree | 06e3d55ac0179dce37b477ae6941058b00bedc3c /fs/kernfs | |
parent | ffed24e22845a3da0ae01095ae3f11c8d16e889d (diff) |
sysfs, kernfs: move dir core code to fs/kernfs/dir.c
Move core dir code to fs/kernfs/dir.c. fs/sysfs/dir.c now only
contains sysfs_warn_dup() and sysfs wrappers around kernfs interfaces.
The respective declarations in fs/sysfs/sysfs.h are moved to
fs/kernfs/kernfs-internal.h.
This is pure relocation.
v2: sysfs_symlink_target_lock was mistakenly relocated to kernfs. It
should remain with sysfs. Fixed.
Signed-off-by: Tejun Heo <tj@kernel.org>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Diffstat (limited to 'fs/kernfs')
-rw-r--r-- | fs/kernfs/dir.c | 988 | ||||
-rw-r--r-- | fs/kernfs/kernfs-internal.h | 17 |
2 files changed, 1005 insertions, 0 deletions
diff --git a/fs/kernfs/dir.c b/fs/kernfs/dir.c index 1061602ce81a..a4ca4de3cb21 100644 --- a/fs/kernfs/dir.c +++ b/fs/kernfs/dir.c | |||
@@ -7,3 +7,991 @@ | |||
7 | * | 7 | * |
8 | * This file is released under the GPLv2. | 8 | * This file is released under the GPLv2. |
9 | */ | 9 | */ |
10 | |||
11 | #include <linux/fs.h> | ||
12 | #include <linux/namei.h> | ||
13 | #include <linux/idr.h> | ||
14 | #include <linux/slab.h> | ||
15 | #include <linux/security.h> | ||
16 | #include <linux/hash.h> | ||
17 | |||
18 | #include "kernfs-internal.h" | ||
19 | |||
20 | DEFINE_MUTEX(sysfs_mutex); | ||
21 | |||
22 | #define to_sysfs_dirent(X) rb_entry((X), struct sysfs_dirent, s_rb) | ||
23 | |||
24 | static DEFINE_SPINLOCK(sysfs_ino_lock); | ||
25 | static DEFINE_IDA(sysfs_ino_ida); | ||
26 | |||
/**
 * sysfs_name_hash - hash a (namespace tag, name) pair
 * @name: Null terminated string to hash
 * @ns: Namespace tag to hash
 *
 * Returns 31 bit hash of ns + name (so it fits in an off_t ).  The values
 * 0, 1 and INT_MAX are reserved for magic directory entries and are never
 * returned.
 */
static unsigned int sysfs_name_hash(const char *name, const void *ns)
{
	unsigned long hash = init_name_hash();
	unsigned int len = strlen(name);

	while (len--)
		hash = partial_name_hash(*name++, hash);
	hash = (end_name_hash(hash) ^ hash_ptr((void *)ns, 31));
	hash &= 0x7fffffffU;

	/*
	 * Reserve hash numbers 0, 1 and INT_MAX for magic directory entries.
	 * Both 0 and 1 have to be moved out of the reserved range, hence the
	 * "< 2" test: sysfs_dir_pos() only searches for hashes that are
	 * strictly greater than 1.
	 */
	if (hash < 2)
		hash += 2;
	if (hash >= INT_MAX)
		hash = INT_MAX - 1;
	return hash;
}
49 | |||
50 | static int sysfs_name_compare(unsigned int hash, const char *name, | ||
51 | const void *ns, const struct sysfs_dirent *sd) | ||
52 | { | ||
53 | if (hash != sd->s_hash) | ||
54 | return hash - sd->s_hash; | ||
55 | if (ns != sd->s_ns) | ||
56 | return ns - sd->s_ns; | ||
57 | return strcmp(name, sd->s_name); | ||
58 | } | ||
59 | |||
60 | static int sysfs_sd_compare(const struct sysfs_dirent *left, | ||
61 | const struct sysfs_dirent *right) | ||
62 | { | ||
63 | return sysfs_name_compare(left->s_hash, left->s_name, left->s_ns, | ||
64 | right); | ||
65 | } | ||
66 | |||
67 | /** | ||
68 | * sysfs_link_sibling - link sysfs_dirent into sibling rbtree | ||
69 | * @sd: sysfs_dirent of interest | ||
70 | * | ||
71 | * Link @sd into its sibling rbtree which starts from | ||
72 | * sd->s_parent->s_dir.children. | ||
73 | * | ||
74 | * Locking: | ||
75 | * mutex_lock(sysfs_mutex) | ||
76 | * | ||
77 | * RETURNS: | ||
78 | * 0 on susccess -EEXIST on failure. | ||
79 | */ | ||
80 | static int sysfs_link_sibling(struct sysfs_dirent *sd) | ||
81 | { | ||
82 | struct rb_node **node = &sd->s_parent->s_dir.children.rb_node; | ||
83 | struct rb_node *parent = NULL; | ||
84 | |||
85 | if (sysfs_type(sd) == SYSFS_DIR) | ||
86 | sd->s_parent->s_dir.subdirs++; | ||
87 | |||
88 | while (*node) { | ||
89 | struct sysfs_dirent *pos; | ||
90 | int result; | ||
91 | |||
92 | pos = to_sysfs_dirent(*node); | ||
93 | parent = *node; | ||
94 | result = sysfs_sd_compare(sd, pos); | ||
95 | if (result < 0) | ||
96 | node = &pos->s_rb.rb_left; | ||
97 | else if (result > 0) | ||
98 | node = &pos->s_rb.rb_right; | ||
99 | else | ||
100 | return -EEXIST; | ||
101 | } | ||
102 | /* add new node and rebalance the tree */ | ||
103 | rb_link_node(&sd->s_rb, parent, node); | ||
104 | rb_insert_color(&sd->s_rb, &sd->s_parent->s_dir.children); | ||
105 | return 0; | ||
106 | } | ||
107 | |||
108 | /** | ||
109 | * sysfs_unlink_sibling - unlink sysfs_dirent from sibling rbtree | ||
110 | * @sd: sysfs_dirent of interest | ||
111 | * | ||
112 | * Unlink @sd from its sibling rbtree which starts from | ||
113 | * sd->s_parent->s_dir.children. | ||
114 | * | ||
115 | * Locking: | ||
116 | * mutex_lock(sysfs_mutex) | ||
117 | */ | ||
118 | static void sysfs_unlink_sibling(struct sysfs_dirent *sd) | ||
119 | { | ||
120 | if (sysfs_type(sd) == SYSFS_DIR) | ||
121 | sd->s_parent->s_dir.subdirs--; | ||
122 | |||
123 | rb_erase(&sd->s_rb, &sd->s_parent->s_dir.children); | ||
124 | } | ||
125 | |||
126 | /** | ||
127 | * sysfs_get_active - get an active reference to sysfs_dirent | ||
128 | * @sd: sysfs_dirent to get an active reference to | ||
129 | * | ||
130 | * Get an active reference of @sd. This function is noop if @sd | ||
131 | * is NULL. | ||
132 | * | ||
133 | * RETURNS: | ||
134 | * Pointer to @sd on success, NULL on failure. | ||
135 | */ | ||
136 | struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd) | ||
137 | { | ||
138 | if (unlikely(!sd)) | ||
139 | return NULL; | ||
140 | |||
141 | if (!atomic_inc_unless_negative(&sd->s_active)) | ||
142 | return NULL; | ||
143 | |||
144 | if (sd->s_flags & SYSFS_FLAG_LOCKDEP) | ||
145 | rwsem_acquire_read(&sd->dep_map, 0, 1, _RET_IP_); | ||
146 | return sd; | ||
147 | } | ||
148 | |||
149 | /** | ||
150 | * sysfs_put_active - put an active reference to sysfs_dirent | ||
151 | * @sd: sysfs_dirent to put an active reference to | ||
152 | * | ||
153 | * Put an active reference to @sd. This function is noop if @sd | ||
154 | * is NULL. | ||
155 | */ | ||
156 | void sysfs_put_active(struct sysfs_dirent *sd) | ||
157 | { | ||
158 | int v; | ||
159 | |||
160 | if (unlikely(!sd)) | ||
161 | return; | ||
162 | |||
163 | if (sd->s_flags & SYSFS_FLAG_LOCKDEP) | ||
164 | rwsem_release(&sd->dep_map, 1, _RET_IP_); | ||
165 | v = atomic_dec_return(&sd->s_active); | ||
166 | if (likely(v != SD_DEACTIVATED_BIAS)) | ||
167 | return; | ||
168 | |||
169 | /* atomic_dec_return() is a mb(), we'll always see the updated | ||
170 | * sd->u.completion. | ||
171 | */ | ||
172 | complete(sd->u.completion); | ||
173 | } | ||
174 | |||
175 | /** | ||
176 | * sysfs_deactivate - deactivate sysfs_dirent | ||
177 | * @sd: sysfs_dirent to deactivate | ||
178 | * | ||
179 | * Deny new active references and drain existing ones. | ||
180 | */ | ||
181 | static void sysfs_deactivate(struct sysfs_dirent *sd) | ||
182 | { | ||
183 | DECLARE_COMPLETION_ONSTACK(wait); | ||
184 | int v; | ||
185 | |||
186 | BUG_ON(!(sd->s_flags & SYSFS_FLAG_REMOVED)); | ||
187 | |||
188 | if (!(sysfs_type(sd) & SYSFS_ACTIVE_REF)) | ||
189 | return; | ||
190 | |||
191 | sd->u.completion = (void *)&wait; | ||
192 | |||
193 | rwsem_acquire(&sd->dep_map, 0, 0, _RET_IP_); | ||
194 | /* atomic_add_return() is a mb(), put_active() will always see | ||
195 | * the updated sd->u.completion. | ||
196 | */ | ||
197 | v = atomic_add_return(SD_DEACTIVATED_BIAS, &sd->s_active); | ||
198 | |||
199 | if (v != SD_DEACTIVATED_BIAS) { | ||
200 | lock_contended(&sd->dep_map, _RET_IP_); | ||
201 | wait_for_completion(&wait); | ||
202 | } | ||
203 | |||
204 | lock_acquired(&sd->dep_map, _RET_IP_); | ||
205 | rwsem_release(&sd->dep_map, 1, _RET_IP_); | ||
206 | } | ||
207 | |||
208 | static int sysfs_alloc_ino(unsigned int *pino) | ||
209 | { | ||
210 | int ino, rc; | ||
211 | |||
212 | retry: | ||
213 | spin_lock(&sysfs_ino_lock); | ||
214 | rc = ida_get_new_above(&sysfs_ino_ida, 2, &ino); | ||
215 | spin_unlock(&sysfs_ino_lock); | ||
216 | |||
217 | if (rc == -EAGAIN) { | ||
218 | if (ida_pre_get(&sysfs_ino_ida, GFP_KERNEL)) | ||
219 | goto retry; | ||
220 | rc = -ENOMEM; | ||
221 | } | ||
222 | |||
223 | *pino = ino; | ||
224 | return rc; | ||
225 | } | ||
226 | |||
227 | static void sysfs_free_ino(unsigned int ino) | ||
228 | { | ||
229 | spin_lock(&sysfs_ino_lock); | ||
230 | ida_remove(&sysfs_ino_ida, ino); | ||
231 | spin_unlock(&sysfs_ino_lock); | ||
232 | } | ||
233 | |||
234 | /** | ||
235 | * kernfs_get - get a reference count on a sysfs_dirent | ||
236 | * @sd: the target sysfs_dirent | ||
237 | */ | ||
238 | void kernfs_get(struct sysfs_dirent *sd) | ||
239 | { | ||
240 | if (sd) { | ||
241 | WARN_ON(!atomic_read(&sd->s_count)); | ||
242 | atomic_inc(&sd->s_count); | ||
243 | } | ||
244 | } | ||
245 | EXPORT_SYMBOL_GPL(kernfs_get); | ||
246 | |||
247 | /** | ||
248 | * kernfs_put - put a reference count on a sysfs_dirent | ||
249 | * @sd: the target sysfs_dirent | ||
250 | * | ||
251 | * Put a reference count of @sd and destroy it if it reached zero. | ||
252 | */ | ||
253 | void kernfs_put(struct sysfs_dirent *sd) | ||
254 | { | ||
255 | struct sysfs_dirent *parent_sd; | ||
256 | |||
257 | if (!sd || !atomic_dec_and_test(&sd->s_count)) | ||
258 | return; | ||
259 | repeat: | ||
260 | /* Moving/renaming is always done while holding reference. | ||
261 | * sd->s_parent won't change beneath us. | ||
262 | */ | ||
263 | parent_sd = sd->s_parent; | ||
264 | |||
265 | WARN(!(sd->s_flags & SYSFS_FLAG_REMOVED), | ||
266 | "sysfs: free using entry: %s/%s\n", | ||
267 | parent_sd ? parent_sd->s_name : "", sd->s_name); | ||
268 | |||
269 | if (sysfs_type(sd) == SYSFS_KOBJ_LINK) | ||
270 | kernfs_put(sd->s_symlink.target_sd); | ||
271 | if (sysfs_type(sd) & SYSFS_COPY_NAME) | ||
272 | kfree(sd->s_name); | ||
273 | if (sd->s_iattr && sd->s_iattr->ia_secdata) | ||
274 | security_release_secctx(sd->s_iattr->ia_secdata, | ||
275 | sd->s_iattr->ia_secdata_len); | ||
276 | kfree(sd->s_iattr); | ||
277 | sysfs_free_ino(sd->s_ino); | ||
278 | kmem_cache_free(sysfs_dir_cachep, sd); | ||
279 | |||
280 | sd = parent_sd; | ||
281 | if (sd && atomic_dec_and_test(&sd->s_count)) | ||
282 | goto repeat; | ||
283 | } | ||
284 | EXPORT_SYMBOL_GPL(kernfs_put); | ||
285 | |||
286 | static int sysfs_dentry_delete(const struct dentry *dentry) | ||
287 | { | ||
288 | struct sysfs_dirent *sd = dentry->d_fsdata; | ||
289 | return !(sd && !(sd->s_flags & SYSFS_FLAG_REMOVED)); | ||
290 | } | ||
291 | |||
292 | static int sysfs_dentry_revalidate(struct dentry *dentry, unsigned int flags) | ||
293 | { | ||
294 | struct sysfs_dirent *sd; | ||
295 | |||
296 | if (flags & LOOKUP_RCU) | ||
297 | return -ECHILD; | ||
298 | |||
299 | sd = dentry->d_fsdata; | ||
300 | mutex_lock(&sysfs_mutex); | ||
301 | |||
302 | /* The sysfs dirent has been deleted */ | ||
303 | if (sd->s_flags & SYSFS_FLAG_REMOVED) | ||
304 | goto out_bad; | ||
305 | |||
306 | /* The sysfs dirent has been moved? */ | ||
307 | if (dentry->d_parent->d_fsdata != sd->s_parent) | ||
308 | goto out_bad; | ||
309 | |||
310 | /* The sysfs dirent has been renamed */ | ||
311 | if (strcmp(dentry->d_name.name, sd->s_name) != 0) | ||
312 | goto out_bad; | ||
313 | |||
314 | /* The sysfs dirent has been moved to a different namespace */ | ||
315 | if (sd->s_parent && (sd->s_parent->s_flags & SYSFS_FLAG_NS) && | ||
316 | sysfs_info(dentry->d_sb)->ns != sd->s_ns) | ||
317 | goto out_bad; | ||
318 | |||
319 | mutex_unlock(&sysfs_mutex); | ||
320 | out_valid: | ||
321 | return 1; | ||
322 | out_bad: | ||
323 | /* Remove the dentry from the dcache hashes. | ||
324 | * If this is a deleted dentry we use d_drop instead of d_delete | ||
325 | * so sysfs doesn't need to cope with negative dentries. | ||
326 | * | ||
327 | * If this is a dentry that has simply been renamed we | ||
328 | * use d_drop to remove it from the dcache lookup on its | ||
329 | * old parent. If this dentry persists later when a lookup | ||
330 | * is performed at its new name the dentry will be readded | ||
331 | * to the dcache hashes. | ||
332 | */ | ||
333 | mutex_unlock(&sysfs_mutex); | ||
334 | |||
335 | /* If we have submounts we must allow the vfs caches | ||
336 | * to lie about the state of the filesystem to prevent | ||
337 | * leaks and other nasty things. | ||
338 | */ | ||
339 | if (check_submounts_and_drop(dentry) != 0) | ||
340 | goto out_valid; | ||
341 | |||
342 | return 0; | ||
343 | } | ||
344 | |||
345 | static void sysfs_dentry_release(struct dentry *dentry) | ||
346 | { | ||
347 | kernfs_put(dentry->d_fsdata); | ||
348 | } | ||
349 | |||
350 | const struct dentry_operations sysfs_dentry_ops = { | ||
351 | .d_revalidate = sysfs_dentry_revalidate, | ||
352 | .d_delete = sysfs_dentry_delete, | ||
353 | .d_release = sysfs_dentry_release, | ||
354 | }; | ||
355 | |||
356 | struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type) | ||
357 | { | ||
358 | char *dup_name = NULL; | ||
359 | struct sysfs_dirent *sd; | ||
360 | |||
361 | if (type & SYSFS_COPY_NAME) { | ||
362 | name = dup_name = kstrdup(name, GFP_KERNEL); | ||
363 | if (!name) | ||
364 | return NULL; | ||
365 | } | ||
366 | |||
367 | sd = kmem_cache_zalloc(sysfs_dir_cachep, GFP_KERNEL); | ||
368 | if (!sd) | ||
369 | goto err_out1; | ||
370 | |||
371 | if (sysfs_alloc_ino(&sd->s_ino)) | ||
372 | goto err_out2; | ||
373 | |||
374 | atomic_set(&sd->s_count, 1); | ||
375 | atomic_set(&sd->s_active, 0); | ||
376 | |||
377 | sd->s_name = name; | ||
378 | sd->s_mode = mode; | ||
379 | sd->s_flags = type | SYSFS_FLAG_REMOVED; | ||
380 | |||
381 | return sd; | ||
382 | |||
383 | err_out2: | ||
384 | kmem_cache_free(sysfs_dir_cachep, sd); | ||
385 | err_out1: | ||
386 | kfree(dup_name); | ||
387 | return NULL; | ||
388 | } | ||
389 | |||
390 | /** | ||
391 | * sysfs_addrm_start - prepare for sysfs_dirent add/remove | ||
392 | * @acxt: pointer to sysfs_addrm_cxt to be used | ||
393 | * | ||
394 | * This function is called when the caller is about to add or remove | ||
395 | * sysfs_dirent. This function acquires sysfs_mutex. @acxt is used | ||
396 | * to keep and pass context to other addrm functions. | ||
397 | * | ||
398 | * LOCKING: | ||
399 | * Kernel thread context (may sleep). sysfs_mutex is locked on | ||
400 | * return. | ||
401 | */ | ||
402 | void sysfs_addrm_start(struct sysfs_addrm_cxt *acxt) | ||
403 | __acquires(sysfs_mutex) | ||
404 | { | ||
405 | memset(acxt, 0, sizeof(*acxt)); | ||
406 | |||
407 | mutex_lock(&sysfs_mutex); | ||
408 | } | ||
409 | |||
410 | /** | ||
411 | * sysfs_add_one - add sysfs_dirent to parent without warning | ||
412 | * @acxt: addrm context to use | ||
413 | * @sd: sysfs_dirent to be added | ||
414 | * @parent_sd: the parent sysfs_dirent to add @sd to | ||
415 | * | ||
416 | * Get @parent_sd and set @sd->s_parent to it and increment nlink of | ||
417 | * the parent inode if @sd is a directory and link into the children | ||
418 | * list of the parent. | ||
419 | * | ||
420 | * This function should be called between calls to | ||
421 | * sysfs_addrm_start() and sysfs_addrm_finish() and should be | ||
422 | * passed the same @acxt as passed to sysfs_addrm_start(). | ||
423 | * | ||
424 | * LOCKING: | ||
425 | * Determined by sysfs_addrm_start(). | ||
426 | * | ||
427 | * RETURNS: | ||
428 | * 0 on success, -EEXIST if entry with the given name already | ||
429 | * exists. | ||
430 | */ | ||
431 | int sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, | ||
432 | struct sysfs_dirent *parent_sd) | ||
433 | { | ||
434 | bool has_ns = parent_sd->s_flags & SYSFS_FLAG_NS; | ||
435 | struct sysfs_inode_attrs *ps_iattr; | ||
436 | int ret; | ||
437 | |||
438 | if (has_ns != (bool)sd->s_ns) { | ||
439 | WARN(1, KERN_WARNING "sysfs: ns %s in '%s' for '%s'\n", | ||
440 | has_ns ? "required" : "invalid", | ||
441 | parent_sd->s_name, sd->s_name); | ||
442 | return -EINVAL; | ||
443 | } | ||
444 | |||
445 | if (sysfs_type(parent_sd) != SYSFS_DIR) | ||
446 | return -EINVAL; | ||
447 | |||
448 | sd->s_hash = sysfs_name_hash(sd->s_name, sd->s_ns); | ||
449 | sd->s_parent = parent_sd; | ||
450 | kernfs_get(parent_sd); | ||
451 | |||
452 | ret = sysfs_link_sibling(sd); | ||
453 | if (ret) | ||
454 | return ret; | ||
455 | |||
456 | /* Update timestamps on the parent */ | ||
457 | ps_iattr = parent_sd->s_iattr; | ||
458 | if (ps_iattr) { | ||
459 | struct iattr *ps_iattrs = &ps_iattr->ia_iattr; | ||
460 | ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME; | ||
461 | } | ||
462 | |||
463 | /* Mark the entry added into directory tree */ | ||
464 | sd->s_flags &= ~SYSFS_FLAG_REMOVED; | ||
465 | |||
466 | return 0; | ||
467 | } | ||
468 | |||
469 | /** | ||
470 | * sysfs_remove_one - remove sysfs_dirent from parent | ||
471 | * @acxt: addrm context to use | ||
472 | * @sd: sysfs_dirent to be removed | ||
473 | * | ||
474 | * Mark @sd removed and drop nlink of parent inode if @sd is a | ||
475 | * directory. @sd is unlinked from the children list. | ||
476 | * | ||
477 | * This function should be called between calls to | ||
478 | * sysfs_addrm_start() and sysfs_addrm_finish() and should be | ||
479 | * passed the same @acxt as passed to sysfs_addrm_start(). | ||
480 | * | ||
481 | * LOCKING: | ||
482 | * Determined by sysfs_addrm_start(). | ||
483 | */ | ||
484 | static void sysfs_remove_one(struct sysfs_addrm_cxt *acxt, | ||
485 | struct sysfs_dirent *sd) | ||
486 | { | ||
487 | struct sysfs_inode_attrs *ps_iattr; | ||
488 | |||
489 | /* | ||
490 | * Removal can be called multiple times on the same node. Only the | ||
491 | * first invocation is effective and puts the base ref. | ||
492 | */ | ||
493 | if (sd->s_flags & SYSFS_FLAG_REMOVED) | ||
494 | return; | ||
495 | |||
496 | sysfs_unlink_sibling(sd); | ||
497 | |||
498 | /* Update timestamps on the parent */ | ||
499 | ps_iattr = sd->s_parent->s_iattr; | ||
500 | if (ps_iattr) { | ||
501 | struct iattr *ps_iattrs = &ps_iattr->ia_iattr; | ||
502 | ps_iattrs->ia_ctime = ps_iattrs->ia_mtime = CURRENT_TIME; | ||
503 | } | ||
504 | |||
505 | sd->s_flags |= SYSFS_FLAG_REMOVED; | ||
506 | sd->u.removed_list = acxt->removed; | ||
507 | acxt->removed = sd; | ||
508 | } | ||
509 | |||
510 | /** | ||
511 | * sysfs_addrm_finish - finish up sysfs_dirent add/remove | ||
512 | * @acxt: addrm context to finish up | ||
513 | * | ||
514 | * Finish up sysfs_dirent add/remove. Resources acquired by | ||
515 | * sysfs_addrm_start() are released and removed sysfs_dirents are | ||
516 | * cleaned up. | ||
517 | * | ||
518 | * LOCKING: | ||
519 | * sysfs_mutex is released. | ||
520 | */ | ||
521 | void sysfs_addrm_finish(struct sysfs_addrm_cxt *acxt) | ||
522 | __releases(sysfs_mutex) | ||
523 | { | ||
524 | /* release resources acquired by sysfs_addrm_start() */ | ||
525 | mutex_unlock(&sysfs_mutex); | ||
526 | |||
527 | /* kill removed sysfs_dirents */ | ||
528 | while (acxt->removed) { | ||
529 | struct sysfs_dirent *sd = acxt->removed; | ||
530 | |||
531 | acxt->removed = sd->u.removed_list; | ||
532 | |||
533 | sysfs_deactivate(sd); | ||
534 | sysfs_unmap_bin_file(sd); | ||
535 | kernfs_put(sd); | ||
536 | } | ||
537 | } | ||
538 | |||
539 | /** | ||
540 | * kernfs_find_ns - find sysfs_dirent with the given name | ||
541 | * @parent: sysfs_dirent to search under | ||
542 | * @name: name to look for | ||
543 | * @ns: the namespace tag to use | ||
544 | * | ||
545 | * Look for sysfs_dirent with name @name under @parent. Returns pointer to | ||
546 | * the found sysfs_dirent on success, %NULL on failure. | ||
547 | */ | ||
548 | static struct sysfs_dirent *kernfs_find_ns(struct sysfs_dirent *parent, | ||
549 | const unsigned char *name, | ||
550 | const void *ns) | ||
551 | { | ||
552 | struct rb_node *node = parent->s_dir.children.rb_node; | ||
553 | bool has_ns = parent->s_flags & SYSFS_FLAG_NS; | ||
554 | unsigned int hash; | ||
555 | |||
556 | lockdep_assert_held(&sysfs_mutex); | ||
557 | |||
558 | if (has_ns != (bool)ns) { | ||
559 | WARN(1, KERN_WARNING "sysfs: ns %s in '%s' for '%s'\n", | ||
560 | has_ns ? "required" : "invalid", | ||
561 | parent->s_name, name); | ||
562 | return NULL; | ||
563 | } | ||
564 | |||
565 | hash = sysfs_name_hash(name, ns); | ||
566 | while (node) { | ||
567 | struct sysfs_dirent *sd; | ||
568 | int result; | ||
569 | |||
570 | sd = to_sysfs_dirent(node); | ||
571 | result = sysfs_name_compare(hash, name, ns, sd); | ||
572 | if (result < 0) | ||
573 | node = node->rb_left; | ||
574 | else if (result > 0) | ||
575 | node = node->rb_right; | ||
576 | else | ||
577 | return sd; | ||
578 | } | ||
579 | return NULL; | ||
580 | } | ||
581 | |||
582 | /** | ||
583 | * kernfs_find_and_get_ns - find and get sysfs_dirent with the given name | ||
584 | * @parent: sysfs_dirent to search under | ||
585 | * @name: name to look for | ||
586 | * @ns: the namespace tag to use | ||
587 | * | ||
588 | * Look for sysfs_dirent with name @name under @parent and get a reference | ||
589 | * if found. This function may sleep and returns pointer to the found | ||
590 | * sysfs_dirent on success, %NULL on failure. | ||
591 | */ | ||
592 | struct sysfs_dirent *kernfs_find_and_get_ns(struct sysfs_dirent *parent, | ||
593 | const char *name, const void *ns) | ||
594 | { | ||
595 | struct sysfs_dirent *sd; | ||
596 | |||
597 | mutex_lock(&sysfs_mutex); | ||
598 | sd = kernfs_find_ns(parent, name, ns); | ||
599 | kernfs_get(sd); | ||
600 | mutex_unlock(&sysfs_mutex); | ||
601 | |||
602 | return sd; | ||
603 | } | ||
604 | EXPORT_SYMBOL_GPL(kernfs_find_and_get_ns); | ||
605 | |||
606 | /** | ||
607 | * kernfs_create_dir_ns - create a directory | ||
608 | * @parent: parent in which to create a new directory | ||
609 | * @name: name of the new directory | ||
610 | * @priv: opaque data associated with the new directory | ||
611 | * @ns: optional namespace tag of the directory | ||
612 | * | ||
613 | * Returns the created node on success, ERR_PTR() value on failure. | ||
614 | */ | ||
615 | struct sysfs_dirent *kernfs_create_dir_ns(struct sysfs_dirent *parent, | ||
616 | const char *name, void *priv, | ||
617 | const void *ns) | ||
618 | { | ||
619 | umode_t mode = S_IFDIR | S_IRWXU | S_IRUGO | S_IXUGO; | ||
620 | struct sysfs_addrm_cxt acxt; | ||
621 | struct sysfs_dirent *sd; | ||
622 | int rc; | ||
623 | |||
624 | /* allocate */ | ||
625 | sd = sysfs_new_dirent(name, mode, SYSFS_DIR); | ||
626 | if (!sd) | ||
627 | return ERR_PTR(-ENOMEM); | ||
628 | |||
629 | sd->s_ns = ns; | ||
630 | sd->priv = priv; | ||
631 | |||
632 | /* link in */ | ||
633 | sysfs_addrm_start(&acxt); | ||
634 | rc = sysfs_add_one(&acxt, sd, parent); | ||
635 | sysfs_addrm_finish(&acxt); | ||
636 | |||
637 | if (!rc) | ||
638 | return sd; | ||
639 | |||
640 | kernfs_put(sd); | ||
641 | return ERR_PTR(rc); | ||
642 | } | ||
643 | |||
644 | static struct dentry *sysfs_lookup(struct inode *dir, struct dentry *dentry, | ||
645 | unsigned int flags) | ||
646 | { | ||
647 | struct dentry *ret = NULL; | ||
648 | struct dentry *parent = dentry->d_parent; | ||
649 | struct sysfs_dirent *parent_sd = parent->d_fsdata; | ||
650 | struct sysfs_dirent *sd; | ||
651 | struct inode *inode; | ||
652 | const void *ns = NULL; | ||
653 | |||
654 | mutex_lock(&sysfs_mutex); | ||
655 | |||
656 | if (parent_sd->s_flags & SYSFS_FLAG_NS) | ||
657 | ns = sysfs_info(dir->i_sb)->ns; | ||
658 | |||
659 | sd = kernfs_find_ns(parent_sd, dentry->d_name.name, ns); | ||
660 | |||
661 | /* no such entry */ | ||
662 | if (!sd) { | ||
663 | ret = ERR_PTR(-ENOENT); | ||
664 | goto out_unlock; | ||
665 | } | ||
666 | kernfs_get(sd); | ||
667 | dentry->d_fsdata = sd; | ||
668 | |||
669 | /* attach dentry and inode */ | ||
670 | inode = sysfs_get_inode(dir->i_sb, sd); | ||
671 | if (!inode) { | ||
672 | ret = ERR_PTR(-ENOMEM); | ||
673 | goto out_unlock; | ||
674 | } | ||
675 | |||
676 | /* instantiate and hash dentry */ | ||
677 | ret = d_materialise_unique(dentry, inode); | ||
678 | out_unlock: | ||
679 | mutex_unlock(&sysfs_mutex); | ||
680 | return ret; | ||
681 | } | ||
682 | |||
683 | const struct inode_operations sysfs_dir_inode_operations = { | ||
684 | .lookup = sysfs_lookup, | ||
685 | .permission = sysfs_permission, | ||
686 | .setattr = sysfs_setattr, | ||
687 | .getattr = sysfs_getattr, | ||
688 | .setxattr = sysfs_setxattr, | ||
689 | }; | ||
690 | |||
691 | static struct sysfs_dirent *sysfs_leftmost_descendant(struct sysfs_dirent *pos) | ||
692 | { | ||
693 | struct sysfs_dirent *last; | ||
694 | |||
695 | while (true) { | ||
696 | struct rb_node *rbn; | ||
697 | |||
698 | last = pos; | ||
699 | |||
700 | if (sysfs_type(pos) != SYSFS_DIR) | ||
701 | break; | ||
702 | |||
703 | rbn = rb_first(&pos->s_dir.children); | ||
704 | if (!rbn) | ||
705 | break; | ||
706 | |||
707 | pos = to_sysfs_dirent(rbn); | ||
708 | } | ||
709 | |||
710 | return last; | ||
711 | } | ||
712 | |||
713 | /** | ||
714 | * sysfs_next_descendant_post - find the next descendant for post-order walk | ||
715 | * @pos: the current position (%NULL to initiate traversal) | ||
716 | * @root: sysfs_dirent whose descendants to walk | ||
717 | * | ||
718 | * Find the next descendant to visit for post-order traversal of @root's | ||
719 | * descendants. @root is included in the iteration and the last node to be | ||
720 | * visited. | ||
721 | */ | ||
722 | static struct sysfs_dirent *sysfs_next_descendant_post(struct sysfs_dirent *pos, | ||
723 | struct sysfs_dirent *root) | ||
724 | { | ||
725 | struct rb_node *rbn; | ||
726 | |||
727 | lockdep_assert_held(&sysfs_mutex); | ||
728 | |||
729 | /* if first iteration, visit leftmost descendant which may be root */ | ||
730 | if (!pos) | ||
731 | return sysfs_leftmost_descendant(root); | ||
732 | |||
733 | /* if we visited @root, we're done */ | ||
734 | if (pos == root) | ||
735 | return NULL; | ||
736 | |||
737 | /* if there's an unvisited sibling, visit its leftmost descendant */ | ||
738 | rbn = rb_next(&pos->s_rb); | ||
739 | if (rbn) | ||
740 | return sysfs_leftmost_descendant(to_sysfs_dirent(rbn)); | ||
741 | |||
742 | /* no sibling left, visit parent */ | ||
743 | return pos->s_parent; | ||
744 | } | ||
745 | |||
746 | static void __kernfs_remove(struct sysfs_addrm_cxt *acxt, | ||
747 | struct sysfs_dirent *sd) | ||
748 | { | ||
749 | struct sysfs_dirent *pos, *next; | ||
750 | |||
751 | if (!sd) | ||
752 | return; | ||
753 | |||
754 | pr_debug("sysfs %s: removing\n", sd->s_name); | ||
755 | |||
756 | next = NULL; | ||
757 | do { | ||
758 | pos = next; | ||
759 | next = sysfs_next_descendant_post(pos, sd); | ||
760 | if (pos) | ||
761 | sysfs_remove_one(acxt, pos); | ||
762 | } while (next); | ||
763 | } | ||
764 | |||
765 | /** | ||
766 | * kernfs_remove - remove a sysfs_dirent recursively | ||
767 | * @sd: the sysfs_dirent to remove | ||
768 | * | ||
769 | * Remove @sd along with all its subdirectories and files. | ||
770 | */ | ||
771 | void kernfs_remove(struct sysfs_dirent *sd) | ||
772 | { | ||
773 | struct sysfs_addrm_cxt acxt; | ||
774 | |||
775 | sysfs_addrm_start(&acxt); | ||
776 | __kernfs_remove(&acxt, sd); | ||
777 | sysfs_addrm_finish(&acxt); | ||
778 | } | ||
779 | |||
780 | /** | ||
781 | * kernfs_remove_by_name_ns - find a sysfs_dirent by name and remove it | ||
782 | * @dir_sd: parent of the target | ||
783 | * @name: name of the sysfs_dirent to remove | ||
784 | * @ns: namespace tag of the sysfs_dirent to remove | ||
785 | * | ||
786 | * Look for the sysfs_dirent with @name and @ns under @dir_sd and remove | ||
787 | * it. Returns 0 on success, -ENOENT if such entry doesn't exist. | ||
788 | */ | ||
789 | int kernfs_remove_by_name_ns(struct sysfs_dirent *dir_sd, const char *name, | ||
790 | const void *ns) | ||
791 | { | ||
792 | struct sysfs_addrm_cxt acxt; | ||
793 | struct sysfs_dirent *sd; | ||
794 | |||
795 | if (!dir_sd) { | ||
796 | WARN(1, KERN_WARNING "sysfs: can not remove '%s', no directory\n", | ||
797 | name); | ||
798 | return -ENOENT; | ||
799 | } | ||
800 | |||
801 | sysfs_addrm_start(&acxt); | ||
802 | |||
803 | sd = kernfs_find_ns(dir_sd, name, ns); | ||
804 | if (sd) | ||
805 | __kernfs_remove(&acxt, sd); | ||
806 | |||
807 | sysfs_addrm_finish(&acxt); | ||
808 | |||
809 | if (sd) | ||
810 | return 0; | ||
811 | else | ||
812 | return -ENOENT; | ||
813 | } | ||
814 | |||
815 | /** | ||
816 | * kernfs_rename_ns - move and rename a kernfs_node | ||
817 | * @sd: target node | ||
818 | * @new_parent: new parent to put @sd under | ||
819 | * @new_name: new name | ||
820 | * @new_ns: new namespace tag | ||
821 | */ | ||
822 | int kernfs_rename_ns(struct sysfs_dirent *sd, struct sysfs_dirent *new_parent, | ||
823 | const char *new_name, const void *new_ns) | ||
824 | { | ||
825 | int error; | ||
826 | |||
827 | mutex_lock(&sysfs_mutex); | ||
828 | |||
829 | error = 0; | ||
830 | if ((sd->s_parent == new_parent) && (sd->s_ns == new_ns) && | ||
831 | (strcmp(sd->s_name, new_name) == 0)) | ||
832 | goto out; /* nothing to rename */ | ||
833 | |||
834 | error = -EEXIST; | ||
835 | if (kernfs_find_ns(new_parent, new_name, new_ns)) | ||
836 | goto out; | ||
837 | |||
838 | /* rename sysfs_dirent */ | ||
839 | if (strcmp(sd->s_name, new_name) != 0) { | ||
840 | error = -ENOMEM; | ||
841 | new_name = kstrdup(new_name, GFP_KERNEL); | ||
842 | if (!new_name) | ||
843 | goto out; | ||
844 | |||
845 | kfree(sd->s_name); | ||
846 | sd->s_name = new_name; | ||
847 | } | ||
848 | |||
849 | /* | ||
850 | * Move to the appropriate place in the appropriate directories rbtree. | ||
851 | */ | ||
852 | sysfs_unlink_sibling(sd); | ||
853 | kernfs_get(new_parent); | ||
854 | kernfs_put(sd->s_parent); | ||
855 | sd->s_ns = new_ns; | ||
856 | sd->s_hash = sysfs_name_hash(sd->s_name, sd->s_ns); | ||
857 | sd->s_parent = new_parent; | ||
858 | sysfs_link_sibling(sd); | ||
859 | |||
860 | error = 0; | ||
861 | out: | ||
862 | mutex_unlock(&sysfs_mutex); | ||
863 | return error; | ||
864 | } | ||
865 | |||
866 | /** | ||
867 | * kernfs_enable_ns - enable namespace under a directory | ||
868 | * @sd: directory of interest, should be empty | ||
869 | * | ||
870 | * This is to be called right after @sd is created to enable namespace | ||
871 | * under it. All children of @sd must have non-NULL namespace tags and | ||
872 | * only the ones which match the super_block's tag will be visible. | ||
873 | */ | ||
874 | void kernfs_enable_ns(struct sysfs_dirent *sd) | ||
875 | { | ||
876 | WARN_ON_ONCE(sysfs_type(sd) != SYSFS_DIR); | ||
877 | WARN_ON_ONCE(!RB_EMPTY_ROOT(&sd->s_dir.children)); | ||
878 | sd->s_flags |= SYSFS_FLAG_NS; | ||
879 | } | ||
880 | |||
881 | /* Relationship between s_mode and the DT_xxx types */ | ||
882 | static inline unsigned char dt_type(struct sysfs_dirent *sd) | ||
883 | { | ||
884 | return (sd->s_mode >> 12) & 15; | ||
885 | } | ||
886 | |||
887 | static int sysfs_dir_release(struct inode *inode, struct file *filp) | ||
888 | { | ||
889 | kernfs_put(filp->private_data); | ||
890 | return 0; | ||
891 | } | ||
892 | |||
893 | static struct sysfs_dirent *sysfs_dir_pos(const void *ns, | ||
894 | struct sysfs_dirent *parent_sd, loff_t hash, struct sysfs_dirent *pos) | ||
895 | { | ||
896 | if (pos) { | ||
897 | int valid = !(pos->s_flags & SYSFS_FLAG_REMOVED) && | ||
898 | pos->s_parent == parent_sd && | ||
899 | hash == pos->s_hash; | ||
900 | kernfs_put(pos); | ||
901 | if (!valid) | ||
902 | pos = NULL; | ||
903 | } | ||
904 | if (!pos && (hash > 1) && (hash < INT_MAX)) { | ||
905 | struct rb_node *node = parent_sd->s_dir.children.rb_node; | ||
906 | while (node) { | ||
907 | pos = to_sysfs_dirent(node); | ||
908 | |||
909 | if (hash < pos->s_hash) | ||
910 | node = node->rb_left; | ||
911 | else if (hash > pos->s_hash) | ||
912 | node = node->rb_right; | ||
913 | else | ||
914 | break; | ||
915 | } | ||
916 | } | ||
917 | /* Skip over entries in the wrong namespace */ | ||
918 | while (pos && pos->s_ns != ns) { | ||
919 | struct rb_node *node = rb_next(&pos->s_rb); | ||
920 | if (!node) | ||
921 | pos = NULL; | ||
922 | else | ||
923 | pos = to_sysfs_dirent(node); | ||
924 | } | ||
925 | return pos; | ||
926 | } | ||
927 | |||
928 | static struct sysfs_dirent *sysfs_dir_next_pos(const void *ns, | ||
929 | struct sysfs_dirent *parent_sd, ino_t ino, struct sysfs_dirent *pos) | ||
930 | { | ||
931 | pos = sysfs_dir_pos(ns, parent_sd, ino, pos); | ||
932 | if (pos) | ||
933 | do { | ||
934 | struct rb_node *node = rb_next(&pos->s_rb); | ||
935 | if (!node) | ||
936 | pos = NULL; | ||
937 | else | ||
938 | pos = to_sysfs_dirent(node); | ||
939 | } while (pos && pos->s_ns != ns); | ||
940 | return pos; | ||
941 | } | ||
942 | |||
943 | static int sysfs_readdir(struct file *file, struct dir_context *ctx) | ||
944 | { | ||
945 | struct dentry *dentry = file->f_path.dentry; | ||
946 | struct sysfs_dirent *parent_sd = dentry->d_fsdata; | ||
947 | struct sysfs_dirent *pos = file->private_data; | ||
948 | const void *ns = NULL; | ||
949 | |||
950 | if (!dir_emit_dots(file, ctx)) | ||
951 | return 0; | ||
952 | mutex_lock(&sysfs_mutex); | ||
953 | |||
954 | if (parent_sd->s_flags & SYSFS_FLAG_NS) | ||
955 | ns = sysfs_info(dentry->d_sb)->ns; | ||
956 | |||
957 | for (pos = sysfs_dir_pos(ns, parent_sd, ctx->pos, pos); | ||
958 | pos; | ||
959 | pos = sysfs_dir_next_pos(ns, parent_sd, ctx->pos, pos)) { | ||
960 | const char *name = pos->s_name; | ||
961 | unsigned int type = dt_type(pos); | ||
962 | int len = strlen(name); | ||
963 | ino_t ino = pos->s_ino; | ||
964 | |||
965 | ctx->pos = pos->s_hash; | ||
966 | file->private_data = pos; | ||
967 | kernfs_get(pos); | ||
968 | |||
969 | mutex_unlock(&sysfs_mutex); | ||
970 | if (!dir_emit(ctx, name, len, ino, type)) | ||
971 | return 0; | ||
972 | mutex_lock(&sysfs_mutex); | ||
973 | } | ||
974 | mutex_unlock(&sysfs_mutex); | ||
975 | file->private_data = NULL; | ||
976 | ctx->pos = INT_MAX; | ||
977 | return 0; | ||
978 | } | ||
979 | |||
980 | static loff_t sysfs_dir_llseek(struct file *file, loff_t offset, int whence) | ||
981 | { | ||
982 | struct inode *inode = file_inode(file); | ||
983 | loff_t ret; | ||
984 | |||
985 | mutex_lock(&inode->i_mutex); | ||
986 | ret = generic_file_llseek(file, offset, whence); | ||
987 | mutex_unlock(&inode->i_mutex); | ||
988 | |||
989 | return ret; | ||
990 | } | ||
991 | |||
992 | const struct file_operations sysfs_dir_operations = { | ||
993 | .read = generic_read_dir, | ||
994 | .iterate = sysfs_readdir, | ||
995 | .release = sysfs_dir_release, | ||
996 | .llseek = sysfs_dir_llseek, | ||
997 | }; | ||
diff --git a/fs/kernfs/kernfs-internal.h b/fs/kernfs/kernfs-internal.h index 933ac8d5d07a..31f0dbe1881b 100644 --- a/fs/kernfs/kernfs-internal.h +++ b/fs/kernfs/kernfs-internal.h | |||
@@ -14,6 +14,7 @@ | |||
14 | #include <linux/lockdep.h> | 14 | #include <linux/lockdep.h> |
15 | #include <linux/fs.h> | 15 | #include <linux/fs.h> |
16 | #include <linux/rbtree.h> | 16 | #include <linux/rbtree.h> |
17 | #include <linux/mutex.h> | ||
17 | 18 | ||
18 | #include <linux/kernfs.h> | 19 | #include <linux/kernfs.h> |
19 | 20 | ||
@@ -125,4 +126,20 @@ int sysfs_setxattr(struct dentry *dentry, const char *name, const void *value, | |||
125 | size_t size, int flags); | 126 | size_t size, int flags); |
126 | int sysfs_inode_init(void); | 127 | int sysfs_inode_init(void); |
127 | 128 | ||
129 | /* | ||
130 | * dir.c | ||
131 | */ | ||
132 | extern struct mutex sysfs_mutex; | ||
133 | extern const struct dentry_operations sysfs_dentry_ops; | ||
134 | extern const struct file_operations sysfs_dir_operations; | ||
135 | extern const struct inode_operations sysfs_dir_inode_operations; | ||
136 | |||
137 | struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd); | ||
138 | void sysfs_put_active(struct sysfs_dirent *sd); | ||
139 | void sysfs_addrm_start(struct sysfs_addrm_cxt *acxt); | ||
140 | int sysfs_add_one(struct sysfs_addrm_cxt *acxt, struct sysfs_dirent *sd, | ||
141 | struct sysfs_dirent *parent_sd); | ||
142 | void sysfs_addrm_finish(struct sysfs_addrm_cxt *acxt); | ||
143 | struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type); | ||
144 | |||
128 | #endif /* __KERNFS_INTERNAL_H */ | 145 | #endif /* __KERNFS_INTERNAL_H */ |