diff options
author | Tejun Heo <tj@kernel.org> | 2013-11-28 14:54:34 -0500 |
---|---|---|
committer | Greg Kroah-Hartman <gregkh@linuxfoundation.org> | 2013-11-29 21:08:39 -0500 |
commit | 414985ae23c031efbd6d16d484dea8b5de28b8f7 (patch) | |
tree | 06813b5fec1e2e46d9a86cd79e0dd9d23a8d51a0 /fs/kernfs/file.c | |
parent | fd7b9f7b9776b11df629e9dd3865320bf57ce588 (diff) |
sysfs, kernfs: move file core code to fs/kernfs/file.c
Move core file code to fs/kernfs/file.c. fs/sysfs/file.c now contains
sysfs kernfs_ops callbacks, sysfs wrappers around kernfs interfaces,
and sysfs_schedule_callback(). The respective declarations in
fs/sysfs/sysfs.h are moved to fs/kernfs/kernfs-internal.h.
This is pure relocation.
v2: Refreshed on top of the v2 of "sysfs, kernfs: prepare read path
for kernfs".
v3: Refreshed on top of the v3 of "sysfs, kernfs: prepare read path
for kernfs".
Signed-off-by: Tejun Heo <tj@kernel.org>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Diffstat (limited to 'fs/kernfs/file.c')
-rw-r--r-- | fs/kernfs/file.c | 805 |
1 files changed, 805 insertions, 0 deletions
diff --git a/fs/kernfs/file.c b/fs/kernfs/file.c index 90b1e88dad44..fa172e86047f 100644 --- a/fs/kernfs/file.c +++ b/fs/kernfs/file.c | |||
@@ -7,3 +7,808 @@ | |||
7 | * | 7 | * |
8 | * This file is released under the GPLv2. | 8 | * This file is released under the GPLv2. |
9 | */ | 9 | */ |
10 | |||
11 | #include <linux/fs.h> | ||
12 | #include <linux/seq_file.h> | ||
13 | #include <linux/slab.h> | ||
14 | #include <linux/poll.h> | ||
15 | #include <linux/pagemap.h> | ||
16 | #include <linux/poll.h> | ||
17 | #include <linux/sched.h> | ||
18 | |||
19 | #include "kernfs-internal.h" | ||
20 | |||
21 | /* | ||
22 | * There's one sysfs_open_file for each open file and one sysfs_open_dirent | ||
23 | * for each sysfs_dirent with one or more open files. | ||
24 | * | ||
25 | * sysfs_dirent->s_attr.open points to sysfs_open_dirent. s_attr.open is | ||
26 | * protected by sysfs_open_dirent_lock. | ||
27 | * | ||
28 | * filp->private_data points to seq_file whose ->private points to | ||
29 | * sysfs_open_file. sysfs_open_files are chained at | ||
30 | * sysfs_open_dirent->files, which is protected by sysfs_open_file_mutex. | ||
31 | */ | ||
32 | static DEFINE_SPINLOCK(sysfs_open_dirent_lock); | ||
33 | static DEFINE_MUTEX(sysfs_open_file_mutex); | ||
34 | |||
35 | struct sysfs_open_dirent { | ||
36 | atomic_t refcnt; | ||
37 | atomic_t event; | ||
38 | wait_queue_head_t poll; | ||
39 | struct list_head files; /* goes through sysfs_open_file.list */ | ||
40 | }; | ||
41 | |||
42 | static struct sysfs_open_file *sysfs_of(struct file *file) | ||
43 | { | ||
44 | return ((struct seq_file *)file->private_data)->private; | ||
45 | } | ||
46 | |||
47 | /* | ||
48 | * Determine the kernfs_ops for the given sysfs_dirent. This function must | ||
49 | * be called while holding an active reference. | ||
50 | */ | ||
51 | static const struct kernfs_ops *kernfs_ops(struct sysfs_dirent *sd) | ||
52 | { | ||
53 | if (sd->s_flags & SYSFS_FLAG_LOCKDEP) | ||
54 | lockdep_assert_held(sd); | ||
55 | return sd->s_attr.ops; | ||
56 | } | ||
57 | |||
58 | static void *kernfs_seq_start(struct seq_file *sf, loff_t *ppos) | ||
59 | { | ||
60 | struct sysfs_open_file *of = sf->private; | ||
61 | const struct kernfs_ops *ops; | ||
62 | |||
63 | /* | ||
64 | * @of->mutex nests outside active ref and is just to ensure that | ||
65 | * the ops aren't called concurrently for the same open file. | ||
66 | */ | ||
67 | mutex_lock(&of->mutex); | ||
68 | if (!sysfs_get_active(of->sd)) | ||
69 | return ERR_PTR(-ENODEV); | ||
70 | |||
71 | ops = kernfs_ops(of->sd); | ||
72 | if (ops->seq_start) { | ||
73 | return ops->seq_start(sf, ppos); | ||
74 | } else { | ||
75 | /* | ||
76 | * The same behavior and code as single_open(). Returns | ||
77 | * !NULL if pos is at the beginning; otherwise, NULL. | ||
78 | */ | ||
79 | return NULL + !*ppos; | ||
80 | } | ||
81 | } | ||
82 | |||
83 | static void *kernfs_seq_next(struct seq_file *sf, void *v, loff_t *ppos) | ||
84 | { | ||
85 | struct sysfs_open_file *of = sf->private; | ||
86 | const struct kernfs_ops *ops = kernfs_ops(of->sd); | ||
87 | |||
88 | if (ops->seq_next) { | ||
89 | return ops->seq_next(sf, v, ppos); | ||
90 | } else { | ||
91 | /* | ||
92 | * The same behavior and code as single_open(), always | ||
93 | * terminate after the initial read. | ||
94 | */ | ||
95 | ++*ppos; | ||
96 | return NULL; | ||
97 | } | ||
98 | } | ||
99 | |||
100 | static void kernfs_seq_stop(struct seq_file *sf, void *v) | ||
101 | { | ||
102 | struct sysfs_open_file *of = sf->private; | ||
103 | const struct kernfs_ops *ops = kernfs_ops(of->sd); | ||
104 | |||
105 | if (ops->seq_stop) | ||
106 | ops->seq_stop(sf, v); | ||
107 | |||
108 | sysfs_put_active(of->sd); | ||
109 | mutex_unlock(&of->mutex); | ||
110 | } | ||
111 | |||
112 | static int kernfs_seq_show(struct seq_file *sf, void *v) | ||
113 | { | ||
114 | struct sysfs_open_file *of = sf->private; | ||
115 | |||
116 | of->event = atomic_read(&of->sd->s_attr.open->event); | ||
117 | |||
118 | return of->sd->s_attr.ops->seq_show(sf, v); | ||
119 | } | ||
120 | |||
121 | static const struct seq_operations kernfs_seq_ops = { | ||
122 | .start = kernfs_seq_start, | ||
123 | .next = kernfs_seq_next, | ||
124 | .stop = kernfs_seq_stop, | ||
125 | .show = kernfs_seq_show, | ||
126 | }; | ||
127 | |||
128 | /* | ||
129 | * As reading a bin file can have side-effects, the exact offset and bytes | ||
130 | * specified in read(2) call should be passed to the read callback making | ||
131 | * it difficult to use seq_file. Implement simplistic custom buffering for | ||
132 | * bin files. | ||
133 | */ | ||
134 | static ssize_t kernfs_file_direct_read(struct sysfs_open_file *of, | ||
135 | char __user *user_buf, size_t count, | ||
136 | loff_t *ppos) | ||
137 | { | ||
138 | ssize_t len = min_t(size_t, count, PAGE_SIZE); | ||
139 | const struct kernfs_ops *ops; | ||
140 | char *buf; | ||
141 | |||
142 | buf = kmalloc(len, GFP_KERNEL); | ||
143 | if (!buf) | ||
144 | return -ENOMEM; | ||
145 | |||
146 | /* | ||
147 | * @of->mutex nests outside active ref and is just to ensure that | ||
148 | * the ops aren't called concurrently for the same open file. | ||
149 | */ | ||
150 | mutex_lock(&of->mutex); | ||
151 | if (!sysfs_get_active(of->sd)) { | ||
152 | len = -ENODEV; | ||
153 | mutex_unlock(&of->mutex); | ||
154 | goto out_free; | ||
155 | } | ||
156 | |||
157 | ops = kernfs_ops(of->sd); | ||
158 | if (ops->read) | ||
159 | len = ops->read(of, buf, len, *ppos); | ||
160 | else | ||
161 | len = -EINVAL; | ||
162 | |||
163 | sysfs_put_active(of->sd); | ||
164 | mutex_unlock(&of->mutex); | ||
165 | |||
166 | if (len < 0) | ||
167 | goto out_free; | ||
168 | |||
169 | if (copy_to_user(user_buf, buf, len)) { | ||
170 | len = -EFAULT; | ||
171 | goto out_free; | ||
172 | } | ||
173 | |||
174 | *ppos += len; | ||
175 | |||
176 | out_free: | ||
177 | kfree(buf); | ||
178 | return len; | ||
179 | } | ||
180 | |||
181 | /** | ||
182 | * kernfs_file_read - kernfs vfs read callback | ||
183 | * @file: file pointer | ||
184 | * @user_buf: data to write | ||
185 | * @count: number of bytes | ||
186 | * @ppos: starting offset | ||
187 | */ | ||
188 | static ssize_t kernfs_file_read(struct file *file, char __user *user_buf, | ||
189 | size_t count, loff_t *ppos) | ||
190 | { | ||
191 | struct sysfs_open_file *of = sysfs_of(file); | ||
192 | |||
193 | if (of->sd->s_flags & SYSFS_FLAG_HAS_SEQ_SHOW) | ||
194 | return seq_read(file, user_buf, count, ppos); | ||
195 | else | ||
196 | return kernfs_file_direct_read(of, user_buf, count, ppos); | ||
197 | } | ||
198 | |||
199 | /** | ||
200 | * kernfs_file_write - kernfs vfs write callback | ||
201 | * @file: file pointer | ||
202 | * @user_buf: data to write | ||
203 | * @count: number of bytes | ||
204 | * @ppos: starting offset | ||
205 | * | ||
206 | * Copy data in from userland and pass it to the matching kernfs write | ||
207 | * operation. | ||
208 | * | ||
209 | * There is no easy way for us to know if userspace is only doing a partial | ||
210 | * write, so we don't support them. We expect the entire buffer to come on | ||
211 | * the first write. Hint: if you're writing a value, first read the file, | ||
212 | * modify only the the value you're changing, then write entire buffer | ||
213 | * back. | ||
214 | */ | ||
215 | static ssize_t kernfs_file_write(struct file *file, const char __user *user_buf, | ||
216 | size_t count, loff_t *ppos) | ||
217 | { | ||
218 | struct sysfs_open_file *of = sysfs_of(file); | ||
219 | ssize_t len = min_t(size_t, count, PAGE_SIZE); | ||
220 | const struct kernfs_ops *ops; | ||
221 | char *buf; | ||
222 | |||
223 | buf = kmalloc(len + 1, GFP_KERNEL); | ||
224 | if (!buf) | ||
225 | return -ENOMEM; | ||
226 | |||
227 | if (copy_from_user(buf, user_buf, len)) { | ||
228 | len = -EFAULT; | ||
229 | goto out_free; | ||
230 | } | ||
231 | buf[len] = '\0'; /* guarantee string termination */ | ||
232 | |||
233 | /* | ||
234 | * @of->mutex nests outside active ref and is just to ensure that | ||
235 | * the ops aren't called concurrently for the same open file. | ||
236 | */ | ||
237 | mutex_lock(&of->mutex); | ||
238 | if (!sysfs_get_active(of->sd)) { | ||
239 | mutex_unlock(&of->mutex); | ||
240 | len = -ENODEV; | ||
241 | goto out_free; | ||
242 | } | ||
243 | |||
244 | ops = kernfs_ops(of->sd); | ||
245 | if (ops->write) | ||
246 | len = ops->write(of, buf, len, *ppos); | ||
247 | else | ||
248 | len = -EINVAL; | ||
249 | |||
250 | sysfs_put_active(of->sd); | ||
251 | mutex_unlock(&of->mutex); | ||
252 | |||
253 | if (len > 0) | ||
254 | *ppos += len; | ||
255 | out_free: | ||
256 | kfree(buf); | ||
257 | return len; | ||
258 | } | ||
259 | |||
260 | static void kernfs_vma_open(struct vm_area_struct *vma) | ||
261 | { | ||
262 | struct file *file = vma->vm_file; | ||
263 | struct sysfs_open_file *of = sysfs_of(file); | ||
264 | |||
265 | if (!of->vm_ops) | ||
266 | return; | ||
267 | |||
268 | if (!sysfs_get_active(of->sd)) | ||
269 | return; | ||
270 | |||
271 | if (of->vm_ops->open) | ||
272 | of->vm_ops->open(vma); | ||
273 | |||
274 | sysfs_put_active(of->sd); | ||
275 | } | ||
276 | |||
277 | static int kernfs_vma_fault(struct vm_area_struct *vma, struct vm_fault *vmf) | ||
278 | { | ||
279 | struct file *file = vma->vm_file; | ||
280 | struct sysfs_open_file *of = sysfs_of(file); | ||
281 | int ret; | ||
282 | |||
283 | if (!of->vm_ops) | ||
284 | return VM_FAULT_SIGBUS; | ||
285 | |||
286 | if (!sysfs_get_active(of->sd)) | ||
287 | return VM_FAULT_SIGBUS; | ||
288 | |||
289 | ret = VM_FAULT_SIGBUS; | ||
290 | if (of->vm_ops->fault) | ||
291 | ret = of->vm_ops->fault(vma, vmf); | ||
292 | |||
293 | sysfs_put_active(of->sd); | ||
294 | return ret; | ||
295 | } | ||
296 | |||
297 | static int kernfs_vma_page_mkwrite(struct vm_area_struct *vma, | ||
298 | struct vm_fault *vmf) | ||
299 | { | ||
300 | struct file *file = vma->vm_file; | ||
301 | struct sysfs_open_file *of = sysfs_of(file); | ||
302 | int ret; | ||
303 | |||
304 | if (!of->vm_ops) | ||
305 | return VM_FAULT_SIGBUS; | ||
306 | |||
307 | if (!sysfs_get_active(of->sd)) | ||
308 | return VM_FAULT_SIGBUS; | ||
309 | |||
310 | ret = 0; | ||
311 | if (of->vm_ops->page_mkwrite) | ||
312 | ret = of->vm_ops->page_mkwrite(vma, vmf); | ||
313 | else | ||
314 | file_update_time(file); | ||
315 | |||
316 | sysfs_put_active(of->sd); | ||
317 | return ret; | ||
318 | } | ||
319 | |||
320 | static int kernfs_vma_access(struct vm_area_struct *vma, unsigned long addr, | ||
321 | void *buf, int len, int write) | ||
322 | { | ||
323 | struct file *file = vma->vm_file; | ||
324 | struct sysfs_open_file *of = sysfs_of(file); | ||
325 | int ret; | ||
326 | |||
327 | if (!of->vm_ops) | ||
328 | return -EINVAL; | ||
329 | |||
330 | if (!sysfs_get_active(of->sd)) | ||
331 | return -EINVAL; | ||
332 | |||
333 | ret = -EINVAL; | ||
334 | if (of->vm_ops->access) | ||
335 | ret = of->vm_ops->access(vma, addr, buf, len, write); | ||
336 | |||
337 | sysfs_put_active(of->sd); | ||
338 | return ret; | ||
339 | } | ||
340 | |||
341 | #ifdef CONFIG_NUMA | ||
342 | static int kernfs_vma_set_policy(struct vm_area_struct *vma, | ||
343 | struct mempolicy *new) | ||
344 | { | ||
345 | struct file *file = vma->vm_file; | ||
346 | struct sysfs_open_file *of = sysfs_of(file); | ||
347 | int ret; | ||
348 | |||
349 | if (!of->vm_ops) | ||
350 | return 0; | ||
351 | |||
352 | if (!sysfs_get_active(of->sd)) | ||
353 | return -EINVAL; | ||
354 | |||
355 | ret = 0; | ||
356 | if (of->vm_ops->set_policy) | ||
357 | ret = of->vm_ops->set_policy(vma, new); | ||
358 | |||
359 | sysfs_put_active(of->sd); | ||
360 | return ret; | ||
361 | } | ||
362 | |||
363 | static struct mempolicy *kernfs_vma_get_policy(struct vm_area_struct *vma, | ||
364 | unsigned long addr) | ||
365 | { | ||
366 | struct file *file = vma->vm_file; | ||
367 | struct sysfs_open_file *of = sysfs_of(file); | ||
368 | struct mempolicy *pol; | ||
369 | |||
370 | if (!of->vm_ops) | ||
371 | return vma->vm_policy; | ||
372 | |||
373 | if (!sysfs_get_active(of->sd)) | ||
374 | return vma->vm_policy; | ||
375 | |||
376 | pol = vma->vm_policy; | ||
377 | if (of->vm_ops->get_policy) | ||
378 | pol = of->vm_ops->get_policy(vma, addr); | ||
379 | |||
380 | sysfs_put_active(of->sd); | ||
381 | return pol; | ||
382 | } | ||
383 | |||
384 | static int kernfs_vma_migrate(struct vm_area_struct *vma, | ||
385 | const nodemask_t *from, const nodemask_t *to, | ||
386 | unsigned long flags) | ||
387 | { | ||
388 | struct file *file = vma->vm_file; | ||
389 | struct sysfs_open_file *of = sysfs_of(file); | ||
390 | int ret; | ||
391 | |||
392 | if (!of->vm_ops) | ||
393 | return 0; | ||
394 | |||
395 | if (!sysfs_get_active(of->sd)) | ||
396 | return 0; | ||
397 | |||
398 | ret = 0; | ||
399 | if (of->vm_ops->migrate) | ||
400 | ret = of->vm_ops->migrate(vma, from, to, flags); | ||
401 | |||
402 | sysfs_put_active(of->sd); | ||
403 | return ret; | ||
404 | } | ||
405 | #endif | ||
406 | |||
407 | static const struct vm_operations_struct kernfs_vm_ops = { | ||
408 | .open = kernfs_vma_open, | ||
409 | .fault = kernfs_vma_fault, | ||
410 | .page_mkwrite = kernfs_vma_page_mkwrite, | ||
411 | .access = kernfs_vma_access, | ||
412 | #ifdef CONFIG_NUMA | ||
413 | .set_policy = kernfs_vma_set_policy, | ||
414 | .get_policy = kernfs_vma_get_policy, | ||
415 | .migrate = kernfs_vma_migrate, | ||
416 | #endif | ||
417 | }; | ||
418 | |||
419 | static int kernfs_file_mmap(struct file *file, struct vm_area_struct *vma) | ||
420 | { | ||
421 | struct sysfs_open_file *of = sysfs_of(file); | ||
422 | const struct kernfs_ops *ops; | ||
423 | int rc; | ||
424 | |||
425 | mutex_lock(&of->mutex); | ||
426 | |||
427 | rc = -ENODEV; | ||
428 | if (!sysfs_get_active(of->sd)) | ||
429 | goto out_unlock; | ||
430 | |||
431 | ops = kernfs_ops(of->sd); | ||
432 | if (ops->mmap) | ||
433 | rc = ops->mmap(of, vma); | ||
434 | if (rc) | ||
435 | goto out_put; | ||
436 | |||
437 | /* | ||
438 | * PowerPC's pci_mmap of legacy_mem uses shmem_zero_setup() | ||
439 | * to satisfy versions of X which crash if the mmap fails: that | ||
440 | * substitutes a new vm_file, and we don't then want bin_vm_ops. | ||
441 | */ | ||
442 | if (vma->vm_file != file) | ||
443 | goto out_put; | ||
444 | |||
445 | rc = -EINVAL; | ||
446 | if (of->mmapped && of->vm_ops != vma->vm_ops) | ||
447 | goto out_put; | ||
448 | |||
449 | /* | ||
450 | * It is not possible to successfully wrap close. | ||
451 | * So error if someone is trying to use close. | ||
452 | */ | ||
453 | rc = -EINVAL; | ||
454 | if (vma->vm_ops && vma->vm_ops->close) | ||
455 | goto out_put; | ||
456 | |||
457 | rc = 0; | ||
458 | of->mmapped = 1; | ||
459 | of->vm_ops = vma->vm_ops; | ||
460 | vma->vm_ops = &kernfs_vm_ops; | ||
461 | out_put: | ||
462 | sysfs_put_active(of->sd); | ||
463 | out_unlock: | ||
464 | mutex_unlock(&of->mutex); | ||
465 | |||
466 | return rc; | ||
467 | } | ||
468 | |||
469 | /** | ||
470 | * sysfs_get_open_dirent - get or create sysfs_open_dirent | ||
471 | * @sd: target sysfs_dirent | ||
472 | * @of: sysfs_open_file for this instance of open | ||
473 | * | ||
474 | * If @sd->s_attr.open exists, increment its reference count; | ||
475 | * otherwise, create one. @of is chained to the files list. | ||
476 | * | ||
477 | * LOCKING: | ||
478 | * Kernel thread context (may sleep). | ||
479 | * | ||
480 | * RETURNS: | ||
481 | * 0 on success, -errno on failure. | ||
482 | */ | ||
483 | static int sysfs_get_open_dirent(struct sysfs_dirent *sd, | ||
484 | struct sysfs_open_file *of) | ||
485 | { | ||
486 | struct sysfs_open_dirent *od, *new_od = NULL; | ||
487 | |||
488 | retry: | ||
489 | mutex_lock(&sysfs_open_file_mutex); | ||
490 | spin_lock_irq(&sysfs_open_dirent_lock); | ||
491 | |||
492 | if (!sd->s_attr.open && new_od) { | ||
493 | sd->s_attr.open = new_od; | ||
494 | new_od = NULL; | ||
495 | } | ||
496 | |||
497 | od = sd->s_attr.open; | ||
498 | if (od) { | ||
499 | atomic_inc(&od->refcnt); | ||
500 | list_add_tail(&of->list, &od->files); | ||
501 | } | ||
502 | |||
503 | spin_unlock_irq(&sysfs_open_dirent_lock); | ||
504 | mutex_unlock(&sysfs_open_file_mutex); | ||
505 | |||
506 | if (od) { | ||
507 | kfree(new_od); | ||
508 | return 0; | ||
509 | } | ||
510 | |||
511 | /* not there, initialize a new one and retry */ | ||
512 | new_od = kmalloc(sizeof(*new_od), GFP_KERNEL); | ||
513 | if (!new_od) | ||
514 | return -ENOMEM; | ||
515 | |||
516 | atomic_set(&new_od->refcnt, 0); | ||
517 | atomic_set(&new_od->event, 1); | ||
518 | init_waitqueue_head(&new_od->poll); | ||
519 | INIT_LIST_HEAD(&new_od->files); | ||
520 | goto retry; | ||
521 | } | ||
522 | |||
523 | /** | ||
524 | * sysfs_put_open_dirent - put sysfs_open_dirent | ||
525 | * @sd: target sysfs_dirent | ||
526 | * @of: associated sysfs_open_file | ||
527 | * | ||
528 | * Put @sd->s_attr.open and unlink @of from the files list. If | ||
529 | * reference count reaches zero, disassociate and free it. | ||
530 | * | ||
531 | * LOCKING: | ||
532 | * None. | ||
533 | */ | ||
534 | static void sysfs_put_open_dirent(struct sysfs_dirent *sd, | ||
535 | struct sysfs_open_file *of) | ||
536 | { | ||
537 | struct sysfs_open_dirent *od = sd->s_attr.open; | ||
538 | unsigned long flags; | ||
539 | |||
540 | mutex_lock(&sysfs_open_file_mutex); | ||
541 | spin_lock_irqsave(&sysfs_open_dirent_lock, flags); | ||
542 | |||
543 | if (of) | ||
544 | list_del(&of->list); | ||
545 | |||
546 | if (atomic_dec_and_test(&od->refcnt)) | ||
547 | sd->s_attr.open = NULL; | ||
548 | else | ||
549 | od = NULL; | ||
550 | |||
551 | spin_unlock_irqrestore(&sysfs_open_dirent_lock, flags); | ||
552 | mutex_unlock(&sysfs_open_file_mutex); | ||
553 | |||
554 | kfree(od); | ||
555 | } | ||
556 | |||
557 | static int kernfs_file_open(struct inode *inode, struct file *file) | ||
558 | { | ||
559 | struct sysfs_dirent *attr_sd = file->f_path.dentry->d_fsdata; | ||
560 | const struct kernfs_ops *ops; | ||
561 | struct sysfs_open_file *of; | ||
562 | bool has_read, has_write, has_mmap; | ||
563 | int error = -EACCES; | ||
564 | |||
565 | if (!sysfs_get_active(attr_sd)) | ||
566 | return -ENODEV; | ||
567 | |||
568 | ops = kernfs_ops(attr_sd); | ||
569 | |||
570 | has_read = ops->seq_show || ops->read || ops->mmap; | ||
571 | has_write = ops->write || ops->mmap; | ||
572 | has_mmap = ops->mmap; | ||
573 | |||
574 | /* check perms and supported operations */ | ||
575 | if ((file->f_mode & FMODE_WRITE) && | ||
576 | (!(inode->i_mode & S_IWUGO) || !has_write)) | ||
577 | goto err_out; | ||
578 | |||
579 | if ((file->f_mode & FMODE_READ) && | ||
580 | (!(inode->i_mode & S_IRUGO) || !has_read)) | ||
581 | goto err_out; | ||
582 | |||
583 | /* allocate a sysfs_open_file for the file */ | ||
584 | error = -ENOMEM; | ||
585 | of = kzalloc(sizeof(struct sysfs_open_file), GFP_KERNEL); | ||
586 | if (!of) | ||
587 | goto err_out; | ||
588 | |||
589 | /* | ||
590 | * The following is done to give a different lockdep key to | ||
591 | * @of->mutex for files which implement mmap. This is a rather | ||
592 | * crude way to avoid false positive lockdep warning around | ||
593 | * mm->mmap_sem - mmap nests @of->mutex under mm->mmap_sem and | ||
594 | * reading /sys/block/sda/trace/act_mask grabs sr_mutex, under | ||
595 | * which mm->mmap_sem nests, while holding @of->mutex. As each | ||
596 | * open file has a separate mutex, it's okay as long as those don't | ||
597 | * happen on the same file. At this point, we can't easily give | ||
598 | * each file a separate locking class. Let's differentiate on | ||
599 | * whether the file has mmap or not for now. | ||
600 | */ | ||
601 | if (has_mmap) | ||
602 | mutex_init(&of->mutex); | ||
603 | else | ||
604 | mutex_init(&of->mutex); | ||
605 | |||
606 | of->sd = attr_sd; | ||
607 | of->file = file; | ||
608 | |||
609 | /* | ||
610 | * Always instantiate seq_file even if read access doesn't use | ||
611 | * seq_file or is not requested. This unifies private data access | ||
612 | * and readable regular files are the vast majority anyway. | ||
613 | */ | ||
614 | if (ops->seq_show) | ||
615 | error = seq_open(file, &kernfs_seq_ops); | ||
616 | else | ||
617 | error = seq_open(file, NULL); | ||
618 | if (error) | ||
619 | goto err_free; | ||
620 | |||
621 | ((struct seq_file *)file->private_data)->private = of; | ||
622 | |||
623 | /* seq_file clears PWRITE unconditionally, restore it if WRITE */ | ||
624 | if (file->f_mode & FMODE_WRITE) | ||
625 | file->f_mode |= FMODE_PWRITE; | ||
626 | |||
627 | /* make sure we have open dirent struct */ | ||
628 | error = sysfs_get_open_dirent(attr_sd, of); | ||
629 | if (error) | ||
630 | goto err_close; | ||
631 | |||
632 | /* open succeeded, put active references */ | ||
633 | sysfs_put_active(attr_sd); | ||
634 | return 0; | ||
635 | |||
636 | err_close: | ||
637 | seq_release(inode, file); | ||
638 | err_free: | ||
639 | kfree(of); | ||
640 | err_out: | ||
641 | sysfs_put_active(attr_sd); | ||
642 | return error; | ||
643 | } | ||
644 | |||
645 | static int kernfs_file_release(struct inode *inode, struct file *filp) | ||
646 | { | ||
647 | struct sysfs_dirent *sd = filp->f_path.dentry->d_fsdata; | ||
648 | struct sysfs_open_file *of = sysfs_of(filp); | ||
649 | |||
650 | sysfs_put_open_dirent(sd, of); | ||
651 | seq_release(inode, filp); | ||
652 | kfree(of); | ||
653 | |||
654 | return 0; | ||
655 | } | ||
656 | |||
657 | void sysfs_unmap_bin_file(struct sysfs_dirent *sd) | ||
658 | { | ||
659 | struct sysfs_open_dirent *od; | ||
660 | struct sysfs_open_file *of; | ||
661 | |||
662 | if (!(sd->s_flags & SYSFS_FLAG_HAS_MMAP)) | ||
663 | return; | ||
664 | |||
665 | spin_lock_irq(&sysfs_open_dirent_lock); | ||
666 | od = sd->s_attr.open; | ||
667 | if (od) | ||
668 | atomic_inc(&od->refcnt); | ||
669 | spin_unlock_irq(&sysfs_open_dirent_lock); | ||
670 | if (!od) | ||
671 | return; | ||
672 | |||
673 | mutex_lock(&sysfs_open_file_mutex); | ||
674 | list_for_each_entry(of, &od->files, list) { | ||
675 | struct inode *inode = file_inode(of->file); | ||
676 | unmap_mapping_range(inode->i_mapping, 0, 0, 1); | ||
677 | } | ||
678 | mutex_unlock(&sysfs_open_file_mutex); | ||
679 | |||
680 | sysfs_put_open_dirent(sd, NULL); | ||
681 | } | ||
682 | |||
683 | /* Sysfs attribute files are pollable. The idea is that you read | ||
684 | * the content and then you use 'poll' or 'select' to wait for | ||
685 | * the content to change. When the content changes (assuming the | ||
686 | * manager for the kobject supports notification), poll will | ||
687 | * return POLLERR|POLLPRI, and select will return the fd whether | ||
688 | * it is waiting for read, write, or exceptions. | ||
689 | * Once poll/select indicates that the value has changed, you | ||
690 | * need to close and re-open the file, or seek to 0 and read again. | ||
691 | * Reminder: this only works for attributes which actively support | ||
692 | * it, and it is not possible to test an attribute from userspace | ||
693 | * to see if it supports poll (Neither 'poll' nor 'select' return | ||
694 | * an appropriate error code). When in doubt, set a suitable timeout value. | ||
695 | */ | ||
696 | static unsigned int kernfs_file_poll(struct file *filp, poll_table *wait) | ||
697 | { | ||
698 | struct sysfs_open_file *of = sysfs_of(filp); | ||
699 | struct sysfs_dirent *attr_sd = filp->f_path.dentry->d_fsdata; | ||
700 | struct sysfs_open_dirent *od = attr_sd->s_attr.open; | ||
701 | |||
702 | /* need parent for the kobj, grab both */ | ||
703 | if (!sysfs_get_active(attr_sd)) | ||
704 | goto trigger; | ||
705 | |||
706 | poll_wait(filp, &od->poll, wait); | ||
707 | |||
708 | sysfs_put_active(attr_sd); | ||
709 | |||
710 | if (of->event != atomic_read(&od->event)) | ||
711 | goto trigger; | ||
712 | |||
713 | return DEFAULT_POLLMASK; | ||
714 | |||
715 | trigger: | ||
716 | return DEFAULT_POLLMASK|POLLERR|POLLPRI; | ||
717 | } | ||
718 | |||
719 | /** | ||
720 | * kernfs_notify - notify a kernfs file | ||
721 | * @sd: file to notify | ||
722 | * | ||
723 | * Notify @sd such that poll(2) on @sd wakes up. | ||
724 | */ | ||
725 | void kernfs_notify(struct sysfs_dirent *sd) | ||
726 | { | ||
727 | struct sysfs_open_dirent *od; | ||
728 | unsigned long flags; | ||
729 | |||
730 | spin_lock_irqsave(&sysfs_open_dirent_lock, flags); | ||
731 | |||
732 | if (!WARN_ON(sysfs_type(sd) != SYSFS_KOBJ_ATTR)) { | ||
733 | od = sd->s_attr.open; | ||
734 | if (od) { | ||
735 | atomic_inc(&od->event); | ||
736 | wake_up_interruptible(&od->poll); | ||
737 | } | ||
738 | } | ||
739 | |||
740 | spin_unlock_irqrestore(&sysfs_open_dirent_lock, flags); | ||
741 | } | ||
742 | EXPORT_SYMBOL_GPL(kernfs_notify); | ||
743 | |||
744 | const struct file_operations kernfs_file_operations = { | ||
745 | .read = kernfs_file_read, | ||
746 | .write = kernfs_file_write, | ||
747 | .llseek = generic_file_llseek, | ||
748 | .mmap = kernfs_file_mmap, | ||
749 | .open = kernfs_file_open, | ||
750 | .release = kernfs_file_release, | ||
751 | .poll = kernfs_file_poll, | ||
752 | }; | ||
753 | |||
754 | /** | ||
755 | * kernfs_create_file_ns_key - create a file | ||
756 | * @parent: directory to create the file in | ||
757 | * @name: name of the file | ||
758 | * @mode: mode of the file | ||
759 | * @size: size of the file | ||
760 | * @ops: kernfs operations for the file | ||
761 | * @priv: private data for the file | ||
762 | * @ns: optional namespace tag of the file | ||
763 | * @key: lockdep key for the file's active_ref, %NULL to disable lockdep | ||
764 | * | ||
765 | * Returns the created node on success, ERR_PTR() value on error. | ||
766 | */ | ||
767 | struct sysfs_dirent *kernfs_create_file_ns_key(struct sysfs_dirent *parent, | ||
768 | const char *name, | ||
769 | umode_t mode, loff_t size, | ||
770 | const struct kernfs_ops *ops, | ||
771 | void *priv, const void *ns, | ||
772 | struct lock_class_key *key) | ||
773 | { | ||
774 | struct sysfs_addrm_cxt acxt; | ||
775 | struct sysfs_dirent *sd; | ||
776 | int rc; | ||
777 | |||
778 | sd = sysfs_new_dirent(name, (mode & S_IALLUGO) | S_IFREG, | ||
779 | SYSFS_KOBJ_ATTR); | ||
780 | if (!sd) | ||
781 | return ERR_PTR(-ENOMEM); | ||
782 | |||
783 | sd->s_attr.ops = ops; | ||
784 | sd->s_attr.size = size; | ||
785 | sd->s_ns = ns; | ||
786 | sd->priv = priv; | ||
787 | |||
788 | #ifdef CONFIG_DEBUG_LOCK_ALLOC | ||
789 | if (key) { | ||
790 | lockdep_init_map(&sd->dep_map, "s_active", key, 0); | ||
791 | sd->s_flags |= SYSFS_FLAG_LOCKDEP; | ||
792 | } | ||
793 | #endif | ||
794 | |||
795 | /* | ||
796 | * sd->s_attr.ops is accesible only while holding active ref. We | ||
797 | * need to know whether some ops are implemented outside active | ||
798 | * ref. Cache their existence in flags. | ||
799 | */ | ||
800 | if (ops->seq_show) | ||
801 | sd->s_flags |= SYSFS_FLAG_HAS_SEQ_SHOW; | ||
802 | if (ops->mmap) | ||
803 | sd->s_flags |= SYSFS_FLAG_HAS_MMAP; | ||
804 | |||
805 | sysfs_addrm_start(&acxt); | ||
806 | rc = sysfs_add_one(&acxt, sd, parent); | ||
807 | sysfs_addrm_finish(&acxt); | ||
808 | |||
809 | if (rc) { | ||
810 | kernfs_put(sd); | ||
811 | return ERR_PTR(rc); | ||
812 | } | ||
813 | return sd; | ||
814 | } | ||