aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorMiklos Szeredi <miklos@szeredi.hu>2005-09-09 16:10:35 -0400
committerLinus Torvalds <torvalds@g5.osdl.org>2005-09-09 17:03:46 -0400
commit413ef8cb302511d8e995e2b0e5517ee1a65b9c77 (patch)
tree59acb15a73fa0dc4393a086fb83f016105d84b2a
parent5a53368277efa2d80dd2206dddc1f4b19ef0c32a (diff)
[PATCH] FUSE - direct I/O
This patch adds support for the "direct_io" mount option of FUSE. When this mount option is specified, the page cache is bypassed for read and write operations. This is useful for example, if the filesystem doesn't know the size of files before reading them, or when any kind of caching is harmful. Signed-off-by: Miklos Szeredi <miklos@szeredi.hu> Signed-off-by: Andrew Morton <akpm@osdl.org> Signed-off-by: Linus Torvalds <torvalds@osdl.org>
-rw-r--r--fs/fuse/file.c133
-rw-r--r--fs/fuse/fuse_i.h6
-rw-r--r--fs/fuse/inode.c9
3 files changed, 146 insertions, 2 deletions
diff --git a/fs/fuse/file.c b/fs/fuse/file.c
index 86ffb6db5fe7..6bc3fb26de39 100644
--- a/fs/fuse/file.c
+++ b/fs/fuse/file.c
@@ -363,6 +363,118 @@ static int fuse_commit_write(struct file *file, struct page *page,
363 return err; 363 return err;
364} 364}
365 365
366static void fuse_release_user_pages(struct fuse_req *req, int write)
367{
368 unsigned i;
369
370 for (i = 0; i < req->num_pages; i++) {
371 struct page *page = req->pages[i];
372 if (write)
373 set_page_dirty_lock(page);
374 put_page(page);
375 }
376}
377
378static int fuse_get_user_pages(struct fuse_req *req, const char __user *buf,
379 unsigned nbytes, int write)
380{
381 unsigned long user_addr = (unsigned long) buf;
382 unsigned offset = user_addr & ~PAGE_MASK;
383 int npages;
384
385 /* This doesn't work with nfsd */
386 if (!current->mm)
387 return -EPERM;
388
389 nbytes = min(nbytes, (unsigned) FUSE_MAX_PAGES_PER_REQ << PAGE_SHIFT);
390 npages = (nbytes + offset + PAGE_SIZE - 1) >> PAGE_SHIFT;
391 npages = min(npages, FUSE_MAX_PAGES_PER_REQ);
392 down_read(&current->mm->mmap_sem);
393 npages = get_user_pages(current, current->mm, user_addr, npages, write,
394 0, req->pages, NULL);
395 up_read(&current->mm->mmap_sem);
396 if (npages < 0)
397 return npages;
398
399 req->num_pages = npages;
400 req->page_offset = offset;
401 return 0;
402}
403
404static ssize_t fuse_direct_io(struct file *file, const char __user *buf,
405 size_t count, loff_t *ppos, int write)
406{
407 struct inode *inode = file->f_dentry->d_inode;
408 struct fuse_conn *fc = get_fuse_conn(inode);
409 size_t nmax = write ? fc->max_write : fc->max_read;
410 loff_t pos = *ppos;
411 ssize_t res = 0;
412 struct fuse_req *req = fuse_get_request(fc);
413 if (!req)
414 return -ERESTARTSYS;
415
416 while (count) {
417 size_t tmp;
418 size_t nres;
419 size_t nbytes = min(count, nmax);
420 int err = fuse_get_user_pages(req, buf, nbytes, !write);
421 if (err) {
422 res = err;
423 break;
424 }
425 tmp = (req->num_pages << PAGE_SHIFT) - req->page_offset;
426 nbytes = min(nbytes, tmp);
427 if (write)
428 nres = fuse_send_write(req, file, inode, pos, nbytes);
429 else
430 nres = fuse_send_read(req, file, inode, pos, nbytes);
431 fuse_release_user_pages(req, !write);
432 if (req->out.h.error) {
433 if (!res)
434 res = req->out.h.error;
435 break;
436 } else if (nres > nbytes) {
437 res = -EIO;
438 break;
439 }
440 count -= nres;
441 res += nres;
442 pos += nres;
443 buf += nres;
444 if (nres != nbytes)
445 break;
446 if (count)
447 fuse_reset_request(req);
448 }
449 fuse_put_request(fc, req);
450 if (res > 0) {
451 if (write && pos > i_size_read(inode))
452 i_size_write(inode, pos);
453 *ppos = pos;
454 } else if (write && (res == -EINTR || res == -EIO))
455 fuse_invalidate_attr(inode);
456
457 return res;
458}
459
460static ssize_t fuse_direct_read(struct file *file, char __user *buf,
461 size_t count, loff_t *ppos)
462{
463 return fuse_direct_io(file, buf, count, ppos, 0);
464}
465
466static ssize_t fuse_direct_write(struct file *file, const char __user *buf,
467 size_t count, loff_t *ppos)
468{
469 struct inode *inode = file->f_dentry->d_inode;
470 ssize_t res;
471 /* Don't allow parallel writes to the same file */
472 down(&inode->i_sem);
473 res = fuse_direct_io(file, buf, count, ppos, 1);
474 up(&inode->i_sem);
475 return res;
476}
477
366static int fuse_file_mmap(struct file *file, struct vm_area_struct *vma) 478static int fuse_file_mmap(struct file *file, struct vm_area_struct *vma)
367{ 479{
368 if ((vma->vm_flags & VM_SHARED)) { 480 if ((vma->vm_flags & VM_SHARED)) {
@@ -393,6 +505,17 @@ static struct file_operations fuse_file_operations = {
393 .sendfile = generic_file_sendfile, 505 .sendfile = generic_file_sendfile,
394}; 506};
395 507
508static struct file_operations fuse_direct_io_file_operations = {
509 .llseek = generic_file_llseek,
510 .read = fuse_direct_read,
511 .write = fuse_direct_write,
512 .open = fuse_open,
513 .flush = fuse_flush,
514 .release = fuse_release,
515 .fsync = fuse_fsync,
516 /* no mmap and sendfile */
517};
518
396static struct address_space_operations fuse_file_aops = { 519static struct address_space_operations fuse_file_aops = {
397 .readpage = fuse_readpage, 520 .readpage = fuse_readpage,
398 .prepare_write = fuse_prepare_write, 521 .prepare_write = fuse_prepare_write,
@@ -403,6 +526,12 @@ static struct address_space_operations fuse_file_aops = {
403 526
404void fuse_init_file_inode(struct inode *inode) 527void fuse_init_file_inode(struct inode *inode)
405{ 528{
406 inode->i_fop = &fuse_file_operations; 529 struct fuse_conn *fc = get_fuse_conn(inode);
407 inode->i_data.a_ops = &fuse_file_aops; 530
531 if (fc->flags & FUSE_DIRECT_IO)
532 inode->i_fop = &fuse_direct_io_file_operations;
533 else {
534 inode->i_fop = &fuse_file_operations;
535 inode->i_data.a_ops = &fuse_file_aops;
536 }
408} 537}
diff --git a/fs/fuse/fuse_i.h b/fs/fuse/fuse_i.h
index 3ec2aff3fdb5..0af1ac646927 100644
--- a/fs/fuse/fuse_i.h
+++ b/fs/fuse/fuse_i.h
@@ -34,6 +34,9 @@
34 be flushed on open */ 34 be flushed on open */
35#define FUSE_KERNEL_CACHE (1 << 2) 35#define FUSE_KERNEL_CACHE (1 << 2)
36 36
37/** Bypass the page cache for read and write operations */
38#define FUSE_DIRECT_IO (1 << 3)
39
37/** FUSE inode */ 40/** FUSE inode */
38struct fuse_inode { 41struct fuse_inode {
39 /** Inode data */ 42 /** Inode data */
@@ -207,6 +210,9 @@ struct fuse_conn {
207 /** Maximum read size */ 210 /** Maximum read size */
208 unsigned max_read; 211 unsigned max_read;
209 212
213 /** Maximum write size */
214 unsigned max_write;
215
210 /** Readers of the connection are waiting on this */ 216 /** Readers of the connection are waiting on this */
211 wait_queue_head_t waitq; 217 wait_queue_head_t waitq;
212 218
diff --git a/fs/fuse/inode.c b/fs/fuse/inode.c
index 298c1d4c1534..652c9d5df973 100644
--- a/fs/fuse/inode.c
+++ b/fs/fuse/inode.c
@@ -258,6 +258,7 @@ enum {
258 OPT_DEFAULT_PERMISSIONS, 258 OPT_DEFAULT_PERMISSIONS,
259 OPT_ALLOW_OTHER, 259 OPT_ALLOW_OTHER,
260 OPT_KERNEL_CACHE, 260 OPT_KERNEL_CACHE,
261 OPT_DIRECT_IO,
261 OPT_MAX_READ, 262 OPT_MAX_READ,
262 OPT_ERR 263 OPT_ERR
263}; 264};
@@ -270,6 +271,7 @@ static match_table_t tokens = {
270 {OPT_DEFAULT_PERMISSIONS, "default_permissions"}, 271 {OPT_DEFAULT_PERMISSIONS, "default_permissions"},
271 {OPT_ALLOW_OTHER, "allow_other"}, 272 {OPT_ALLOW_OTHER, "allow_other"},
272 {OPT_KERNEL_CACHE, "kernel_cache"}, 273 {OPT_KERNEL_CACHE, "kernel_cache"},
274 {OPT_DIRECT_IO, "direct_io"},
273 {OPT_MAX_READ, "max_read=%u"}, 275 {OPT_MAX_READ, "max_read=%u"},
274 {OPT_ERR, NULL} 276 {OPT_ERR, NULL}
275}; 277};
@@ -329,6 +331,10 @@ static int parse_fuse_opt(char *opt, struct fuse_mount_data *d)
329 d->flags |= FUSE_KERNEL_CACHE; 331 d->flags |= FUSE_KERNEL_CACHE;
330 break; 332 break;
331 333
334 case OPT_DIRECT_IO:
335 d->flags |= FUSE_DIRECT_IO;
336 break;
337
332 case OPT_MAX_READ: 338 case OPT_MAX_READ:
333 if (match_int(&args[0], &value)) 339 if (match_int(&args[0], &value))
334 return 0; 340 return 0;
@@ -359,6 +365,8 @@ static int fuse_show_options(struct seq_file *m, struct vfsmount *mnt)
359 seq_puts(m, ",allow_other"); 365 seq_puts(m, ",allow_other");
360 if (fc->flags & FUSE_KERNEL_CACHE) 366 if (fc->flags & FUSE_KERNEL_CACHE)
361 seq_puts(m, ",kernel_cache"); 367 seq_puts(m, ",kernel_cache");
368 if (fc->flags & FUSE_DIRECT_IO)
369 seq_puts(m, ",direct_io");
362 if (fc->max_read != ~0) 370 if (fc->max_read != ~0)
363 seq_printf(m, ",max_read=%u", fc->max_read); 371 seq_printf(m, ",max_read=%u", fc->max_read);
364 return 0; 372 return 0;
@@ -489,6 +497,7 @@ static int fuse_fill_super(struct super_block *sb, void *data, int silent)
489 fc->max_read = d.max_read; 497 fc->max_read = d.max_read;
490 if (fc->max_read / PAGE_CACHE_SIZE < fc->bdi.ra_pages) 498 if (fc->max_read / PAGE_CACHE_SIZE < fc->bdi.ra_pages)
491 fc->bdi.ra_pages = fc->max_read / PAGE_CACHE_SIZE; 499 fc->bdi.ra_pages = fc->max_read / PAGE_CACHE_SIZE;
500 fc->max_write = FUSE_MAX_IN / 2;
492 501
493 err = -ENOMEM; 502 err = -ENOMEM;
494 root = get_root_inode(sb, d.rootmode); 503 root = get_root_inode(sb, d.rootmode);