diff options
| author | Maxim Patlasov <MPatlasov@parallels.com> | 2013-10-02 13:38:32 -0400 |
|---|---|---|
| committer | Miklos Szeredi <mszeredi@suse.cz> | 2013-11-05 04:11:27 -0500 |
| commit | 6eaf4782eb09e28dbd13d23b9ce0fb7646daf37e (patch) | |
| tree | 10416e984f694f35454238a2b7f1b8f72a214bdb | |
| parent | f6011081f5e290756bd90fe96f1e86d3eac76f77 (diff) | |
fuse: writepages: crop secondary requests
If writeback happens while fuse is in FUSE_NOWRITE condition, the request
will be queued but not processed immediately (see fuse_flush_writepages()).
Until FUSE_NOWRITE becomes relaxed, more writebacks can happen. They will
be queued as "secondary" requests to that first ("primary") request.
Existing implementation crops only primary request. This is not correct
because a subsequent extending write(2) may increase i_size and then
secondary requests won't be cropped properly. The result would be stale
data written to the server to a file offset where zeros must be.
Similar problem may happen if secondary requests are attached to an
in-flight request that was already cropped.
The patch solves the issue by cropping all secondary requests in
fuse_writepage_end(). Thanks to Miklos for idea.
Signed-off-by: Maxim Patlasov <MPatlasov@parallels.com>
Signed-off-by: Miklos Szeredi <mszeredi@suse.cz>
| -rw-r--r-- | fs/fuse/file.c | 36 |
1 files changed, 31 insertions, 5 deletions
diff --git a/fs/fuse/file.c b/fs/fuse/file.c index 077b03844998..1cb303eba4d0 100644 --- a/fs/fuse/file.c +++ b/fs/fuse/file.c | |||
| @@ -1436,12 +1436,12 @@ static void fuse_writepage_finish(struct fuse_conn *fc, struct fuse_req *req) | |||
| 1436 | } | 1436 | } |
| 1437 | 1437 | ||
| 1438 | /* Called under fc->lock, may release and reacquire it */ | 1438 | /* Called under fc->lock, may release and reacquire it */ |
| 1439 | static void fuse_send_writepage(struct fuse_conn *fc, struct fuse_req *req) | 1439 | static void fuse_send_writepage(struct fuse_conn *fc, struct fuse_req *req, |
| 1440 | loff_t size) | ||
| 1440 | __releases(fc->lock) | 1441 | __releases(fc->lock) |
| 1441 | __acquires(fc->lock) | 1442 | __acquires(fc->lock) |
| 1442 | { | 1443 | { |
| 1443 | struct fuse_inode *fi = get_fuse_inode(req->inode); | 1444 | struct fuse_inode *fi = get_fuse_inode(req->inode); |
| 1444 | loff_t size = i_size_read(req->inode); | ||
| 1445 | struct fuse_write_in *inarg = &req->misc.write.in; | 1445 | struct fuse_write_in *inarg = &req->misc.write.in; |
| 1446 | __u64 data_size = req->num_pages * PAGE_CACHE_SIZE; | 1446 | __u64 data_size = req->num_pages * PAGE_CACHE_SIZE; |
| 1447 | 1447 | ||
| @@ -1482,12 +1482,13 @@ __acquires(fc->lock) | |||
| 1482 | { | 1482 | { |
| 1483 | struct fuse_conn *fc = get_fuse_conn(inode); | 1483 | struct fuse_conn *fc = get_fuse_conn(inode); |
| 1484 | struct fuse_inode *fi = get_fuse_inode(inode); | 1484 | struct fuse_inode *fi = get_fuse_inode(inode); |
| 1485 | size_t crop = i_size_read(inode); | ||
| 1485 | struct fuse_req *req; | 1486 | struct fuse_req *req; |
| 1486 | 1487 | ||
| 1487 | while (fi->writectr >= 0 && !list_empty(&fi->queued_writes)) { | 1488 | while (fi->writectr >= 0 && !list_empty(&fi->queued_writes)) { |
| 1488 | req = list_entry(fi->queued_writes.next, struct fuse_req, list); | 1489 | req = list_entry(fi->queued_writes.next, struct fuse_req, list); |
| 1489 | list_del_init(&req->list); | 1490 | list_del_init(&req->list); |
| 1490 | fuse_send_writepage(fc, req); | 1491 | fuse_send_writepage(fc, req, crop); |
| 1491 | } | 1492 | } |
| 1492 | } | 1493 | } |
| 1493 | 1494 | ||
| @@ -1499,12 +1500,37 @@ static void fuse_writepage_end(struct fuse_conn *fc, struct fuse_req *req) | |||
| 1499 | mapping_set_error(inode->i_mapping, req->out.h.error); | 1500 | mapping_set_error(inode->i_mapping, req->out.h.error); |
| 1500 | spin_lock(&fc->lock); | 1501 | spin_lock(&fc->lock); |
| 1501 | while (req->misc.write.next) { | 1502 | while (req->misc.write.next) { |
| 1503 | struct fuse_conn *fc = get_fuse_conn(inode); | ||
| 1504 | struct fuse_write_in *inarg = &req->misc.write.in; | ||
| 1502 | struct fuse_req *next = req->misc.write.next; | 1505 | struct fuse_req *next = req->misc.write.next; |
| 1503 | req->misc.write.next = next->misc.write.next; | 1506 | req->misc.write.next = next->misc.write.next; |
| 1504 | next->misc.write.next = NULL; | 1507 | next->misc.write.next = NULL; |
| 1505 | list_add(&next->writepages_entry, &fi->writepages); | 1508 | list_add(&next->writepages_entry, &fi->writepages); |
| 1506 | list_add_tail(&next->list, &fi->queued_writes); | 1509 | |
| 1507 | fuse_flush_writepages(inode); | 1510 | /* |
| 1511 | * Skip fuse_flush_writepages() to make it easy to crop requests | ||
| 1512 | * based on primary request size. | ||
| 1513 | * | ||
| 1514 | * 1st case (trivial): there are no concurrent activities using | ||
| 1515 | * fuse_set/release_nowrite. Then we're on safe side because | ||
| 1516 | * fuse_flush_writepages() would call fuse_send_writepage() | ||
| 1517 | * anyway. | ||
| 1518 | * | ||
| 1519 | * 2nd case: someone called fuse_set_nowrite and it is waiting | ||
| 1520 | * now for completion of all in-flight requests. This happens | ||
| 1521 | * rarely and no more than once per page, so this should be | ||
| 1522 | * okay. | ||
| 1523 | * | ||
| 1524 | * 3rd case: someone (e.g. fuse_do_setattr()) is in the middle | ||
| 1525 | * of fuse_set_nowrite..fuse_release_nowrite section. The fact | ||
| 1526 | * that fuse_set_nowrite returned implies that all in-flight | ||
| 1527 | * requests were completed along with all of their secondary | ||
| 1528 | * requests. Further primary requests are blocked by negative | ||
| 1529 | * writectr. Hence there cannot be any in-flight requests and | ||
| 1530 | * no invocations of fuse_writepage_end() while we're in | ||
| 1531 | * fuse_set_nowrite..fuse_release_nowrite section. | ||
| 1532 | */ | ||
| 1533 | fuse_send_writepage(fc, next, inarg->offset + inarg->size); | ||
| 1508 | } | 1534 | } |
| 1509 | fi->writectr--; | 1535 | fi->writectr--; |
| 1510 | fuse_writepage_finish(fc, req); | 1536 | fuse_writepage_finish(fc, req); |
