aboutsummaryrefslogtreecommitdiffstats
path: root/fs/nfs/write.c
diff options
context:
space:
mode:
Diffstat (limited to 'fs/nfs/write.c')
-rw-r--r--fs/nfs/write.c386
1 files changed, 247 insertions, 139 deletions
diff --git a/fs/nfs/write.c b/fs/nfs/write.c
index 10d648ea128b..e4cbc11a74ab 100644
--- a/fs/nfs/write.c
+++ b/fs/nfs/write.c
@@ -28,6 +28,7 @@
28#include "iostat.h" 28#include "iostat.h"
29#include "nfs4_fs.h" 29#include "nfs4_fs.h"
30#include "fscache.h" 30#include "fscache.h"
31#include "pnfs.h"
31 32
32#define NFSDBG_FACILITY NFSDBG_PAGECACHE 33#define NFSDBG_FACILITY NFSDBG_PAGECACHE
33 34
@@ -58,6 +59,7 @@ struct nfs_write_data *nfs_commitdata_alloc(void)
58 } 59 }
59 return p; 60 return p;
60} 61}
62EXPORT_SYMBOL_GPL(nfs_commitdata_alloc);
61 63
62void nfs_commit_free(struct nfs_write_data *p) 64void nfs_commit_free(struct nfs_write_data *p)
63{ 65{
@@ -65,6 +67,7 @@ void nfs_commit_free(struct nfs_write_data *p)
65 kfree(p->pagevec); 67 kfree(p->pagevec);
66 mempool_free(p, nfs_commit_mempool); 68 mempool_free(p, nfs_commit_mempool);
67} 69}
70EXPORT_SYMBOL_GPL(nfs_commit_free);
68 71
69struct nfs_write_data *nfs_writedata_alloc(unsigned int pagecount) 72struct nfs_write_data *nfs_writedata_alloc(unsigned int pagecount)
70{ 73{
@@ -96,6 +99,7 @@ void nfs_writedata_free(struct nfs_write_data *p)
96 99
97static void nfs_writedata_release(struct nfs_write_data *wdata) 100static void nfs_writedata_release(struct nfs_write_data *wdata)
98{ 101{
102 put_lseg(wdata->lseg);
99 put_nfs_open_context(wdata->args.context); 103 put_nfs_open_context(wdata->args.context);
100 nfs_writedata_free(wdata); 104 nfs_writedata_free(wdata);
101} 105}
@@ -177,8 +181,8 @@ static int wb_priority(struct writeback_control *wbc)
177 if (wbc->for_reclaim) 181 if (wbc->for_reclaim)
178 return FLUSH_HIGHPRI | FLUSH_STABLE; 182 return FLUSH_HIGHPRI | FLUSH_STABLE;
179 if (wbc->for_kupdate || wbc->for_background) 183 if (wbc->for_kupdate || wbc->for_background)
180 return FLUSH_LOWPRI; 184 return FLUSH_LOWPRI | FLUSH_COND_STABLE;
181 return 0; 185 return FLUSH_COND_STABLE;
182} 186}
183 187
184/* 188/*
@@ -385,11 +389,8 @@ static int nfs_inode_add_request(struct inode *inode, struct nfs_page *req)
385 spin_lock(&inode->i_lock); 389 spin_lock(&inode->i_lock);
386 error = radix_tree_insert(&nfsi->nfs_page_tree, req->wb_index, req); 390 error = radix_tree_insert(&nfsi->nfs_page_tree, req->wb_index, req);
387 BUG_ON(error); 391 BUG_ON(error);
388 if (!nfsi->npages) { 392 if (!nfsi->npages && nfs_have_delegation(inode, FMODE_WRITE))
389 igrab(inode); 393 nfsi->change_attr++;
390 if (nfs_have_delegation(inode, FMODE_WRITE))
391 nfsi->change_attr++;
392 }
393 set_bit(PG_MAPPED, &req->wb_flags); 394 set_bit(PG_MAPPED, &req->wb_flags);
394 SetPagePrivate(req->wb_page); 395 SetPagePrivate(req->wb_page);
395 set_page_private(req->wb_page, (unsigned long)req); 396 set_page_private(req->wb_page, (unsigned long)req);
@@ -419,11 +420,7 @@ static void nfs_inode_remove_request(struct nfs_page *req)
419 clear_bit(PG_MAPPED, &req->wb_flags); 420 clear_bit(PG_MAPPED, &req->wb_flags);
420 radix_tree_delete(&nfsi->nfs_page_tree, req->wb_index); 421 radix_tree_delete(&nfsi->nfs_page_tree, req->wb_index);
421 nfsi->npages--; 422 nfsi->npages--;
422 if (!nfsi->npages) { 423 spin_unlock(&inode->i_lock);
423 spin_unlock(&inode->i_lock);
424 iput(inode);
425 } else
426 spin_unlock(&inode->i_lock);
427 nfs_release_request(req); 424 nfs_release_request(req);
428} 425}
429 426
@@ -439,7 +436,7 @@ nfs_mark_request_dirty(struct nfs_page *req)
439 * Add a request to the inode's commit list. 436 * Add a request to the inode's commit list.
440 */ 437 */
441static void 438static void
442nfs_mark_request_commit(struct nfs_page *req) 439nfs_mark_request_commit(struct nfs_page *req, struct pnfs_layout_segment *lseg)
443{ 440{
444 struct inode *inode = req->wb_context->path.dentry->d_inode; 441 struct inode *inode = req->wb_context->path.dentry->d_inode;
445 struct nfs_inode *nfsi = NFS_I(inode); 442 struct nfs_inode *nfsi = NFS_I(inode);
@@ -451,6 +448,7 @@ nfs_mark_request_commit(struct nfs_page *req)
451 NFS_PAGE_TAG_COMMIT); 448 NFS_PAGE_TAG_COMMIT);
452 nfsi->ncommit++; 449 nfsi->ncommit++;
453 spin_unlock(&inode->i_lock); 450 spin_unlock(&inode->i_lock);
451 pnfs_mark_request_commit(req, lseg);
454 inc_zone_page_state(req->wb_page, NR_UNSTABLE_NFS); 452 inc_zone_page_state(req->wb_page, NR_UNSTABLE_NFS);
455 inc_bdi_stat(req->wb_page->mapping->backing_dev_info, BDI_RECLAIMABLE); 453 inc_bdi_stat(req->wb_page->mapping->backing_dev_info, BDI_RECLAIMABLE);
456 __mark_inode_dirty(inode, I_DIRTY_DATASYNC); 454 __mark_inode_dirty(inode, I_DIRTY_DATASYNC);
@@ -472,14 +470,18 @@ nfs_clear_request_commit(struct nfs_page *req)
472static inline 470static inline
473int nfs_write_need_commit(struct nfs_write_data *data) 471int nfs_write_need_commit(struct nfs_write_data *data)
474{ 472{
475 return data->verf.committed != NFS_FILE_SYNC; 473 if (data->verf.committed == NFS_DATA_SYNC)
474 return data->lseg == NULL;
475 else
476 return data->verf.committed != NFS_FILE_SYNC;
476} 477}
477 478
478static inline 479static inline
479int nfs_reschedule_unstable_write(struct nfs_page *req) 480int nfs_reschedule_unstable_write(struct nfs_page *req,
481 struct nfs_write_data *data)
480{ 482{
481 if (test_and_clear_bit(PG_NEED_COMMIT, &req->wb_flags)) { 483 if (test_and_clear_bit(PG_NEED_COMMIT, &req->wb_flags)) {
482 nfs_mark_request_commit(req); 484 nfs_mark_request_commit(req, data->lseg);
483 return 1; 485 return 1;
484 } 486 }
485 if (test_and_clear_bit(PG_NEED_RESCHED, &req->wb_flags)) { 487 if (test_and_clear_bit(PG_NEED_RESCHED, &req->wb_flags)) {
@@ -490,7 +492,7 @@ int nfs_reschedule_unstable_write(struct nfs_page *req)
490} 492}
491#else 493#else
492static inline void 494static inline void
493nfs_mark_request_commit(struct nfs_page *req) 495nfs_mark_request_commit(struct nfs_page *req, struct pnfs_layout_segment *lseg)
494{ 496{
495} 497}
496 498
@@ -507,7 +509,8 @@ int nfs_write_need_commit(struct nfs_write_data *data)
507} 509}
508 510
509static inline 511static inline
510int nfs_reschedule_unstable_write(struct nfs_page *req) 512int nfs_reschedule_unstable_write(struct nfs_page *req,
513 struct nfs_write_data *data)
511{ 514{
512 return 0; 515 return 0;
513} 516}
@@ -539,11 +542,15 @@ nfs_scan_commit(struct inode *inode, struct list_head *dst, pgoff_t idx_start, u
539 if (!nfs_need_commit(nfsi)) 542 if (!nfs_need_commit(nfsi))
540 return 0; 543 return 0;
541 544
545 spin_lock(&inode->i_lock);
542 ret = nfs_scan_list(nfsi, dst, idx_start, npages, NFS_PAGE_TAG_COMMIT); 546 ret = nfs_scan_list(nfsi, dst, idx_start, npages, NFS_PAGE_TAG_COMMIT);
543 if (ret > 0) 547 if (ret > 0)
544 nfsi->ncommit -= ret; 548 nfsi->ncommit -= ret;
549 spin_unlock(&inode->i_lock);
550
545 if (nfs_need_commit(NFS_I(inode))) 551 if (nfs_need_commit(NFS_I(inode)))
546 __mark_inode_dirty(inode, I_DIRTY_DATASYNC); 552 __mark_inode_dirty(inode, I_DIRTY_DATASYNC);
553
547 return ret; 554 return ret;
548} 555}
549#else 556#else
@@ -610,9 +617,11 @@ static struct nfs_page *nfs_try_to_update_request(struct inode *inode,
610 } 617 }
611 618
612 if (nfs_clear_request_commit(req) && 619 if (nfs_clear_request_commit(req) &&
613 radix_tree_tag_clear(&NFS_I(inode)->nfs_page_tree, 620 radix_tree_tag_clear(&NFS_I(inode)->nfs_page_tree,
614 req->wb_index, NFS_PAGE_TAG_COMMIT) != NULL) 621 req->wb_index, NFS_PAGE_TAG_COMMIT) != NULL) {
615 NFS_I(inode)->ncommit--; 622 NFS_I(inode)->ncommit--;
623 pnfs_clear_request_commit(req);
624 }
616 625
617 /* Okay, the request matches. Update the region */ 626 /* Okay, the request matches. Update the region */
618 if (offset < req->wb_offset) { 627 if (offset < req->wb_offset) {
@@ -760,11 +769,12 @@ int nfs_updatepage(struct file *file, struct page *page,
760 return status; 769 return status;
761} 770}
762 771
763static void nfs_writepage_release(struct nfs_page *req) 772static void nfs_writepage_release(struct nfs_page *req,
773 struct nfs_write_data *data)
764{ 774{
765 struct page *page = req->wb_page; 775 struct page *page = req->wb_page;
766 776
767 if (PageError(req->wb_page) || !nfs_reschedule_unstable_write(req)) 777 if (PageError(req->wb_page) || !nfs_reschedule_unstable_write(req, data))
768 nfs_inode_remove_request(req); 778 nfs_inode_remove_request(req);
769 nfs_clear_page_tag_locked(req); 779 nfs_clear_page_tag_locked(req);
770 nfs_end_page_writeback(page); 780 nfs_end_page_writeback(page);
@@ -781,25 +791,21 @@ static int flush_task_priority(int how)
781 return RPC_PRIORITY_NORMAL; 791 return RPC_PRIORITY_NORMAL;
782} 792}
783 793
784/* 794int nfs_initiate_write(struct nfs_write_data *data,
785 * Set up the argument/result storage required for the RPC call. 795 struct rpc_clnt *clnt,
786 */ 796 const struct rpc_call_ops *call_ops,
787static int nfs_write_rpcsetup(struct nfs_page *req, 797 int how)
788 struct nfs_write_data *data,
789 const struct rpc_call_ops *call_ops,
790 unsigned int count, unsigned int offset,
791 int how)
792{ 798{
793 struct inode *inode = req->wb_context->path.dentry->d_inode; 799 struct inode *inode = data->inode;
794 int priority = flush_task_priority(how); 800 int priority = flush_task_priority(how);
795 struct rpc_task *task; 801 struct rpc_task *task;
796 struct rpc_message msg = { 802 struct rpc_message msg = {
797 .rpc_argp = &data->args, 803 .rpc_argp = &data->args,
798 .rpc_resp = &data->res, 804 .rpc_resp = &data->res,
799 .rpc_cred = req->wb_context->cred, 805 .rpc_cred = data->cred,
800 }; 806 };
801 struct rpc_task_setup task_setup_data = { 807 struct rpc_task_setup task_setup_data = {
802 .rpc_client = NFS_CLIENT(inode), 808 .rpc_client = clnt,
803 .task = &data->task, 809 .task = &data->task,
804 .rpc_message = &msg, 810 .rpc_message = &msg,
805 .callback_ops = call_ops, 811 .callback_ops = call_ops,
@@ -810,12 +816,52 @@ static int nfs_write_rpcsetup(struct nfs_page *req,
810 }; 816 };
811 int ret = 0; 817 int ret = 0;
812 818
819 /* Set up the initial task struct. */
820 NFS_PROTO(inode)->write_setup(data, &msg);
821
822 dprintk("NFS: %5u initiated write call "
823 "(req %s/%lld, %u bytes @ offset %llu)\n",
824 data->task.tk_pid,
825 inode->i_sb->s_id,
826 (long long)NFS_FILEID(inode),
827 data->args.count,
828 (unsigned long long)data->args.offset);
829
830 task = rpc_run_task(&task_setup_data);
831 if (IS_ERR(task)) {
832 ret = PTR_ERR(task);
833 goto out;
834 }
835 if (how & FLUSH_SYNC) {
836 ret = rpc_wait_for_completion_task(task);
837 if (ret == 0)
838 ret = task->tk_status;
839 }
840 rpc_put_task(task);
841out:
842 return ret;
843}
844EXPORT_SYMBOL_GPL(nfs_initiate_write);
845
846/*
847 * Set up the argument/result storage required for the RPC call.
848 */
849static int nfs_write_rpcsetup(struct nfs_page *req,
850 struct nfs_write_data *data,
851 const struct rpc_call_ops *call_ops,
852 unsigned int count, unsigned int offset,
853 struct pnfs_layout_segment *lseg,
854 int how)
855{
856 struct inode *inode = req->wb_context->path.dentry->d_inode;
857
813 /* Set up the RPC argument and reply structs 858 /* Set up the RPC argument and reply structs
814 * NB: take care not to mess about with data->commit et al. */ 859 * NB: take care not to mess about with data->commit et al. */
815 860
816 data->req = req; 861 data->req = req;
817 data->inode = inode = req->wb_context->path.dentry->d_inode; 862 data->inode = inode = req->wb_context->path.dentry->d_inode;
818 data->cred = msg.rpc_cred; 863 data->cred = req->wb_context->cred;
864 data->lseg = get_lseg(lseg);
819 865
820 data->args.fh = NFS_FH(inode); 866 data->args.fh = NFS_FH(inode);
821 data->args.offset = req_offset(req) + offset; 867 data->args.offset = req_offset(req) + offset;
@@ -825,7 +871,7 @@ static int nfs_write_rpcsetup(struct nfs_page *req,
825 data->args.context = get_nfs_open_context(req->wb_context); 871 data->args.context = get_nfs_open_context(req->wb_context);
826 data->args.lock_context = req->wb_lock_context; 872 data->args.lock_context = req->wb_lock_context;
827 data->args.stable = NFS_UNSTABLE; 873 data->args.stable = NFS_UNSTABLE;
828 if (how & FLUSH_STABLE) { 874 if (how & (FLUSH_STABLE | FLUSH_COND_STABLE)) {
829 data->args.stable = NFS_DATA_SYNC; 875 data->args.stable = NFS_DATA_SYNC;
830 if (!nfs_need_commit(NFS_I(inode))) 876 if (!nfs_need_commit(NFS_I(inode)))
831 data->args.stable = NFS_FILE_SYNC; 877 data->args.stable = NFS_FILE_SYNC;
@@ -836,30 +882,11 @@ static int nfs_write_rpcsetup(struct nfs_page *req,
836 data->res.verf = &data->verf; 882 data->res.verf = &data->verf;
837 nfs_fattr_init(&data->fattr); 883 nfs_fattr_init(&data->fattr);
838 884
839 /* Set up the initial task struct. */ 885 if (data->lseg &&
840 NFS_PROTO(inode)->write_setup(data, &msg); 886 (pnfs_try_to_write_data(data, call_ops, how) == PNFS_ATTEMPTED))
841 887 return 0;
842 dprintk("NFS: %5u initiated write call "
843 "(req %s/%lld, %u bytes @ offset %llu)\n",
844 data->task.tk_pid,
845 inode->i_sb->s_id,
846 (long long)NFS_FILEID(inode),
847 count,
848 (unsigned long long)data->args.offset);
849 888
850 task = rpc_run_task(&task_setup_data); 889 return nfs_initiate_write(data, NFS_CLIENT(inode), call_ops, how);
851 if (IS_ERR(task)) {
852 ret = PTR_ERR(task);
853 goto out;
854 }
855 if (how & FLUSH_SYNC) {
856 ret = rpc_wait_for_completion_task(task);
857 if (ret == 0)
858 ret = task->tk_status;
859 }
860 rpc_put_task(task);
861out:
862 return ret;
863} 890}
864 891
865/* If a nfs_flush_* function fails, it should remove reqs from @head and 892/* If a nfs_flush_* function fails, it should remove reqs from @head and
@@ -879,20 +906,27 @@ static void nfs_redirty_request(struct nfs_page *req)
879 * Generate multiple small requests to write out a single 906 * Generate multiple small requests to write out a single
880 * contiguous dirty area on one page. 907 * contiguous dirty area on one page.
881 */ 908 */
882static int nfs_flush_multi(struct inode *inode, struct list_head *head, unsigned int npages, size_t count, int how) 909static int nfs_flush_multi(struct nfs_pageio_descriptor *desc)
883{ 910{
884 struct nfs_page *req = nfs_list_entry(head->next); 911 struct nfs_page *req = nfs_list_entry(desc->pg_list.next);
885 struct page *page = req->wb_page; 912 struct page *page = req->wb_page;
886 struct nfs_write_data *data; 913 struct nfs_write_data *data;
887 size_t wsize = NFS_SERVER(inode)->wsize, nbytes; 914 size_t wsize = NFS_SERVER(desc->pg_inode)->wsize, nbytes;
888 unsigned int offset; 915 unsigned int offset;
889 int requests = 0; 916 int requests = 0;
890 int ret = 0; 917 int ret = 0;
918 struct pnfs_layout_segment *lseg;
891 LIST_HEAD(list); 919 LIST_HEAD(list);
892 920
893 nfs_list_remove_request(req); 921 nfs_list_remove_request(req);
894 922
895 nbytes = count; 923 if ((desc->pg_ioflags & FLUSH_COND_STABLE) &&
924 (desc->pg_moreio || NFS_I(desc->pg_inode)->ncommit ||
925 desc->pg_count > wsize))
926 desc->pg_ioflags &= ~FLUSH_COND_STABLE;
927
928
929 nbytes = desc->pg_count;
896 do { 930 do {
897 size_t len = min(nbytes, wsize); 931 size_t len = min(nbytes, wsize);
898 932
@@ -905,9 +939,11 @@ static int nfs_flush_multi(struct inode *inode, struct list_head *head, unsigned
905 } while (nbytes != 0); 939 } while (nbytes != 0);
906 atomic_set(&req->wb_complete, requests); 940 atomic_set(&req->wb_complete, requests);
907 941
942 BUG_ON(desc->pg_lseg);
943 lseg = pnfs_update_layout(desc->pg_inode, req->wb_context, IOMODE_RW);
908 ClearPageError(page); 944 ClearPageError(page);
909 offset = 0; 945 offset = 0;
910 nbytes = count; 946 nbytes = desc->pg_count;
911 do { 947 do {
912 int ret2; 948 int ret2;
913 949
@@ -919,20 +955,22 @@ static int nfs_flush_multi(struct inode *inode, struct list_head *head, unsigned
919 if (nbytes < wsize) 955 if (nbytes < wsize)
920 wsize = nbytes; 956 wsize = nbytes;
921 ret2 = nfs_write_rpcsetup(req, data, &nfs_write_partial_ops, 957 ret2 = nfs_write_rpcsetup(req, data, &nfs_write_partial_ops,
922 wsize, offset, how); 958 wsize, offset, lseg, desc->pg_ioflags);
923 if (ret == 0) 959 if (ret == 0)
924 ret = ret2; 960 ret = ret2;
925 offset += wsize; 961 offset += wsize;
926 nbytes -= wsize; 962 nbytes -= wsize;
927 } while (nbytes != 0); 963 } while (nbytes != 0);
928 964
965 put_lseg(lseg);
966 desc->pg_lseg = NULL;
929 return ret; 967 return ret;
930 968
931out_bad: 969out_bad:
932 while (!list_empty(&list)) { 970 while (!list_empty(&list)) {
933 data = list_entry(list.next, struct nfs_write_data, pages); 971 data = list_entry(list.next, struct nfs_write_data, pages);
934 list_del(&data->pages); 972 list_del(&data->pages);
935 nfs_writedata_release(data); 973 nfs_writedata_free(data);
936 } 974 }
937 nfs_redirty_request(req); 975 nfs_redirty_request(req);
938 return -ENOMEM; 976 return -ENOMEM;
@@ -946,16 +984,26 @@ out_bad:
946 * This is the case if nfs_updatepage detects a conflicting request 984 * This is the case if nfs_updatepage detects a conflicting request
947 * that has been written but not committed. 985 * that has been written but not committed.
948 */ 986 */
949static int nfs_flush_one(struct inode *inode, struct list_head *head, unsigned int npages, size_t count, int how) 987static int nfs_flush_one(struct nfs_pageio_descriptor *desc)
950{ 988{
951 struct nfs_page *req; 989 struct nfs_page *req;
952 struct page **pages; 990 struct page **pages;
953 struct nfs_write_data *data; 991 struct nfs_write_data *data;
992 struct list_head *head = &desc->pg_list;
993 struct pnfs_layout_segment *lseg = desc->pg_lseg;
994 int ret;
954 995
955 data = nfs_writedata_alloc(npages); 996 data = nfs_writedata_alloc(nfs_page_array_len(desc->pg_base,
956 if (!data) 997 desc->pg_count));
957 goto out_bad; 998 if (!data) {
958 999 while (!list_empty(head)) {
1000 req = nfs_list_entry(head->next);
1001 nfs_list_remove_request(req);
1002 nfs_redirty_request(req);
1003 }
1004 ret = -ENOMEM;
1005 goto out;
1006 }
959 pages = data->pagevec; 1007 pages = data->pagevec;
960 while (!list_empty(head)) { 1008 while (!list_empty(head)) {
961 req = nfs_list_entry(head->next); 1009 req = nfs_list_entry(head->next);
@@ -965,16 +1013,19 @@ static int nfs_flush_one(struct inode *inode, struct list_head *head, unsigned i
965 *pages++ = req->wb_page; 1013 *pages++ = req->wb_page;
966 } 1014 }
967 req = nfs_list_entry(data->pages.next); 1015 req = nfs_list_entry(data->pages.next);
1016 if ((!lseg) && list_is_singular(&data->pages))
1017 lseg = pnfs_update_layout(desc->pg_inode, req->wb_context, IOMODE_RW);
1018
1019 if ((desc->pg_ioflags & FLUSH_COND_STABLE) &&
1020 (desc->pg_moreio || NFS_I(desc->pg_inode)->ncommit))
1021 desc->pg_ioflags &= ~FLUSH_COND_STABLE;
968 1022
969 /* Set up the argument struct */ 1023 /* Set up the argument struct */
970 return nfs_write_rpcsetup(req, data, &nfs_write_full_ops, count, 0, how); 1024 ret = nfs_write_rpcsetup(req, data, &nfs_write_full_ops, desc->pg_count, 0, lseg, desc->pg_ioflags);
971 out_bad: 1025out:
972 while (!list_empty(head)) { 1026 put_lseg(lseg); /* Cleans any gotten in ->pg_test */
973 req = nfs_list_entry(head->next); 1027 desc->pg_lseg = NULL;
974 nfs_list_remove_request(req); 1028 return ret;
975 nfs_redirty_request(req);
976 }
977 return -ENOMEM;
978} 1029}
979 1030
980static void nfs_pageio_init_write(struct nfs_pageio_descriptor *pgio, 1031static void nfs_pageio_init_write(struct nfs_pageio_descriptor *pgio,
@@ -982,6 +1033,8 @@ static void nfs_pageio_init_write(struct nfs_pageio_descriptor *pgio,
982{ 1033{
983 size_t wsize = NFS_SERVER(inode)->wsize; 1034 size_t wsize = NFS_SERVER(inode)->wsize;
984 1035
1036 pnfs_pageio_init_write(pgio, inode);
1037
985 if (wsize < PAGE_CACHE_SIZE) 1038 if (wsize < PAGE_CACHE_SIZE)
986 nfs_pageio_init(pgio, inode, nfs_flush_multi, wsize, ioflags); 1039 nfs_pageio_init(pgio, inode, nfs_flush_multi, wsize, ioflags);
987 else 1040 else
@@ -1039,7 +1092,7 @@ static void nfs_writeback_release_partial(void *calldata)
1039 1092
1040out: 1093out:
1041 if (atomic_dec_and_test(&req->wb_complete)) 1094 if (atomic_dec_and_test(&req->wb_complete))
1042 nfs_writepage_release(req); 1095 nfs_writepage_release(req, data);
1043 nfs_writedata_release(calldata); 1096 nfs_writedata_release(calldata);
1044} 1097}
1045 1098
@@ -1106,7 +1159,7 @@ static void nfs_writeback_release_full(void *calldata)
1106 1159
1107 if (nfs_write_need_commit(data)) { 1160 if (nfs_write_need_commit(data)) {
1108 memcpy(&req->wb_verf, &data->verf, sizeof(req->wb_verf)); 1161 memcpy(&req->wb_verf, &data->verf, sizeof(req->wb_verf));
1109 nfs_mark_request_commit(req); 1162 nfs_mark_request_commit(req, data->lseg);
1110 dprintk(" marked for commit\n"); 1163 dprintk(" marked for commit\n");
1111 goto next; 1164 goto next;
1112 } 1165 }
@@ -1132,7 +1185,7 @@ static const struct rpc_call_ops nfs_write_full_ops = {
1132/* 1185/*
1133 * This function is called when the WRITE call is complete. 1186 * This function is called when the WRITE call is complete.
1134 */ 1187 */
1135int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data) 1188void nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1136{ 1189{
1137 struct nfs_writeargs *argp = &data->args; 1190 struct nfs_writeargs *argp = &data->args;
1138 struct nfs_writeres *resp = &data->res; 1191 struct nfs_writeres *resp = &data->res;
@@ -1151,7 +1204,7 @@ int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1151 */ 1204 */
1152 status = NFS_PROTO(data->inode)->write_done(task, data); 1205 status = NFS_PROTO(data->inode)->write_done(task, data);
1153 if (status != 0) 1206 if (status != 0)
1154 return status; 1207 return;
1155 nfs_add_stats(data->inode, NFSIOS_SERVERWRITTENBYTES, resp->count); 1208 nfs_add_stats(data->inode, NFSIOS_SERVERWRITTENBYTES, resp->count);
1156 1209
1157#if defined(CONFIG_NFS_V3) || defined(CONFIG_NFS_V4) 1210#if defined(CONFIG_NFS_V3) || defined(CONFIG_NFS_V4)
@@ -1166,6 +1219,7 @@ int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1166 */ 1219 */
1167 static unsigned long complain; 1220 static unsigned long complain;
1168 1221
1222 /* Note this will print the MDS for a DS write */
1169 if (time_before(complain, jiffies)) { 1223 if (time_before(complain, jiffies)) {
1170 dprintk("NFS: faulty NFS server %s:" 1224 dprintk("NFS: faulty NFS server %s:"
1171 " (committed = %d) != (stable = %d)\n", 1225 " (committed = %d) != (stable = %d)\n",
@@ -1186,6 +1240,7 @@ int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1186 /* Was this an NFSv2 write or an NFSv3 stable write? */ 1240 /* Was this an NFSv2 write or an NFSv3 stable write? */
1187 if (resp->verf->committed != NFS_UNSTABLE) { 1241 if (resp->verf->committed != NFS_UNSTABLE) {
1188 /* Resend from where the server left off */ 1242 /* Resend from where the server left off */
1243 data->mds_offset += resp->count;
1189 argp->offset += resp->count; 1244 argp->offset += resp->count;
1190 argp->pgbase += resp->count; 1245 argp->pgbase += resp->count;
1191 argp->count -= resp->count; 1246 argp->count -= resp->count;
@@ -1196,7 +1251,7 @@ int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1196 argp->stable = NFS_FILE_SYNC; 1251 argp->stable = NFS_FILE_SYNC;
1197 } 1252 }
1198 nfs_restart_rpc(task, server->nfs_client); 1253 nfs_restart_rpc(task, server->nfs_client);
1199 return -EAGAIN; 1254 return;
1200 } 1255 }
1201 if (time_before(complain, jiffies)) { 1256 if (time_before(complain, jiffies)) {
1202 printk(KERN_WARNING 1257 printk(KERN_WARNING
@@ -1207,64 +1262,89 @@ int nfs_writeback_done(struct rpc_task *task, struct nfs_write_data *data)
1207 /* Can't do anything about it except throw an error. */ 1262 /* Can't do anything about it except throw an error. */
1208 task->tk_status = -EIO; 1263 task->tk_status = -EIO;
1209 } 1264 }
1210 return 0; 1265 return;
1211} 1266}
1212 1267
1213 1268
1214#if defined(CONFIG_NFS_V3) || defined(CONFIG_NFS_V4) 1269#if defined(CONFIG_NFS_V3) || defined(CONFIG_NFS_V4)
1215static int nfs_commit_set_lock(struct nfs_inode *nfsi, int may_wait) 1270static int nfs_commit_set_lock(struct nfs_inode *nfsi, int may_wait)
1216{ 1271{
1272 int ret;
1273
1217 if (!test_and_set_bit(NFS_INO_COMMIT, &nfsi->flags)) 1274 if (!test_and_set_bit(NFS_INO_COMMIT, &nfsi->flags))
1218 return 1; 1275 return 1;
1219 if (may_wait && !out_of_line_wait_on_bit_lock(&nfsi->flags, 1276 if (!may_wait)
1220 NFS_INO_COMMIT, nfs_wait_bit_killable, 1277 return 0;
1221 TASK_KILLABLE)) 1278 ret = out_of_line_wait_on_bit_lock(&nfsi->flags,
1222 return 1; 1279 NFS_INO_COMMIT,
1223 return 0; 1280 nfs_wait_bit_killable,
1281 TASK_KILLABLE);
1282 return (ret < 0) ? ret : 1;
1224} 1283}
1225 1284
1226static void nfs_commit_clear_lock(struct nfs_inode *nfsi) 1285void nfs_commit_clear_lock(struct nfs_inode *nfsi)
1227{ 1286{
1228 clear_bit(NFS_INO_COMMIT, &nfsi->flags); 1287 clear_bit(NFS_INO_COMMIT, &nfsi->flags);
1229 smp_mb__after_clear_bit(); 1288 smp_mb__after_clear_bit();
1230 wake_up_bit(&nfsi->flags, NFS_INO_COMMIT); 1289 wake_up_bit(&nfsi->flags, NFS_INO_COMMIT);
1231} 1290}
1291EXPORT_SYMBOL_GPL(nfs_commit_clear_lock);
1232 1292
1233 1293void nfs_commitdata_release(void *data)
1234static void nfs_commitdata_release(void *data)
1235{ 1294{
1236 struct nfs_write_data *wdata = data; 1295 struct nfs_write_data *wdata = data;
1237 1296
1297 put_lseg(wdata->lseg);
1238 put_nfs_open_context(wdata->args.context); 1298 put_nfs_open_context(wdata->args.context);
1239 nfs_commit_free(wdata); 1299 nfs_commit_free(wdata);
1240} 1300}
1301EXPORT_SYMBOL_GPL(nfs_commitdata_release);
1241 1302
1242/* 1303int nfs_initiate_commit(struct nfs_write_data *data, struct rpc_clnt *clnt,
1243 * Set up the argument/result storage required for the RPC call. 1304 const struct rpc_call_ops *call_ops,
1244 */ 1305 int how)
1245static int nfs_commit_rpcsetup(struct list_head *head,
1246 struct nfs_write_data *data,
1247 int how)
1248{ 1306{
1249 struct nfs_page *first = nfs_list_entry(head->next);
1250 struct inode *inode = first->wb_context->path.dentry->d_inode;
1251 int priority = flush_task_priority(how);
1252 struct rpc_task *task; 1307 struct rpc_task *task;
1308 int priority = flush_task_priority(how);
1253 struct rpc_message msg = { 1309 struct rpc_message msg = {
1254 .rpc_argp = &data->args, 1310 .rpc_argp = &data->args,
1255 .rpc_resp = &data->res, 1311 .rpc_resp = &data->res,
1256 .rpc_cred = first->wb_context->cred, 1312 .rpc_cred = data->cred,
1257 }; 1313 };
1258 struct rpc_task_setup task_setup_data = { 1314 struct rpc_task_setup task_setup_data = {
1259 .task = &data->task, 1315 .task = &data->task,
1260 .rpc_client = NFS_CLIENT(inode), 1316 .rpc_client = clnt,
1261 .rpc_message = &msg, 1317 .rpc_message = &msg,
1262 .callback_ops = &nfs_commit_ops, 1318 .callback_ops = call_ops,
1263 .callback_data = data, 1319 .callback_data = data,
1264 .workqueue = nfsiod_workqueue, 1320 .workqueue = nfsiod_workqueue,
1265 .flags = RPC_TASK_ASYNC, 1321 .flags = RPC_TASK_ASYNC,
1266 .priority = priority, 1322 .priority = priority,
1267 }; 1323 };
1324 /* Set up the initial task struct. */
1325 NFS_PROTO(data->inode)->commit_setup(data, &msg);
1326
1327 dprintk("NFS: %5u initiated commit call\n", data->task.tk_pid);
1328
1329 task = rpc_run_task(&task_setup_data);
1330 if (IS_ERR(task))
1331 return PTR_ERR(task);
1332 if (how & FLUSH_SYNC)
1333 rpc_wait_for_completion_task(task);
1334 rpc_put_task(task);
1335 return 0;
1336}
1337EXPORT_SYMBOL_GPL(nfs_initiate_commit);
1338
1339/*
1340 * Set up the argument/result storage required for the RPC call.
1341 */
1342void nfs_init_commit(struct nfs_write_data *data,
1343 struct list_head *head,
1344 struct pnfs_layout_segment *lseg)
1345{
1346 struct nfs_page *first = nfs_list_entry(head->next);
1347 struct inode *inode = first->wb_context->path.dentry->d_inode;
1268 1348
1269 /* Set up the RPC argument and reply structs 1349 /* Set up the RPC argument and reply structs
1270 * NB: take care not to mess about with data->commit et al. */ 1350 * NB: take care not to mess about with data->commit et al. */
@@ -1272,7 +1352,9 @@ static int nfs_commit_rpcsetup(struct list_head *head,
1272 list_splice_init(head, &data->pages); 1352 list_splice_init(head, &data->pages);
1273 1353
1274 data->inode = inode; 1354 data->inode = inode;
1275 data->cred = msg.rpc_cred; 1355 data->cred = first->wb_context->cred;
1356 data->lseg = lseg; /* reference transferred */
1357 data->mds_ops = &nfs_commit_ops;
1276 1358
1277 data->args.fh = NFS_FH(data->inode); 1359 data->args.fh = NFS_FH(data->inode);
1278 /* Note: we always request a commit of the entire inode */ 1360 /* Note: we always request a commit of the entire inode */
@@ -1283,18 +1365,25 @@ static int nfs_commit_rpcsetup(struct list_head *head,
1283 data->res.fattr = &data->fattr; 1365 data->res.fattr = &data->fattr;
1284 data->res.verf = &data->verf; 1366 data->res.verf = &data->verf;
1285 nfs_fattr_init(&data->fattr); 1367 nfs_fattr_init(&data->fattr);
1368}
1369EXPORT_SYMBOL_GPL(nfs_init_commit);
1286 1370
1287 /* Set up the initial task struct. */ 1371void nfs_retry_commit(struct list_head *page_list,
1288 NFS_PROTO(inode)->commit_setup(data, &msg); 1372 struct pnfs_layout_segment *lseg)
1289 1373{
1290 dprintk("NFS: %5u initiated commit call\n", data->task.tk_pid); 1374 struct nfs_page *req;
1291 1375
1292 task = rpc_run_task(&task_setup_data); 1376 while (!list_empty(page_list)) {
1293 if (IS_ERR(task)) 1377 req = nfs_list_entry(page_list->next);
1294 return PTR_ERR(task); 1378 nfs_list_remove_request(req);
1295 rpc_put_task(task); 1379 nfs_mark_request_commit(req, lseg);
1296 return 0; 1380 dec_zone_page_state(req->wb_page, NR_UNSTABLE_NFS);
1381 dec_bdi_stat(req->wb_page->mapping->backing_dev_info,
1382 BDI_RECLAIMABLE);
1383 nfs_clear_page_tag_locked(req);
1384 }
1297} 1385}
1386EXPORT_SYMBOL_GPL(nfs_retry_commit);
1298 1387
1299/* 1388/*
1300 * Commit dirty pages 1389 * Commit dirty pages
@@ -1303,7 +1392,6 @@ static int
1303nfs_commit_list(struct inode *inode, struct list_head *head, int how) 1392nfs_commit_list(struct inode *inode, struct list_head *head, int how)
1304{ 1393{
1305 struct nfs_write_data *data; 1394 struct nfs_write_data *data;
1306 struct nfs_page *req;
1307 1395
1308 data = nfs_commitdata_alloc(); 1396 data = nfs_commitdata_alloc();
1309 1397
@@ -1311,17 +1399,10 @@ nfs_commit_list(struct inode *inode, struct list_head *head, int how)
1311 goto out_bad; 1399 goto out_bad;
1312 1400
1313 /* Set up the argument struct */ 1401 /* Set up the argument struct */
1314 return nfs_commit_rpcsetup(head, data, how); 1402 nfs_init_commit(data, head, NULL);
1403 return nfs_initiate_commit(data, NFS_CLIENT(inode), data->mds_ops, how);
1315 out_bad: 1404 out_bad:
1316 while (!list_empty(head)) { 1405 nfs_retry_commit(head, NULL);
1317 req = nfs_list_entry(head->next);
1318 nfs_list_remove_request(req);
1319 nfs_mark_request_commit(req);
1320 dec_zone_page_state(req->wb_page, NR_UNSTABLE_NFS);
1321 dec_bdi_stat(req->wb_page->mapping->backing_dev_info,
1322 BDI_RECLAIMABLE);
1323 nfs_clear_page_tag_locked(req);
1324 }
1325 nfs_commit_clear_lock(NFS_I(inode)); 1406 nfs_commit_clear_lock(NFS_I(inode));
1326 return -ENOMEM; 1407 return -ENOMEM;
1327} 1408}
@@ -1341,10 +1422,9 @@ static void nfs_commit_done(struct rpc_task *task, void *calldata)
1341 return; 1422 return;
1342} 1423}
1343 1424
1344static void nfs_commit_release(void *calldata) 1425void nfs_commit_release_pages(struct nfs_write_data *data)
1345{ 1426{
1346 struct nfs_write_data *data = calldata; 1427 struct nfs_page *req;
1347 struct nfs_page *req;
1348 int status = data->task.tk_status; 1428 int status = data->task.tk_status;
1349 1429
1350 while (!list_empty(&data->pages)) { 1430 while (!list_empty(&data->pages)) {
@@ -1378,6 +1458,14 @@ static void nfs_commit_release(void *calldata)
1378 next: 1458 next:
1379 nfs_clear_page_tag_locked(req); 1459 nfs_clear_page_tag_locked(req);
1380 } 1460 }
1461}
1462EXPORT_SYMBOL_GPL(nfs_commit_release_pages);
1463
1464static void nfs_commit_release(void *calldata)
1465{
1466 struct nfs_write_data *data = calldata;
1467
1468 nfs_commit_release_pages(data);
1381 nfs_commit_clear_lock(NFS_I(data->inode)); 1469 nfs_commit_clear_lock(NFS_I(data->inode));
1382 nfs_commitdata_release(calldata); 1470 nfs_commitdata_release(calldata);
1383} 1471}
@@ -1394,23 +1482,28 @@ int nfs_commit_inode(struct inode *inode, int how)
1394{ 1482{
1395 LIST_HEAD(head); 1483 LIST_HEAD(head);
1396 int may_wait = how & FLUSH_SYNC; 1484 int may_wait = how & FLUSH_SYNC;
1397 int res = 0; 1485 int res;
1398 1486
1399 if (!nfs_commit_set_lock(NFS_I(inode), may_wait)) 1487 res = nfs_commit_set_lock(NFS_I(inode), may_wait);
1488 if (res <= 0)
1400 goto out_mark_dirty; 1489 goto out_mark_dirty;
1401 spin_lock(&inode->i_lock);
1402 res = nfs_scan_commit(inode, &head, 0, 0); 1490 res = nfs_scan_commit(inode, &head, 0, 0);
1403 spin_unlock(&inode->i_lock);
1404 if (res) { 1491 if (res) {
1405 int error = nfs_commit_list(inode, &head, how); 1492 int error;
1493
1494 error = pnfs_commit_list(inode, &head, how);
1495 if (error == PNFS_NOT_ATTEMPTED)
1496 error = nfs_commit_list(inode, &head, how);
1406 if (error < 0) 1497 if (error < 0)
1407 return error; 1498 return error;
1408 if (may_wait) 1499 if (!may_wait)
1409 wait_on_bit(&NFS_I(inode)->flags, NFS_INO_COMMIT,
1410 nfs_wait_bit_killable,
1411 TASK_KILLABLE);
1412 else
1413 goto out_mark_dirty; 1500 goto out_mark_dirty;
1501 error = wait_on_bit(&NFS_I(inode)->flags,
1502 NFS_INO_COMMIT,
1503 nfs_wait_bit_killable,
1504 TASK_KILLABLE);
1505 if (error < 0)
1506 return error;
1414 } else 1507 } else
1415 nfs_commit_clear_lock(NFS_I(inode)); 1508 nfs_commit_clear_lock(NFS_I(inode));
1416 return res; 1509 return res;
@@ -1464,7 +1557,22 @@ static int nfs_commit_unstable_pages(struct inode *inode, struct writeback_contr
1464 1557
1465int nfs_write_inode(struct inode *inode, struct writeback_control *wbc) 1558int nfs_write_inode(struct inode *inode, struct writeback_control *wbc)
1466{ 1559{
1467 return nfs_commit_unstable_pages(inode, wbc); 1560 int ret;
1561
1562 ret = nfs_commit_unstable_pages(inode, wbc);
1563 if (ret >= 0 && test_bit(NFS_INO_LAYOUTCOMMIT, &NFS_I(inode)->flags)) {
1564 int status;
1565 bool sync = true;
1566
1567 if (wbc->sync_mode == WB_SYNC_NONE || wbc->nonblocking ||
1568 wbc->for_background)
1569 sync = false;
1570
1571 status = pnfs_layoutcommit_inode(inode, sync);
1572 if (status < 0)
1573 return status;
1574 }
1575 return ret;
1468} 1576}
1469 1577
1470/* 1578/*