aboutsummaryrefslogtreecommitdiffstats
path: root/fs/nfs/nfs4filelayout.c
diff options
context:
space:
mode:
authorFred Isaman <iisaman@netapp.com>2011-03-23 09:27:53 -0400
committerTrond Myklebust <Trond.Myklebust@netapp.com>2011-03-23 15:29:04 -0400
commite0c2b3801828aadb65dec9f67f7c6b7a675ad007 (patch)
tree547d70967ad8f41a18f2d3112dbd12e64f972af2 /fs/nfs/nfs4filelayout.c
parent988b6dceb0ae6d642587c8594529b94f6be0c5ea (diff)
NFSv4.1: filelayout driver specific code for COMMIT
Implement all the hooks created in the previous patches. This requires exporting quite a few functions and adding a few structure fields. Signed-off-by: Fred Isaman <iisaman@netapp.com> Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
Diffstat (limited to 'fs/nfs/nfs4filelayout.c')
-rw-r--r--fs/nfs/nfs4filelayout.c235
1 files changed, 235 insertions, 0 deletions
diff --git a/fs/nfs/nfs4filelayout.c b/fs/nfs/nfs4filelayout.c
index 03ff80c67c6e..97e75a22af72 100644
--- a/fs/nfs/nfs4filelayout.c
+++ b/fs/nfs/nfs4filelayout.c
@@ -213,6 +213,37 @@ static int filelayout_write_done_cb(struct rpc_task *task,
213 return 0; 213 return 0;
214} 214}
215 215
216/* Fake up some data that will cause nfs_commit_release to retry the writes. */
217static void prepare_to_resend_writes(struct nfs_write_data *data)
218{
219 struct nfs_page *first = nfs_list_entry(data->pages.next);
220
221 data->task.tk_status = 0;
222 memcpy(data->verf.verifier, first->wb_verf.verifier,
223 sizeof(first->wb_verf.verifier));
224 data->verf.verifier[0]++; /* ensure verifier mismatch */
225}
226
227static int filelayout_commit_done_cb(struct rpc_task *task,
228 struct nfs_write_data *data)
229{
230 int reset = 0;
231
232 if (filelayout_async_handle_error(task, data->args.context->state,
233 data->ds_clp, &reset) == -EAGAIN) {
234 dprintk("%s calling restart ds_clp %p ds_clp->cl_session %p\n",
235 __func__, data->ds_clp, data->ds_clp->cl_session);
236 if (reset) {
237 prepare_to_resend_writes(data);
238 filelayout_set_lo_fail(data->lseg);
239 } else
240 nfs_restart_rpc(task, data->ds_clp);
241 return -EAGAIN;
242 }
243
244 return 0;
245}
246
216static void filelayout_write_prepare(struct rpc_task *task, void *data) 247static void filelayout_write_prepare(struct rpc_task *task, void *data)
217{ 248{
218 struct nfs_write_data *wdata = (struct nfs_write_data *)data; 249 struct nfs_write_data *wdata = (struct nfs_write_data *)data;
@@ -240,6 +271,16 @@ static void filelayout_write_release(void *data)
240 wdata->mds_ops->rpc_release(data); 271 wdata->mds_ops->rpc_release(data);
241} 272}
242 273
274static void filelayout_commit_release(void *data)
275{
276 struct nfs_write_data *wdata = (struct nfs_write_data *)data;
277
278 nfs_commit_release_pages(wdata);
279 if (atomic_dec_and_test(&NFS_I(wdata->inode)->commits_outstanding))
280 nfs_commit_clear_lock(NFS_I(wdata->inode));
281 nfs_commitdata_release(wdata);
282}
283
243struct rpc_call_ops filelayout_read_call_ops = { 284struct rpc_call_ops filelayout_read_call_ops = {
244 .rpc_call_prepare = filelayout_read_prepare, 285 .rpc_call_prepare = filelayout_read_prepare,
245 .rpc_call_done = filelayout_read_call_done, 286 .rpc_call_done = filelayout_read_call_done,
@@ -252,6 +293,12 @@ struct rpc_call_ops filelayout_write_call_ops = {
252 .rpc_release = filelayout_write_release, 293 .rpc_release = filelayout_write_release,
253}; 294};
254 295
296struct rpc_call_ops filelayout_commit_call_ops = {
297 .rpc_call_prepare = filelayout_write_prepare,
298 .rpc_call_done = filelayout_write_call_done,
299 .rpc_release = filelayout_commit_release,
300};
301
255static enum pnfs_try_status 302static enum pnfs_try_status
256filelayout_read_pagelist(struct nfs_read_data *data) 303filelayout_read_pagelist(struct nfs_read_data *data)
257{ 304{
@@ -574,6 +621,191 @@ filelayout_pg_test(struct nfs_pageio_descriptor *pgio, struct nfs_page *prev,
574 return (p_stripe == r_stripe); 621 return (p_stripe == r_stripe);
575} 622}
576 623
624static bool filelayout_mark_pnfs_commit(struct pnfs_layout_segment *lseg)
625{
626 return !FILELAYOUT_LSEG(lseg)->commit_through_mds;
627}
628
629static u32 select_bucket_index(struct nfs4_filelayout_segment *fl, u32 j)
630{
631 if (fl->stripe_type == STRIPE_SPARSE)
632 return nfs4_fl_calc_ds_index(&fl->generic_hdr, j);
633 else
634 return j;
635}
636
637struct list_head *filelayout_choose_commit_list(struct nfs_page *req)
638{
639 struct pnfs_layout_segment *lseg = req->wb_commit_lseg;
640 struct nfs4_filelayout_segment *fl = FILELAYOUT_LSEG(lseg);
641 u32 i, j;
642 struct list_head *list;
643
644 /* Note that we are calling nfs4_fl_calc_j_index on each page
645 * that ends up being committed to a data server. An attractive
646 * alternative is to add a field to nfs_write_data and nfs_page
647 * to store the value calculated in filelayout_write_pagelist
648 * and just use that here.
649 */
650 j = nfs4_fl_calc_j_index(lseg,
651 (loff_t)req->wb_index << PAGE_CACHE_SHIFT);
652 i = select_bucket_index(fl, j);
653 list = &fl->commit_buckets[i];
654 if (list_empty(list)) {
655 /* Non-empty buckets hold a reference on the lseg */
656 get_lseg(lseg);
657 }
658 return list;
659}
660
661static u32 calc_ds_index_from_commit(struct pnfs_layout_segment *lseg, u32 i)
662{
663 struct nfs4_filelayout_segment *flseg = FILELAYOUT_LSEG(lseg);
664
665 if (flseg->stripe_type == STRIPE_SPARSE)
666 return i;
667 else
668 return nfs4_fl_calc_ds_index(lseg, i);
669}
670
671static struct nfs_fh *
672select_ds_fh_from_commit(struct pnfs_layout_segment *lseg, u32 i)
673{
674 struct nfs4_filelayout_segment *flseg = FILELAYOUT_LSEG(lseg);
675
676 if (flseg->stripe_type == STRIPE_SPARSE) {
677 if (flseg->num_fh == 1)
678 i = 0;
679 else if (flseg->num_fh == 0)
680 /* Use the MDS OPEN fh set in nfs_read_rpcsetup */
681 return NULL;
682 }
683 return flseg->fh_array[i];
684}
685
686static int filelayout_initiate_commit(struct nfs_write_data *data, int how)
687{
688 struct pnfs_layout_segment *lseg = data->lseg;
689 struct nfs4_pnfs_ds *ds;
690 u32 idx;
691 struct nfs_fh *fh;
692
693 idx = calc_ds_index_from_commit(lseg, data->ds_commit_index);
694 ds = nfs4_fl_prepare_ds(lseg, idx);
695 if (!ds) {
696 printk(KERN_ERR "%s: prepare_ds failed, use MDS\n", __func__);
697 set_bit(lo_fail_bit(IOMODE_RW), &lseg->pls_layout->plh_flags);
698 set_bit(lo_fail_bit(IOMODE_READ), &lseg->pls_layout->plh_flags);
699 prepare_to_resend_writes(data);
700 data->mds_ops->rpc_release(data);
701 return -EAGAIN;
702 }
703 dprintk("%s ino %lu, how %d\n", __func__, data->inode->i_ino, how);
704 data->write_done_cb = filelayout_commit_done_cb;
705 data->ds_clp = ds->ds_clp;
706 fh = select_ds_fh_from_commit(lseg, data->ds_commit_index);
707 if (fh)
708 data->args.fh = fh;
709 return nfs_initiate_commit(data, ds->ds_clp->cl_rpcclient,
710 &filelayout_commit_call_ops, how);
711}
712
713/*
714 * This is only useful while we are using whole file layouts.
715 */
716static struct pnfs_layout_segment *find_only_write_lseg(struct inode *inode)
717{
718 struct pnfs_layout_segment *lseg, *rv = NULL;
719
720 spin_lock(&inode->i_lock);
721 list_for_each_entry(lseg, &NFS_I(inode)->layout->plh_segs, pls_list)
722 if (lseg->pls_range.iomode == IOMODE_RW)
723 rv = get_lseg(lseg);
724 spin_unlock(&inode->i_lock);
725 return rv;
726}
727
728static int alloc_ds_commits(struct inode *inode, struct list_head *list)
729{
730 struct pnfs_layout_segment *lseg;
731 struct nfs4_filelayout_segment *fl;
732 struct nfs_write_data *data;
733 int i, j;
734
735 /* Won't need this when non-whole file layout segments are supported
736 * instead we will use a pnfs_layout_hdr structure */
737 lseg = find_only_write_lseg(inode);
738 if (!lseg)
739 return 0;
740 fl = FILELAYOUT_LSEG(lseg);
741 for (i = 0; i < fl->number_of_buckets; i++) {
742 if (list_empty(&fl->commit_buckets[i]))
743 continue;
744 data = nfs_commitdata_alloc();
745 if (!data)
746 goto out_bad;
747 data->ds_commit_index = i;
748 data->lseg = lseg;
749 list_add(&data->pages, list);
750 }
751 put_lseg(lseg);
752 return 0;
753
754out_bad:
755 for (j = i; j < fl->number_of_buckets; j++) {
756 if (list_empty(&fl->commit_buckets[i]))
757 continue;
758 nfs_retry_commit(&fl->commit_buckets[i], lseg);
759 put_lseg(lseg); /* associated with emptying bucket */
760 }
761 put_lseg(lseg);
762 /* Caller will clean up entries put on list */
763 return -ENOMEM;
764}
765
766/* This follows nfs_commit_list pretty closely */
767static int
768filelayout_commit_pagelist(struct inode *inode, struct list_head *mds_pages,
769 int how)
770{
771 struct nfs_write_data *data, *tmp;
772 LIST_HEAD(list);
773
774 if (!list_empty(mds_pages)) {
775 data = nfs_commitdata_alloc();
776 if (!data)
777 goto out_bad;
778 data->lseg = NULL;
779 list_add(&data->pages, &list);
780 }
781
782 if (alloc_ds_commits(inode, &list))
783 goto out_bad;
784
785 list_for_each_entry_safe(data, tmp, &list, pages) {
786 list_del_init(&data->pages);
787 atomic_inc(&NFS_I(inode)->commits_outstanding);
788 if (!data->lseg) {
789 nfs_init_commit(data, mds_pages, NULL);
790 nfs_initiate_commit(data, NFS_CLIENT(inode),
791 data->mds_ops, how);
792 } else {
793 nfs_init_commit(data, &FILELAYOUT_LSEG(data->lseg)->commit_buckets[data->ds_commit_index], data->lseg);
794 filelayout_initiate_commit(data, how);
795 }
796 }
797 return 0;
798 out_bad:
799 list_for_each_entry_safe(data, tmp, &list, pages) {
800 nfs_retry_commit(&data->pages, data->lseg);
801 list_del_init(&data->pages);
802 nfs_commit_free(data);
803 }
804 nfs_retry_commit(mds_pages, NULL);
805 nfs_commit_clear_lock(NFS_I(inode));
806 return -ENOMEM;
807}
808
577static struct pnfs_layoutdriver_type filelayout_type = { 809static struct pnfs_layoutdriver_type filelayout_type = {
578 .id = LAYOUT_NFSV4_1_FILES, 810 .id = LAYOUT_NFSV4_1_FILES,
579 .name = "LAYOUT_NFSV4_1_FILES", 811 .name = "LAYOUT_NFSV4_1_FILES",
@@ -581,6 +813,9 @@ static struct pnfs_layoutdriver_type filelayout_type = {
581 .alloc_lseg = filelayout_alloc_lseg, 813 .alloc_lseg = filelayout_alloc_lseg,
582 .free_lseg = filelayout_free_lseg, 814 .free_lseg = filelayout_free_lseg,
583 .pg_test = filelayout_pg_test, 815 .pg_test = filelayout_pg_test,
816 .mark_pnfs_commit = filelayout_mark_pnfs_commit,
817 .choose_commit_list = filelayout_choose_commit_list,
818 .commit_pagelist = filelayout_commit_pagelist,
584 .read_pagelist = filelayout_read_pagelist, 819 .read_pagelist = filelayout_read_pagelist,
585 .write_pagelist = filelayout_write_pagelist, 820 .write_pagelist = filelayout_write_pagelist,
586}; 821};