aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorTrond Myklebust <Trond.Myklebust@netapp.com>2012-09-11 16:01:22 -0400
committerTrond Myklebust <Trond.Myklebust@netapp.com>2012-09-28 16:03:05 -0400
commit05990d1bf2708b9e84d67074551f964d3738eedc (patch)
treeb4133627b503563eadea21aab695df78080402e1
parent795a88c968eef031f370973512b42124bacb2f17 (diff)
NFS: Fix fdatasync/fsync() when confronted with a server reboot
If the server reboots before it can commit the unstable writes to disk, then nfs_commit_release_pages() will detect this when it compares the verifier returned by COMMIT to the one returned by WRITE. When this happens, the client needs to resend those writes in order to guarantee that they make it to stable storage. This patch adds a signalling mechanism to notify fsync() that it needs to retry all writes before it can exit. Signed-off-by: Trond Myklebust <Trond.Myklebust@netapp.com>
-rw-r--r--fs/nfs/file.c34
-rw-r--r--fs/nfs/nfs4file.c22
-rw-r--r--fs/nfs/write.c1
-rw-r--r--include/linux/nfs_fs.h1
4 files changed, 36 insertions, 22 deletions
diff --git a/fs/nfs/file.c b/fs/nfs/file.c
index 6a7fcab7ecb..cc9b56691be 100644
--- a/fs/nfs/file.c
+++ b/fs/nfs/file.c
@@ -259,7 +259,7 @@ nfs_file_fsync_commit(struct file *file, loff_t start, loff_t end, int datasync)
259 struct dentry *dentry = file->f_path.dentry; 259 struct dentry *dentry = file->f_path.dentry;
260 struct nfs_open_context *ctx = nfs_file_open_context(file); 260 struct nfs_open_context *ctx = nfs_file_open_context(file);
261 struct inode *inode = dentry->d_inode; 261 struct inode *inode = dentry->d_inode;
262 int have_error, status; 262 int have_error, do_resend, status;
263 int ret = 0; 263 int ret = 0;
264 264
265 dprintk("NFS: fsync file(%s/%s) datasync %d\n", 265 dprintk("NFS: fsync file(%s/%s) datasync %d\n",
@@ -267,15 +267,23 @@ nfs_file_fsync_commit(struct file *file, loff_t start, loff_t end, int datasync)
267 datasync); 267 datasync);
268 268
269 nfs_inc_stats(inode, NFSIOS_VFSFSYNC); 269 nfs_inc_stats(inode, NFSIOS_VFSFSYNC);
270 do_resend = test_and_clear_bit(NFS_CONTEXT_RESEND_WRITES, &ctx->flags);
270 have_error = test_and_clear_bit(NFS_CONTEXT_ERROR_WRITE, &ctx->flags); 271 have_error = test_and_clear_bit(NFS_CONTEXT_ERROR_WRITE, &ctx->flags);
271 status = nfs_commit_inode(inode, FLUSH_SYNC); 272 status = nfs_commit_inode(inode, FLUSH_SYNC);
272 if (status >= 0 && ret < 0)
273 status = ret;
274 have_error |= test_bit(NFS_CONTEXT_ERROR_WRITE, &ctx->flags); 273 have_error |= test_bit(NFS_CONTEXT_ERROR_WRITE, &ctx->flags);
275 if (have_error) 274 if (have_error) {
276 ret = xchg(&ctx->error, 0); 275 ret = xchg(&ctx->error, 0);
277 if (!ret && status < 0) 276 if (ret)
277 goto out;
278 }
279 if (status < 0) {
278 ret = status; 280 ret = status;
281 goto out;
282 }
283 do_resend |= test_bit(NFS_CONTEXT_RESEND_WRITES, &ctx->flags);
284 if (do_resend)
285 ret = -EAGAIN;
286out:
279 return ret; 287 return ret;
280} 288}
281EXPORT_SYMBOL_GPL(nfs_file_fsync_commit); 289EXPORT_SYMBOL_GPL(nfs_file_fsync_commit);
@@ -286,13 +294,15 @@ nfs_file_fsync(struct file *file, loff_t start, loff_t end, int datasync)
286 int ret; 294 int ret;
287 struct inode *inode = file->f_path.dentry->d_inode; 295 struct inode *inode = file->f_path.dentry->d_inode;
288 296
289 ret = filemap_write_and_wait_range(inode->i_mapping, start, end); 297 do {
290 if (ret != 0) 298 ret = filemap_write_and_wait_range(inode->i_mapping, start, end);
291 goto out; 299 if (ret != 0)
292 mutex_lock(&inode->i_mutex); 300 break;
293 ret = nfs_file_fsync_commit(file, start, end, datasync); 301 mutex_lock(&inode->i_mutex);
294 mutex_unlock(&inode->i_mutex); 302 ret = nfs_file_fsync_commit(file, start, end, datasync);
295out: 303 mutex_unlock(&inode->i_mutex);
304 } while (ret == -EAGAIN);
305
296 return ret; 306 return ret;
297} 307}
298 308
diff --git a/fs/nfs/nfs4file.c b/fs/nfs/nfs4file.c
index eb5eb8eef4d..eef1b38a1b0 100644
--- a/fs/nfs/nfs4file.c
+++ b/fs/nfs/nfs4file.c
@@ -95,16 +95,18 @@ nfs4_file_fsync(struct file *file, loff_t start, loff_t end, int datasync)
95 int ret; 95 int ret;
96 struct inode *inode = file->f_path.dentry->d_inode; 96 struct inode *inode = file->f_path.dentry->d_inode;
97 97
98 ret = filemap_write_and_wait_range(inode->i_mapping, start, end); 98 do {
99 if (ret != 0) 99 ret = filemap_write_and_wait_range(inode->i_mapping, start, end);
100 goto out; 100 if (ret != 0)
101 mutex_lock(&inode->i_mutex); 101 break;
102 ret = nfs_file_fsync_commit(file, start, end, datasync); 102 mutex_lock(&inode->i_mutex);
103 if (!ret && !datasync) 103 ret = nfs_file_fsync_commit(file, start, end, datasync);
104 /* application has asked for meta-data sync */ 104 if (!ret && !datasync)
105 ret = pnfs_layoutcommit_inode(inode, true); 105 /* application has asked for meta-data sync */
106 mutex_unlock(&inode->i_mutex); 106 ret = pnfs_layoutcommit_inode(inode, true);
107out: 107 mutex_unlock(&inode->i_mutex);
108 } while (ret == -EAGAIN);
109
108 return ret; 110 return ret;
109} 111}
110 112
diff --git a/fs/nfs/write.c b/fs/nfs/write.c
index e1b5fe4d873..9347ab7c957 100644
--- a/fs/nfs/write.c
+++ b/fs/nfs/write.c
@@ -1580,6 +1580,7 @@ static void nfs_commit_release_pages(struct nfs_commit_data *data)
1580 /* We have a mismatch. Write the page again */ 1580 /* We have a mismatch. Write the page again */
1581 dprintk(" mismatch\n"); 1581 dprintk(" mismatch\n");
1582 nfs_mark_request_dirty(req); 1582 nfs_mark_request_dirty(req);
1583 set_bit(NFS_CONTEXT_RESEND_WRITES, &req->wb_context->flags);
1583 next: 1584 next:
1584 nfs_unlock_and_release_request(req); 1585 nfs_unlock_and_release_request(req);
1585 } 1586 }
diff --git a/include/linux/nfs_fs.h b/include/linux/nfs_fs.h
index 869eac0c263..383f3313f05 100644
--- a/include/linux/nfs_fs.h
+++ b/include/linux/nfs_fs.h
@@ -103,6 +103,7 @@ struct nfs_open_context {
103 103
104 unsigned long flags; 104 unsigned long flags;
105#define NFS_CONTEXT_ERROR_WRITE (0) 105#define NFS_CONTEXT_ERROR_WRITE (0)
106#define NFS_CONTEXT_RESEND_WRITES (1)
106 int error; 107 int error;
107 108
108 struct list_head list; 109 struct list_head list;