diff options
author | Yan, Zheng <zheng.z.yan@intel.com> | 2013-07-02 00:40:19 -0400 |
---|---|---|
committer | Sage Weil <sage@inktank.com> | 2013-07-03 18:32:56 -0400 |
commit | b415bf4f9fe25f39934f5c464125e4a2dffb6d08 (patch) | |
tree | f38df9c1746a1419e7942afb4534625175a5d353 /fs/ceph/inode.c | |
parent | 5446429630257f4723829409337a26c076907d5d (diff) |
ceph: fix pending vmtruncate race
The locking order for pending vmtruncate is wrong; it can lead to the
following race:
write                        vmtruncate work
------------------------     ------------------------
lock i_mutex
check i_truncate_pending     check i_truncate_pending
truncate_inode_pages()       lock i_mutex (blocked)
copy data to page cache
unlock i_mutex
                             truncate_inode_pages()
The fix is to take i_mutex before calling __ceph_do_pending_vmtruncate().
Fixes: http://tracker.ceph.com/issues/5453
Signed-off-by: Yan, Zheng <zheng.z.yan@intel.com>
Reviewed-by: Sage Weil <sage@inktank.com>
Diffstat (limited to 'fs/ceph/inode.c')
-rw-r--r-- | fs/ceph/inode.c | 14 |
1 files changed, 6 insertions, 8 deletions
diff --git a/fs/ceph/inode.c b/fs/ceph/inode.c index be0f7e20d62e..4906ada4a97c 100644 --- a/fs/ceph/inode.c +++ b/fs/ceph/inode.c | |||
@@ -1465,7 +1465,9 @@ static void ceph_vmtruncate_work(struct work_struct *work) | |||
1465 | struct inode *inode = &ci->vfs_inode; | 1465 | struct inode *inode = &ci->vfs_inode; |
1466 | 1466 | ||
1467 | dout("vmtruncate_work %p\n", inode); | 1467 | dout("vmtruncate_work %p\n", inode); |
1468 | __ceph_do_pending_vmtruncate(inode, true); | 1468 | mutex_lock(&inode->i_mutex); |
1469 | __ceph_do_pending_vmtruncate(inode); | ||
1470 | mutex_unlock(&inode->i_mutex); | ||
1469 | iput(inode); | 1471 | iput(inode); |
1470 | } | 1472 | } |
1471 | 1473 | ||
@@ -1492,7 +1494,7 @@ void ceph_queue_vmtruncate(struct inode *inode) | |||
1492 | * Make sure any pending truncation is applied before doing anything | 1494 | * Make sure any pending truncation is applied before doing anything |
1493 | * that may depend on it. | 1495 | * that may depend on it. |
1494 | */ | 1496 | */ |
1495 | void __ceph_do_pending_vmtruncate(struct inode *inode, bool needlock) | 1497 | void __ceph_do_pending_vmtruncate(struct inode *inode) |
1496 | { | 1498 | { |
1497 | struct ceph_inode_info *ci = ceph_inode(inode); | 1499 | struct ceph_inode_info *ci = ceph_inode(inode); |
1498 | u64 to; | 1500 | u64 to; |
@@ -1525,11 +1527,7 @@ retry: | |||
1525 | ci->i_truncate_pending, to); | 1527 | ci->i_truncate_pending, to); |
1526 | spin_unlock(&ci->i_ceph_lock); | 1528 | spin_unlock(&ci->i_ceph_lock); |
1527 | 1529 | ||
1528 | if (needlock) | ||
1529 | mutex_lock(&inode->i_mutex); | ||
1530 | truncate_inode_pages(inode->i_mapping, to); | 1530 | truncate_inode_pages(inode->i_mapping, to); |
1531 | if (needlock) | ||
1532 | mutex_unlock(&inode->i_mutex); | ||
1533 | 1531 | ||
1534 | spin_lock(&ci->i_ceph_lock); | 1532 | spin_lock(&ci->i_ceph_lock); |
1535 | if (to == ci->i_truncate_size) { | 1533 | if (to == ci->i_truncate_size) { |
@@ -1588,7 +1586,7 @@ int ceph_setattr(struct dentry *dentry, struct iattr *attr) | |||
1588 | if (ceph_snap(inode) != CEPH_NOSNAP) | 1586 | if (ceph_snap(inode) != CEPH_NOSNAP) |
1589 | return -EROFS; | 1587 | return -EROFS; |
1590 | 1588 | ||
1591 | __ceph_do_pending_vmtruncate(inode, false); | 1589 | __ceph_do_pending_vmtruncate(inode); |
1592 | 1590 | ||
1593 | err = inode_change_ok(inode, attr); | 1591 | err = inode_change_ok(inode, attr); |
1594 | if (err != 0) | 1592 | if (err != 0) |
@@ -1770,7 +1768,7 @@ int ceph_setattr(struct dentry *dentry, struct iattr *attr) | |||
1770 | ceph_cap_string(dirtied), mask); | 1768 | ceph_cap_string(dirtied), mask); |
1771 | 1769 | ||
1772 | ceph_mdsc_put_request(req); | 1770 | ceph_mdsc_put_request(req); |
1773 | __ceph_do_pending_vmtruncate(inode, false); | 1771 | __ceph_do_pending_vmtruncate(inode); |
1774 | return err; | 1772 | return err; |
1775 | out: | 1773 | out: |
1776 | spin_unlock(&ci->i_ceph_lock); | 1774 | spin_unlock(&ci->i_ceph_lock); |