aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--fs/xfs/xfs_dfrag.c14
-rw-r--r--fs/xfs/xfs_inode.h1
-rw-r--r--fs/xfs/xfs_vnodeops.c162
3 files changed, 44 insertions, 133 deletions
diff --git a/fs/xfs/xfs_dfrag.c b/fs/xfs/xfs_dfrag.c
index d92407842e3b..5ce91a00425f 100644
--- a/fs/xfs/xfs_dfrag.c
+++ b/fs/xfs/xfs_dfrag.c
@@ -128,7 +128,6 @@ xfs_swap_extents(
128 xfs_swapext_t *sxp) 128 xfs_swapext_t *sxp)
129{ 129{
130 xfs_mount_t *mp; 130 xfs_mount_t *mp;
131 xfs_inode_t *ips[2];
132 xfs_trans_t *tp; 131 xfs_trans_t *tp;
133 xfs_bstat_t *sbp = &sxp->sx_stat; 132 xfs_bstat_t *sbp = &sxp->sx_stat;
134 bhv_vnode_t *vp, *tvp; 133 bhv_vnode_t *vp, *tvp;
@@ -153,16 +152,7 @@ xfs_swap_extents(
153 vp = VFS_I(ip); 152 vp = VFS_I(ip);
154 tvp = VFS_I(tip); 153 tvp = VFS_I(tip);
155 154
156 /* Lock in i_ino order */ 155 xfs_lock_two_inodes(ip, tip, lock_flags);
157 if (ip->i_ino < tip->i_ino) {
158 ips[0] = ip;
159 ips[1] = tip;
160 } else {
161 ips[0] = tip;
162 ips[1] = ip;
163 }
164
165 xfs_lock_inodes(ips, 2, lock_flags);
166 locked = 1; 156 locked = 1;
167 157
168 /* Verify that both files have the same format */ 158 /* Verify that both files have the same format */
@@ -265,7 +255,7 @@ xfs_swap_extents(
265 locked = 0; 255 locked = 0;
266 goto error0; 256 goto error0;
267 } 257 }
268 xfs_lock_inodes(ips, 2, XFS_ILOCK_EXCL); 258 xfs_lock_two_inodes(ip, tip, XFS_ILOCK_EXCL);
269 259
270 /* 260 /*
271 * Count the number of extended attribute blocks 261 * Count the number of extended attribute blocks
diff --git a/fs/xfs/xfs_inode.h b/fs/xfs/xfs_inode.h
index 4088951230aa..ec9f454b464e 100644
--- a/fs/xfs/xfs_inode.h
+++ b/fs/xfs/xfs_inode.h
@@ -531,6 +531,7 @@ void xfs_iflush_all(struct xfs_mount *);
531void xfs_ichgtime(xfs_inode_t *, int); 531void xfs_ichgtime(xfs_inode_t *, int);
532xfs_fsize_t xfs_file_last_byte(xfs_inode_t *); 532xfs_fsize_t xfs_file_last_byte(xfs_inode_t *);
533void xfs_lock_inodes(xfs_inode_t **, int, uint); 533void xfs_lock_inodes(xfs_inode_t **, int, uint);
534void xfs_lock_two_inodes(xfs_inode_t *, xfs_inode_t *, uint);
534 535
535void xfs_synchronize_atime(xfs_inode_t *); 536void xfs_synchronize_atime(xfs_inode_t *);
536void xfs_mark_inode_dirty_sync(xfs_inode_t *); 537void xfs_mark_inode_dirty_sync(xfs_inode_t *);
diff --git a/fs/xfs/xfs_vnodeops.c b/fs/xfs/xfs_vnodeops.c
index c5dc7ea85260..077c86b6cb22 100644
--- a/fs/xfs/xfs_vnodeops.c
+++ b/fs/xfs/xfs_vnodeops.c
@@ -1708,111 +1708,6 @@ std_return:
1708} 1708}
1709 1709
1710#ifdef DEBUG 1710#ifdef DEBUG
1711/*
1712 * Some counters to see if (and how often) we are hitting some deadlock
1713 * prevention code paths.
1714 */
1715
1716int xfs_rm_locks;
1717int xfs_rm_lock_delays;
1718int xfs_rm_attempts;
1719#endif
1720
1721/*
1722 * The following routine will lock the inodes associated with the
1723 * directory and the named entry in the directory. The locks are
1724 * acquired in increasing inode number.
1725 *
1726 * If the entry is "..", then only the directory is locked. The
1727 * vnode ref count will still include that from the .. entry in
1728 * this case.
1729 *
1730 * There is a deadlock we need to worry about. If the locked directory is
1731 * in the AIL, it might be blocking up the log. The next inode we lock
1732 * could be already locked by another thread waiting for log space (e.g
1733 * a permanent log reservation with a long running transaction (see
1734 * xfs_itruncate_finish)). To solve this, we must check if the directory
1735 * is in the ail and use lock_nowait. If we can't lock, we need to
1736 * drop the inode lock on the directory and try again. xfs_iunlock will
1737 * potentially push the tail if we were holding up the log.
1738 */
1739STATIC int
1740xfs_lock_dir_and_entry(
1741 xfs_inode_t *dp,
1742 xfs_inode_t *ip) /* inode of entry 'name' */
1743{
1744 int attempts;
1745 xfs_ino_t e_inum;
1746 xfs_inode_t *ips[2];
1747 xfs_log_item_t *lp;
1748
1749#ifdef DEBUG
1750 xfs_rm_locks++;
1751#endif
1752 attempts = 0;
1753
1754again:
1755 xfs_ilock(dp, XFS_ILOCK_EXCL | XFS_ILOCK_PARENT);
1756
1757 e_inum = ip->i_ino;
1758
1759 xfs_itrace_ref(ip);
1760
1761 /*
1762 * We want to lock in increasing inum. Since we've already
1763 * acquired the lock on the directory, we may need to release
1764 * if if the inum of the entry turns out to be less.
1765 */
1766 if (e_inum > dp->i_ino) {
1767 /*
1768 * We are already in the right order, so just
1769 * lock on the inode of the entry.
1770 * We need to use nowait if dp is in the AIL.
1771 */
1772
1773 lp = (xfs_log_item_t *)dp->i_itemp;
1774 if (lp && (lp->li_flags & XFS_LI_IN_AIL)) {
1775 if (!xfs_ilock_nowait(ip, XFS_ILOCK_EXCL)) {
1776 attempts++;
1777#ifdef DEBUG
1778 xfs_rm_attempts++;
1779#endif
1780
1781 /*
1782 * Unlock dp and try again.
1783 * xfs_iunlock will try to push the tail
1784 * if the inode is in the AIL.
1785 */
1786
1787 xfs_iunlock(dp, XFS_ILOCK_EXCL);
1788
1789 if ((attempts % 5) == 0) {
1790 delay(1); /* Don't just spin the CPU */
1791#ifdef DEBUG
1792 xfs_rm_lock_delays++;
1793#endif
1794 }
1795 goto again;
1796 }
1797 } else {
1798 xfs_ilock(ip, XFS_ILOCK_EXCL);
1799 }
1800 } else if (e_inum < dp->i_ino) {
1801 xfs_iunlock(dp, XFS_ILOCK_EXCL);
1802
1803 ips[0] = ip;
1804 ips[1] = dp;
1805 xfs_lock_inodes(ips, 2, XFS_ILOCK_EXCL);
1806 }
1807 /* else e_inum == dp->i_ino */
1808 /* This can happen if we're asked to lock /x/..
1809 * the entry is "..", which is also the parent directory.
1810 */
1811
1812 return 0;
1813}
1814
1815#ifdef DEBUG
1816int xfs_locked_n; 1711int xfs_locked_n;
1817int xfs_small_retries; 1712int xfs_small_retries;
1818int xfs_middle_retries; 1713int xfs_middle_retries;
@@ -1946,6 +1841,45 @@ again:
1946#endif 1841#endif
1947} 1842}
1948 1843
1844void
1845xfs_lock_two_inodes(
1846 xfs_inode_t *ip0,
1847 xfs_inode_t *ip1,
1848 uint lock_mode)
1849{
1850 xfs_inode_t *temp;
1851 int attempts = 0;
1852 xfs_log_item_t *lp;
1853
1854 ASSERT(ip0->i_ino != ip1->i_ino);
1855
1856 if (ip0->i_ino > ip1->i_ino) {
1857 temp = ip0;
1858 ip0 = ip1;
1859 ip1 = temp;
1860 }
1861
1862 again:
1863 xfs_ilock(ip0, xfs_lock_inumorder(lock_mode, 0));
1864
1865 /*
1866 * If the first lock we have locked is in the AIL, we must TRY to get
1867 * the second lock. If we can't get it, we must release the first one
1868 * and try again.
1869 */
1870 lp = (xfs_log_item_t *)ip0->i_itemp;
1871 if (lp && (lp->li_flags & XFS_LI_IN_AIL)) {
1872 if (!xfs_ilock_nowait(ip1, xfs_lock_inumorder(lock_mode, 1))) {
1873 xfs_iunlock(ip0, lock_mode);
1874 if ((++attempts % 5) == 0)
1875 delay(1); /* Don't just spin the CPU */
1876 goto again;
1877 }
1878 } else {
1879 xfs_ilock(ip1, xfs_lock_inumorder(lock_mode, 1));
1880 }
1881}
1882
1949int 1883int
1950xfs_remove( 1884xfs_remove(
1951 xfs_inode_t *dp, 1885 xfs_inode_t *dp,
@@ -2018,9 +1952,7 @@ xfs_remove(
2018 goto out_trans_cancel; 1952 goto out_trans_cancel;
2019 } 1953 }
2020 1954
2021 error = xfs_lock_dir_and_entry(dp, ip); 1955 xfs_lock_two_inodes(dp, ip, XFS_ILOCK_EXCL);
2022 if (error)
2023 goto out_trans_cancel;
2024 1956
2025 /* 1957 /*
2026 * At this point, we've gotten both the directory and the entry 1958 * At this point, we've gotten both the directory and the entry
@@ -2047,9 +1979,6 @@ xfs_remove(
2047 } 1979 }
2048 } 1980 }
2049 1981
2050 /*
2051 * Entry must exist since we did a lookup in xfs_lock_dir_and_entry.
2052 */
2053 XFS_BMAP_INIT(&free_list, &first_block); 1982 XFS_BMAP_INIT(&free_list, &first_block);
2054 error = xfs_dir_removename(tp, dp, name, ip->i_ino, 1983 error = xfs_dir_removename(tp, dp, name, ip->i_ino,
2055 &first_block, &free_list, resblks); 1984 &first_block, &free_list, resblks);
@@ -2155,7 +2084,6 @@ xfs_link(
2155{ 2084{
2156 xfs_mount_t *mp = tdp->i_mount; 2085 xfs_mount_t *mp = tdp->i_mount;
2157 xfs_trans_t *tp; 2086 xfs_trans_t *tp;
2158 xfs_inode_t *ips[2];
2159 int error; 2087 int error;
2160 xfs_bmap_free_t free_list; 2088 xfs_bmap_free_t free_list;
2161 xfs_fsblock_t first_block; 2089 xfs_fsblock_t first_block;
@@ -2203,15 +2131,7 @@ xfs_link(
2203 goto error_return; 2131 goto error_return;
2204 } 2132 }
2205 2133
2206 if (sip->i_ino < tdp->i_ino) { 2134 xfs_lock_two_inodes(sip, tdp, XFS_ILOCK_EXCL);
2207 ips[0] = sip;
2208 ips[1] = tdp;
2209 } else {
2210 ips[0] = tdp;
2211 ips[1] = sip;
2212 }
2213
2214 xfs_lock_inodes(ips, 2, XFS_ILOCK_EXCL);
2215 2135
2216 /* 2136 /*
2217 * Increment vnode ref counts since xfs_trans_commit & 2137 * Increment vnode ref counts since xfs_trans_commit &