diff options
author | Josef Bacik <jbacik@fb.com> | 2015-02-11 15:08:59 -0500 |
---|---|---|
committer | Chris Mason <clm@fb.com> | 2015-02-14 11:22:48 -0500 |
commit | dcab6a3b2ae657a2017637083c28ee303b6b1b8e (patch) | |
tree | 4aa9951e7ab997702f90aec9882f305e1885fc40 /fs/btrfs/extent-tree.c | |
parent | 3266789f9d08b27275bae5ab1dcd27d1bbf15e79 (diff) |
Btrfs: account for large extents with enospc
On our gluster boxes we stream large tar balls of backups onto our fses. With
160gb of ram this means we get really large contiguous ranges of dirty data, but
the way our ENOSPC stuff works is that as long as it's contiguous we only hold
metadata reservation for one extent. The problem is we limit our extents to
128mb, so we'll end up with at least 800 extents so our enospc accounting is
quite a bit lower than what we need. To keep track of this make sure we
increase outstanding_extents for every multiple of the max extent size so we can
be sure to have enough reserved metadata space. Thanks,
Signed-off-by: Josef Bacik <jbacik@fb.com>
Signed-off-by: Chris Mason <clm@fb.com>
Diffstat (limited to 'fs/btrfs/extent-tree.c')
-rw-r--r-- | fs/btrfs/extent-tree.c | 16 |
1 files changed, 11 insertions, 5 deletions
diff --git a/fs/btrfs/extent-tree.c b/fs/btrfs/extent-tree.c index 50de1fa6fc9e..0f6737063142 100644 --- a/fs/btrfs/extent-tree.c +++ b/fs/btrfs/extent-tree.c | |||
@@ -4963,19 +4963,25 @@ void btrfs_subvolume_release_metadata(struct btrfs_root *root, | |||
4963 | /** | 4963 | /** |
4964 | * drop_outstanding_extent - drop an outstanding extent | 4964 | * drop_outstanding_extent - drop an outstanding extent |
4965 | * @inode: the inode we're dropping the extent for | 4965 | * @inode: the inode we're dropping the extent for |
4966 | * @num_bytes: the number of bytes we're relaseing. | ||
4966 | * | 4967 | * |
4967 | * This is called when we are freeing up an outstanding extent, either called | 4968 | * This is called when we are freeing up an outstanding extent, either called |
4968 | * after an error or after an extent is written. This will return the number of | 4969 | * after an error or after an extent is written. This will return the number of |
4969 | * reserved extents that need to be freed. This must be called with | 4970 | * reserved extents that need to be freed. This must be called with |
4970 | * BTRFS_I(inode)->lock held. | 4971 | * BTRFS_I(inode)->lock held. |
4971 | */ | 4972 | */ |
4972 | static unsigned drop_outstanding_extent(struct inode *inode) | 4973 | static unsigned drop_outstanding_extent(struct inode *inode, u64 num_bytes) |
4973 | { | 4974 | { |
4974 | unsigned drop_inode_space = 0; | 4975 | unsigned drop_inode_space = 0; |
4975 | unsigned dropped_extents = 0; | 4976 | unsigned dropped_extents = 0; |
4977 | unsigned num_extents = 0; | ||
4976 | 4978 | ||
4977 | BUG_ON(!BTRFS_I(inode)->outstanding_extents); | 4979 | num_extents = (unsigned)div64_u64(num_bytes + |
4978 | BTRFS_I(inode)->outstanding_extents--; | 4980 | BTRFS_MAX_EXTENT_SIZE - 1, |
4981 | BTRFS_MAX_EXTENT_SIZE); | ||
4982 | ASSERT(num_extents); | ||
4983 | ASSERT(BTRFS_I(inode)->outstanding_extents >= num_extents); | ||
4984 | BTRFS_I(inode)->outstanding_extents -= num_extents; | ||
4979 | 4985 | ||
4980 | if (BTRFS_I(inode)->outstanding_extents == 0 && | 4986 | if (BTRFS_I(inode)->outstanding_extents == 0 && |
4981 | test_and_clear_bit(BTRFS_INODE_DELALLOC_META_RESERVED, | 4987 | test_and_clear_bit(BTRFS_INODE_DELALLOC_META_RESERVED, |
@@ -5146,7 +5152,7 @@ int btrfs_delalloc_reserve_metadata(struct inode *inode, u64 num_bytes) | |||
5146 | 5152 | ||
5147 | out_fail: | 5153 | out_fail: |
5148 | spin_lock(&BTRFS_I(inode)->lock); | 5154 | spin_lock(&BTRFS_I(inode)->lock); |
5149 | dropped = drop_outstanding_extent(inode); | 5155 | dropped = drop_outstanding_extent(inode, num_bytes); |
5150 | /* | 5156 | /* |
5151 | * If the inodes csum_bytes is the same as the original | 5157 | * If the inodes csum_bytes is the same as the original |
5152 | * csum_bytes then we know we haven't raced with any free()ers | 5158 | * csum_bytes then we know we haven't raced with any free()ers |
@@ -5225,7 +5231,7 @@ void btrfs_delalloc_release_metadata(struct inode *inode, u64 num_bytes) | |||
5225 | 5231 | ||
5226 | num_bytes = ALIGN(num_bytes, root->sectorsize); | 5232 | num_bytes = ALIGN(num_bytes, root->sectorsize); |
5227 | spin_lock(&BTRFS_I(inode)->lock); | 5233 | spin_lock(&BTRFS_I(inode)->lock); |
5228 | dropped = drop_outstanding_extent(inode); | 5234 | dropped = drop_outstanding_extent(inode, num_bytes); |
5229 | 5235 | ||
5230 | if (num_bytes) | 5236 | if (num_bytes) |
5231 | to_free = calc_csum_metadata_size(inode, num_bytes, 0); | 5237 | to_free = calc_csum_metadata_size(inode, num_bytes, 0); |