diff options
author | Dmitry Monakhov <dmonakhov@openvz.org> | 2013-03-04 00:34:34 -0500 |
---|---|---|
committer | Theodore Ts'o <tytso@mit.edu> | 2013-03-04 00:34:34 -0500 |
commit | 357b66fdc8ad4cea6e6336956a70742f961f0a4d (patch) | |
tree | bbb15a0d60de8c3ab70595484e72b3ef38515026 | |
parent | 9b2ff35753c0512bc8c6adae9e9c87cbeee86f82 (diff) |
ext4: ext4_split_extent should take care of extent zeroout
When ext4_split_extent_at() ends up doing zeroout & conversion to
initialized instead of split & conversion, ext4_split_extent() gets
confused and can wrongly mark the extent back as uninitialized
resulting in end IO code getting confused from large unwritten extents
and may result in data loss.
The example of problematic behavior is:
lblk len lblk len
ext4_split_extent() (ex=[1000,30,uninit], map=[1010,10])
ext4_split_extent_at() (split [1000,30,uninit] at 1020)
ext4_ext_insert_extent() -> ENOSPC
ext4_ext_zeroout()
-> extent [1000,30] is now initialized
ext4_split_extent_at() (split [1000,30,init] at 1010,
MARK_UNINIT1 | MARK_UNINIT2)
-> extent is split and parts marked as uninitialized
Fix the problem by rechecking extent type after the first
ext4_split_extent_at() returns. None of split_flags can not be applied
to initialized extent so this patch also add BUG_ON to prevent similar
issues in future.
TESTCASE: https://github.com/dmonakhov/xfstests/commit/b8a55eb5ce28c6ff29e620ab090902fcd5833597
Signed-off-by: Dmitry Monakhov <dmonakhov@openvz.org>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
Reviewed-by: Jan Kara <jack@suse.cz>
-rw-r--r-- | fs/ext4/extents.c | 23 |
1 files changed, 17 insertions, 6 deletions
diff --git a/fs/ext4/extents.c b/fs/ext4/extents.c index 372b2cbee07e..bef194a14437 100644 --- a/fs/ext4/extents.c +++ b/fs/ext4/extents.c | |||
@@ -2943,6 +2943,10 @@ static int ext4_split_extent_at(handle_t *handle, | |||
2943 | newblock = split - ee_block + ext4_ext_pblock(ex); | 2943 | newblock = split - ee_block + ext4_ext_pblock(ex); |
2944 | 2944 | ||
2945 | BUG_ON(split < ee_block || split >= (ee_block + ee_len)); | 2945 | BUG_ON(split < ee_block || split >= (ee_block + ee_len)); |
2946 | BUG_ON(!ext4_ext_is_uninitialized(ex) && | ||
2947 | split_flag & (EXT4_EXT_MAY_ZEROOUT | | ||
2948 | EXT4_EXT_MARK_UNINIT1 | | ||
2949 | EXT4_EXT_MARK_UNINIT2)); | ||
2946 | 2950 | ||
2947 | err = ext4_ext_get_access(handle, inode, path + depth); | 2951 | err = ext4_ext_get_access(handle, inode, path + depth); |
2948 | if (err) | 2952 | if (err) |
@@ -3061,19 +3065,26 @@ static int ext4_split_extent(handle_t *handle, | |||
3061 | if (err) | 3065 | if (err) |
3062 | goto out; | 3066 | goto out; |
3063 | } | 3067 | } |
3064 | 3068 | /* | |
3069 | * Update path is required because previous ext4_split_extent_at() may | ||
3070 | * result in split of original leaf or extent zeroout. | ||
3071 | */ | ||
3065 | ext4_ext_drop_refs(path); | 3072 | ext4_ext_drop_refs(path); |
3066 | path = ext4_ext_find_extent(inode, map->m_lblk, path); | 3073 | path = ext4_ext_find_extent(inode, map->m_lblk, path); |
3067 | if (IS_ERR(path)) | 3074 | if (IS_ERR(path)) |
3068 | return PTR_ERR(path); | 3075 | return PTR_ERR(path); |
3076 | depth = ext_depth(inode); | ||
3077 | ex = path[depth].p_ext; | ||
3078 | uninitialized = ext4_ext_is_uninitialized(ex); | ||
3079 | split_flag1 = 0; | ||
3069 | 3080 | ||
3070 | if (map->m_lblk >= ee_block) { | 3081 | if (map->m_lblk >= ee_block) { |
3071 | split_flag1 = split_flag & (EXT4_EXT_MAY_ZEROOUT | | 3082 | split_flag1 = split_flag & EXT4_EXT_DATA_VALID2; |
3072 | EXT4_EXT_DATA_VALID2); | 3083 | if (uninitialized) { |
3073 | if (uninitialized) | ||
3074 | split_flag1 |= EXT4_EXT_MARK_UNINIT1; | 3084 | split_flag1 |= EXT4_EXT_MARK_UNINIT1; |
3075 | if (split_flag & EXT4_EXT_MARK_UNINIT2) | 3085 | split_flag1 |= split_flag & (EXT4_EXT_MAY_ZEROOUT | |
3076 | split_flag1 |= EXT4_EXT_MARK_UNINIT2; | 3086 | EXT4_EXT_MARK_UNINIT2); |
3087 | } | ||
3077 | err = ext4_split_extent_at(handle, inode, path, | 3088 | err = ext4_split_extent_at(handle, inode, path, |
3078 | map->m_lblk, split_flag1, flags); | 3089 | map->m_lblk, split_flag1, flags); |
3079 | if (err) | 3090 | if (err) |