diff options
author | Theodore Ts'o <tytso@mit.edu> | 2014-02-15 21:33:13 -0500 |
---|---|---|
committer | Greg Kroah-Hartman <gregkh@linuxfoundation.org> | 2014-03-07 00:30:00 -0500 |
commit | 94a197c6bc4976fdec2ea37a0612df226839c541 (patch) | |
tree | 6d0dcf35195e9ef1a444d0ad45f45933793fe819 /fs | |
parent | f13ea132887a8649cc6d45942e2be27f4362351f (diff) |
ext4: fix online resize with very large inode tables
commit b93c95353413041a8cebad915a8109619f66bcc6 upstream.
If a file system has a large number of inodes per block group, all of
the metadata blocks in a flex_bg may be larger than what can fit in a
single block group. Unfortunately, ext4_alloc_group_tables() in
resize.c was never tested to see if it would handle this case
correctly, and there were a large number of bugs which caused the
following sequence to result in a BUG_ON:
kernel bug at fs/ext4/resize.c:409!
...
call trace:
[<ffffffff81256768>] ext4_flex_group_add+0x1448/0x1830
[<ffffffff81257de2>] ext4_resize_fs+0x7b2/0xe80
[<ffffffff8123ac50>] ext4_ioctl+0xbf0/0xf00
[<ffffffff811c111d>] do_vfs_ioctl+0x2dd/0x4b0
[<ffffffff811b9df2>] ? final_putname+0x22/0x50
[<ffffffff811c1371>] sys_ioctl+0x81/0xa0
[<ffffffff81676aa9>] system_call_fastpath+0x16/0x1b
code: c8 4c 89 df e8 41 96 f8 ff 44 89 e8 49 01 c4 44 29 6d d4 0
rip [<ffffffff81254fa1>] set_flexbg_block_bitmap+0x171/0x180
This can be reproduced with the following command sequence:
mke2fs -t ext4 -i 4096 /dev/vdd 1G
mount -t ext4 /dev/vdd /vdd
resize2fs /dev/vdd 8G
To fix this, we need to make sure the right thing happens when a block
group's inode table straddles two block groups, which means the
following bugs had to be fixed:
1) Not clearing the BLOCK_UNINIT flag in the second block group in
ext4_alloc_group_tables --- the was proximate cause of the BUG_ON.
2) Incorrectly determining how many block groups contained contiguous
free blocks in ext4_alloc_group_tables().
3) Incorrectly setting the start of the next block range to be marked
in use after a discontinuity in setup_new_flex_group_blocks().
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Diffstat (limited to 'fs')
-rw-r--r-- | fs/ext4/resize.c | 32 |
1 files changed, 20 insertions, 12 deletions
diff --git a/fs/ext4/resize.c b/fs/ext4/resize.c index 49d3c01eabf8..6bb79434861f 100644 --- a/fs/ext4/resize.c +++ b/fs/ext4/resize.c | |||
@@ -238,6 +238,7 @@ static int ext4_alloc_group_tables(struct super_block *sb, | |||
238 | ext4_group_t group; | 238 | ext4_group_t group; |
239 | ext4_group_t last_group; | 239 | ext4_group_t last_group; |
240 | unsigned overhead; | 240 | unsigned overhead; |
241 | __u16 uninit_mask = (flexbg_size > 1) ? ~EXT4_BG_BLOCK_UNINIT : ~0; | ||
241 | 242 | ||
242 | BUG_ON(flex_gd->count == 0 || group_data == NULL); | 243 | BUG_ON(flex_gd->count == 0 || group_data == NULL); |
243 | 244 | ||
@@ -261,7 +262,7 @@ next_group: | |||
261 | src_group++; | 262 | src_group++; |
262 | for (; src_group <= last_group; src_group++) { | 263 | for (; src_group <= last_group; src_group++) { |
263 | overhead = ext4_group_overhead_blocks(sb, src_group); | 264 | overhead = ext4_group_overhead_blocks(sb, src_group); |
264 | if (overhead != 0) | 265 | if (overhead == 0) |
265 | last_blk += group_data[src_group - group].blocks_count; | 266 | last_blk += group_data[src_group - group].blocks_count; |
266 | else | 267 | else |
267 | break; | 268 | break; |
@@ -275,8 +276,7 @@ next_group: | |||
275 | group = ext4_get_group_number(sb, start_blk - 1); | 276 | group = ext4_get_group_number(sb, start_blk - 1); |
276 | group -= group_data[0].group; | 277 | group -= group_data[0].group; |
277 | group_data[group].free_blocks_count--; | 278 | group_data[group].free_blocks_count--; |
278 | if (flexbg_size > 1) | 279 | flex_gd->bg_flags[group] &= uninit_mask; |
279 | flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; | ||
280 | } | 280 | } |
281 | 281 | ||
282 | /* Allocate inode bitmaps */ | 282 | /* Allocate inode bitmaps */ |
@@ -287,22 +287,30 @@ next_group: | |||
287 | group = ext4_get_group_number(sb, start_blk - 1); | 287 | group = ext4_get_group_number(sb, start_blk - 1); |
288 | group -= group_data[0].group; | 288 | group -= group_data[0].group; |
289 | group_data[group].free_blocks_count--; | 289 | group_data[group].free_blocks_count--; |
290 | if (flexbg_size > 1) | 290 | flex_gd->bg_flags[group] &= uninit_mask; |
291 | flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; | ||
292 | } | 291 | } |
293 | 292 | ||
294 | /* Allocate inode tables */ | 293 | /* Allocate inode tables */ |
295 | for (; it_index < flex_gd->count; it_index++) { | 294 | for (; it_index < flex_gd->count; it_index++) { |
296 | if (start_blk + EXT4_SB(sb)->s_itb_per_group > last_blk) | 295 | unsigned int itb = EXT4_SB(sb)->s_itb_per_group; |
296 | ext4_fsblk_t next_group_start; | ||
297 | |||
298 | if (start_blk + itb > last_blk) | ||
297 | goto next_group; | 299 | goto next_group; |
298 | group_data[it_index].inode_table = start_blk; | 300 | group_data[it_index].inode_table = start_blk; |
299 | group = ext4_get_group_number(sb, start_blk - 1); | 301 | group = ext4_get_group_number(sb, start_blk); |
302 | next_group_start = ext4_group_first_block_no(sb, group + 1); | ||
300 | group -= group_data[0].group; | 303 | group -= group_data[0].group; |
301 | group_data[group].free_blocks_count -= | ||
302 | EXT4_SB(sb)->s_itb_per_group; | ||
303 | if (flexbg_size > 1) | ||
304 | flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT; | ||
305 | 304 | ||
305 | if (start_blk + itb > next_group_start) { | ||
306 | flex_gd->bg_flags[group + 1] &= uninit_mask; | ||
307 | overhead = start_blk + itb - next_group_start; | ||
308 | group_data[group + 1].free_blocks_count -= overhead; | ||
309 | itb -= overhead; | ||
310 | } | ||
311 | |||
312 | group_data[group].free_blocks_count -= itb; | ||
313 | flex_gd->bg_flags[group] &= uninit_mask; | ||
306 | start_blk += EXT4_SB(sb)->s_itb_per_group; | 314 | start_blk += EXT4_SB(sb)->s_itb_per_group; |
307 | } | 315 | } |
308 | 316 | ||
@@ -615,7 +623,7 @@ handle_ib: | |||
615 | if (err) | 623 | if (err) |
616 | goto out; | 624 | goto out; |
617 | count = group_table_count[j]; | 625 | count = group_table_count[j]; |
618 | start = group_data[i].block_bitmap; | 626 | start = (&group_data[i].block_bitmap)[j]; |
619 | block = start; | 627 | block = start; |
620 | } | 628 | } |
621 | 629 | ||