aboutsummaryrefslogtreecommitdiffstats
path: root/fs
diff options
context:
space:
mode:
authorTheodore Ts'o <tytso@mit.edu>2014-02-15 21:33:13 -0500
committerGreg Kroah-Hartman <gregkh@linuxfoundation.org>2014-03-07 00:30:00 -0500
commit94a197c6bc4976fdec2ea37a0612df226839c541 (patch)
tree6d0dcf35195e9ef1a444d0ad45f45933793fe819 /fs
parentf13ea132887a8649cc6d45942e2be27f4362351f (diff)
ext4: fix online resize with very large inode tables
commit b93c95353413041a8cebad915a8109619f66bcc6 upstream. If a file system has a large number of inodes per block group, all of the metadata blocks in a flex_bg may be larger than what can fit in a single block group. Unfortunately, ext4_alloc_group_tables() in resize.c was never tested to see if it would handle this case correctly, and there were a large number of bugs which caused the following sequence to result in a BUG_ON: kernel bug at fs/ext4/resize.c:409! ... call trace: [<ffffffff81256768>] ext4_flex_group_add+0x1448/0x1830 [<ffffffff81257de2>] ext4_resize_fs+0x7b2/0xe80 [<ffffffff8123ac50>] ext4_ioctl+0xbf0/0xf00 [<ffffffff811c111d>] do_vfs_ioctl+0x2dd/0x4b0 [<ffffffff811b9df2>] ? final_putname+0x22/0x50 [<ffffffff811c1371>] sys_ioctl+0x81/0xa0 [<ffffffff81676aa9>] system_call_fastpath+0x16/0x1b code: c8 4c 89 df e8 41 96 f8 ff 44 89 e8 49 01 c4 44 29 6d d4 0 rip [<ffffffff81254fa1>] set_flexbg_block_bitmap+0x171/0x180 This can be reproduced with the following command sequence: mke2fs -t ext4 -i 4096 /dev/vdd 1G mount -t ext4 /dev/vdd /vdd resize2fs /dev/vdd 8G To fix this, we need to make sure the right thing happens when a block group's inode table straddles two block groups, which means the following bugs had to be fixed: 1) Not clearing the BLOCK_UNINIT flag in the second block group in ext4_alloc_group_tables --- the was proximate cause of the BUG_ON. 2) Incorrectly determining how many block groups contained contiguous free blocks in ext4_alloc_group_tables(). 3) Incorrectly setting the start of the next block range to be marked in use after a discontinuity in setup_new_flex_group_blocks(). Signed-off-by: "Theodore Ts'o" <tytso@mit.edu> Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Diffstat (limited to 'fs')
-rw-r--r--fs/ext4/resize.c32
1 files changed, 20 insertions, 12 deletions
diff --git a/fs/ext4/resize.c b/fs/ext4/resize.c
index 49d3c01eabf8..6bb79434861f 100644
--- a/fs/ext4/resize.c
+++ b/fs/ext4/resize.c
@@ -238,6 +238,7 @@ static int ext4_alloc_group_tables(struct super_block *sb,
238 ext4_group_t group; 238 ext4_group_t group;
239 ext4_group_t last_group; 239 ext4_group_t last_group;
240 unsigned overhead; 240 unsigned overhead;
241 __u16 uninit_mask = (flexbg_size > 1) ? ~EXT4_BG_BLOCK_UNINIT : ~0;
241 242
242 BUG_ON(flex_gd->count == 0 || group_data == NULL); 243 BUG_ON(flex_gd->count == 0 || group_data == NULL);
243 244
@@ -261,7 +262,7 @@ next_group:
261 src_group++; 262 src_group++;
262 for (; src_group <= last_group; src_group++) { 263 for (; src_group <= last_group; src_group++) {
263 overhead = ext4_group_overhead_blocks(sb, src_group); 264 overhead = ext4_group_overhead_blocks(sb, src_group);
264 if (overhead != 0) 265 if (overhead == 0)
265 last_blk += group_data[src_group - group].blocks_count; 266 last_blk += group_data[src_group - group].blocks_count;
266 else 267 else
267 break; 268 break;
@@ -275,8 +276,7 @@ next_group:
275 group = ext4_get_group_number(sb, start_blk - 1); 276 group = ext4_get_group_number(sb, start_blk - 1);
276 group -= group_data[0].group; 277 group -= group_data[0].group;
277 group_data[group].free_blocks_count--; 278 group_data[group].free_blocks_count--;
278 if (flexbg_size > 1) 279 flex_gd->bg_flags[group] &= uninit_mask;
279 flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT;
280 } 280 }
281 281
282 /* Allocate inode bitmaps */ 282 /* Allocate inode bitmaps */
@@ -287,22 +287,30 @@ next_group:
287 group = ext4_get_group_number(sb, start_blk - 1); 287 group = ext4_get_group_number(sb, start_blk - 1);
288 group -= group_data[0].group; 288 group -= group_data[0].group;
289 group_data[group].free_blocks_count--; 289 group_data[group].free_blocks_count--;
290 if (flexbg_size > 1) 290 flex_gd->bg_flags[group] &= uninit_mask;
291 flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT;
292 } 291 }
293 292
294 /* Allocate inode tables */ 293 /* Allocate inode tables */
295 for (; it_index < flex_gd->count; it_index++) { 294 for (; it_index < flex_gd->count; it_index++) {
296 if (start_blk + EXT4_SB(sb)->s_itb_per_group > last_blk) 295 unsigned int itb = EXT4_SB(sb)->s_itb_per_group;
296 ext4_fsblk_t next_group_start;
297
298 if (start_blk + itb > last_blk)
297 goto next_group; 299 goto next_group;
298 group_data[it_index].inode_table = start_blk; 300 group_data[it_index].inode_table = start_blk;
299 group = ext4_get_group_number(sb, start_blk - 1); 301 group = ext4_get_group_number(sb, start_blk);
302 next_group_start = ext4_group_first_block_no(sb, group + 1);
300 group -= group_data[0].group; 303 group -= group_data[0].group;
301 group_data[group].free_blocks_count -=
302 EXT4_SB(sb)->s_itb_per_group;
303 if (flexbg_size > 1)
304 flex_gd->bg_flags[group] &= ~EXT4_BG_BLOCK_UNINIT;
305 304
305 if (start_blk + itb > next_group_start) {
306 flex_gd->bg_flags[group + 1] &= uninit_mask;
307 overhead = start_blk + itb - next_group_start;
308 group_data[group + 1].free_blocks_count -= overhead;
309 itb -= overhead;
310 }
311
312 group_data[group].free_blocks_count -= itb;
313 flex_gd->bg_flags[group] &= uninit_mask;
306 start_blk += EXT4_SB(sb)->s_itb_per_group; 314 start_blk += EXT4_SB(sb)->s_itb_per_group;
307 } 315 }
308 316
@@ -615,7 +623,7 @@ handle_ib:
615 if (err) 623 if (err)
616 goto out; 624 goto out;
617 count = group_table_count[j]; 625 count = group_table_count[j];
618 start = group_data[i].block_bitmap; 626 start = (&group_data[i].block_bitmap)[j];
619 block = start; 627 block = start;
620 } 628 }
621 629