diff options
author | Pekka Enberg <penberg@cs.helsinki.fi> | 2009-02-15 18:07:52 -0500 |
---|---|---|
committer | Theodore Ts'o <tytso@mit.edu> | 2009-02-15 18:07:52 -0500 |
commit | 705895b61133ef43d106fe6a6bbdb2eec923867e (patch) | |
tree | ea05232098c0425fda052240a8bb0e6218bb5e82 /fs | |
parent | 3d0518f4758eca4339e75e5b9dbb7e06a5ce08b4 (diff) |
ext4: allocate ->s_blockgroup_lock separately
As spotted by kmemtrace, struct ext4_sb_info is 17664 bytes on 64-bit
which makes it a very bad fit for SLAB allocators. The culprit of the
wasted memory is ->s_blockgroup_lock which can be as big as 16 KB when
NR_CPUS >= 32.
To fix that, allocate ->s_blockgroup_lock, which fits nicely in an order-2
page in the worst case, separately. This shrinks down struct ext4_sb_info
enough to fit in a 2 KB slab cache, so now we allocate 16 KB + 2 KB instead
of 32 KB, saving 14 KB of memory.
Acked-by: Andreas Dilger <adilger@sun.com>
Signed-off-by: Pekka Enberg <penberg@cs.helsinki.fi>
Cc: <linux-ext4@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
Diffstat (limited to 'fs')
-rw-r--r-- | fs/ext4/ext4_sb.h | 4 | ||||
-rw-r--r-- | fs/ext4/super.c | 10 |
2 files changed, 11 insertions, 3 deletions
diff --git a/fs/ext4/ext4_sb.h b/fs/ext4/ext4_sb.h index e318f486cc2..4e4d9cc3f40 100644 --- a/fs/ext4/ext4_sb.h +++ b/fs/ext4/ext4_sb.h | |||
@@ -62,7 +62,7 @@ struct ext4_sb_info { | |||
62 | struct percpu_counter s_freeinodes_counter; | 62 | struct percpu_counter s_freeinodes_counter; |
63 | struct percpu_counter s_dirs_counter; | 63 | struct percpu_counter s_dirs_counter; |
64 | struct percpu_counter s_dirtyblocks_counter; | 64 | struct percpu_counter s_dirtyblocks_counter; |
65 | struct blockgroup_lock s_blockgroup_lock; | 65 | struct blockgroup_lock *s_blockgroup_lock; |
66 | struct proc_dir_entry *s_proc; | 66 | struct proc_dir_entry *s_proc; |
67 | 67 | ||
68 | /* Journaling */ | 68 | /* Journaling */ |
@@ -149,7 +149,7 @@ struct ext4_sb_info { | |||
149 | static inline spinlock_t * | 149 | static inline spinlock_t * |
150 | sb_bgl_lock(struct ext4_sb_info *sbi, unsigned int block_group) | 150 | sb_bgl_lock(struct ext4_sb_info *sbi, unsigned int block_group) |
151 | { | 151 | { |
152 | return bgl_lock_ptr(&sbi->s_blockgroup_lock, block_group); | 152 | return bgl_lock_ptr(sbi->s_blockgroup_lock, block_group); |
153 | } | 153 | } |
154 | 154 | ||
155 | #endif /* _EXT4_SB */ | 155 | #endif /* _EXT4_SB */ |
diff --git a/fs/ext4/super.c b/fs/ext4/super.c index f7371a6a923..a3768709ce0 100644 --- a/fs/ext4/super.c +++ b/fs/ext4/super.c | |||
@@ -615,6 +615,7 @@ static void ext4_put_super(struct super_block *sb) | |||
615 | ext4_blkdev_remove(sbi); | 615 | ext4_blkdev_remove(sbi); |
616 | } | 616 | } |
617 | sb->s_fs_info = NULL; | 617 | sb->s_fs_info = NULL; |
618 | kfree(sbi->s_blockgroup_lock); | ||
618 | kfree(sbi); | 619 | kfree(sbi); |
619 | return; | 620 | return; |
620 | } | 621 | } |
@@ -2021,6 +2022,13 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) | |||
2021 | sbi = kzalloc(sizeof(*sbi), GFP_KERNEL); | 2022 | sbi = kzalloc(sizeof(*sbi), GFP_KERNEL); |
2022 | if (!sbi) | 2023 | if (!sbi) |
2023 | return -ENOMEM; | 2024 | return -ENOMEM; |
2025 | |||
2026 | sbi->s_blockgroup_lock = | ||
2027 | kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL); | ||
2028 | if (!sbi->s_blockgroup_lock) { | ||
2029 | kfree(sbi); | ||
2030 | return -ENOMEM; | ||
2031 | } | ||
2024 | sb->s_fs_info = sbi; | 2032 | sb->s_fs_info = sbi; |
2025 | sbi->s_mount_opt = 0; | 2033 | sbi->s_mount_opt = 0; |
2026 | sbi->s_resuid = EXT4_DEF_RESUID; | 2034 | sbi->s_resuid = EXT4_DEF_RESUID; |
@@ -2332,7 +2340,7 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) | |||
2332 | &sbi->s_inode_readahead_blks); | 2340 | &sbi->s_inode_readahead_blks); |
2333 | #endif | 2341 | #endif |
2334 | 2342 | ||
2335 | bgl_lock_init(&sbi->s_blockgroup_lock); | 2343 | bgl_lock_init(sbi->s_blockgroup_lock); |
2336 | 2344 | ||
2337 | for (i = 0; i < db_count; i++) { | 2345 | for (i = 0; i < db_count; i++) { |
2338 | block = descriptor_loc(sb, logical_sb_block, i); | 2346 | block = descriptor_loc(sb, logical_sb_block, i); |