diff options
author | Yinghai Lu <yhlu.kernel@gmail.com> | 2008-04-13 14:51:06 -0400 |
---|---|---|
committer | Ingo Molnar <mingo@elte.hu> | 2008-04-26 16:51:07 -0400 |
commit | e123dd3f0ec1664576456ea1ea045591a0a95f0c (patch) | |
tree | b73895fd0750749a1b0d85599ca02da4a920c9c0 | |
parent | 539a5fe22620a1665cce504167953a71a43232ad (diff) |
mm: make mem_map allocation continuous
vmemmap allocation currently has this layout:
[ffffe20000000000-ffffe200001fffff] PMD ->ffff810001400000 on node 0
[ffffe20000200000-ffffe200003fffff] PMD ->ffff810001800000 on node 0
[ffffe20000400000-ffffe200005fffff] PMD ->ffff810001c00000 on node 0
[ffffe20000600000-ffffe200007fffff] PMD ->ffff810002000000 on node 0
[ffffe20000800000-ffffe200009fffff] PMD ->ffff810002400000 on node 0
...
note that there is a 2M hole between them - not optimal.
the root cause is that usemap (24 bytes) will be allocated after every 2M
mem_map, and it will push next vmemmap (2M) to the next (2M) alignment.
solution: try to allocate the mem_map continously.
after the patch, we get:
[ffffe20000000000-ffffe200001fffff] PMD ->ffff810001400000 on node 0
[ffffe20000200000-ffffe200003fffff] PMD ->ffff810001600000 on node 0
[ffffe20000400000-ffffe200005fffff] PMD ->ffff810001800000 on node 0
[ffffe20000600000-ffffe200007fffff] PMD ->ffff810001a00000 on node 0
[ffffe20000800000-ffffe200009fffff] PMD ->ffff810001c00000 on node 0
...
which is the ideal layout.
and usemap will share a page because of they are allocated continuously too:
sparse_early_usemap_alloc: usemap = ffff810024e00000 size = 24
sparse_early_usemap_alloc: usemap = ffff810024e00080 size = 24
sparse_early_usemap_alloc: usemap = ffff810024e00100 size = 24
sparse_early_usemap_alloc: usemap = ffff810024e00180 size = 24
...
so we make the bootmem allocation more compact and use less memory
for usemap => mission accomplished ;-)
Signed-off-by: Yinghai Lu <yhlu.kernel@gmail.com>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
-rw-r--r-- | mm/sparse.c | 32 |
1 files changed, 29 insertions, 3 deletions
diff --git a/mm/sparse.c b/mm/sparse.c index 98d6b39c3472..458109b99e61 100644 --- a/mm/sparse.c +++ b/mm/sparse.c | |||
@@ -304,22 +304,48 @@ void __init sparse_init(void) | |||
304 | unsigned long pnum; | 304 | unsigned long pnum; |
305 | struct page *map; | 305 | struct page *map; |
306 | unsigned long *usemap; | 306 | unsigned long *usemap; |
307 | unsigned long **usemap_map; | ||
308 | int size; | ||
309 | |||
310 | /* | ||
311 | * map is using big page (aka 2M in x86 64 bit) | ||
312 | * usemap is less one page (aka 24 bytes) | ||
313 | * so alloc 2M (with 2M align) and 24 bytes in turn will | ||
314 | * make next 2M slip to one more 2M later. | ||
315 | * then in big system, the memory will have a lot of holes... | ||
316 | * here try to allocate 2M pages continously. | ||
317 | * | ||
318 | * powerpc need to call sparse_init_one_section right after each | ||
319 | * sparse_early_mem_map_alloc, so allocate usemap_map at first. | ||
320 | */ | ||
321 | size = sizeof(unsigned long *) * NR_MEM_SECTIONS; | ||
322 | usemap_map = alloc_bootmem(size); | ||
323 | if (!usemap_map) | ||
324 | panic("can not allocate usemap_map\n"); | ||
307 | 325 | ||
308 | for (pnum = 0; pnum < NR_MEM_SECTIONS; pnum++) { | 326 | for (pnum = 0; pnum < NR_MEM_SECTIONS; pnum++) { |
309 | if (!present_section_nr(pnum)) | 327 | if (!present_section_nr(pnum)) |
310 | continue; | 328 | continue; |
329 | usemap_map[pnum] = sparse_early_usemap_alloc(pnum); | ||
330 | } | ||
311 | 331 | ||
312 | map = sparse_early_mem_map_alloc(pnum); | 332 | for (pnum = 0; pnum < NR_MEM_SECTIONS; pnum++) { |
313 | if (!map) | 333 | if (!present_section_nr(pnum)) |
314 | continue; | 334 | continue; |
315 | 335 | ||
316 | usemap = sparse_early_usemap_alloc(pnum); | 336 | usemap = usemap_map[pnum]; |
317 | if (!usemap) | 337 | if (!usemap) |
318 | continue; | 338 | continue; |
319 | 339 | ||
340 | map = sparse_early_mem_map_alloc(pnum); | ||
341 | if (!map) | ||
342 | continue; | ||
343 | |||
320 | sparse_init_one_section(__nr_to_section(pnum), pnum, map, | 344 | sparse_init_one_section(__nr_to_section(pnum), pnum, map, |
321 | usemap); | 345 | usemap); |
322 | } | 346 | } |
347 | |||
348 | free_bootmem(__pa(usemap_map), size); | ||
323 | } | 349 | } |
324 | 350 | ||
325 | #ifdef CONFIG_MEMORY_HOTPLUG | 351 | #ifdef CONFIG_MEMORY_HOTPLUG |