aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorTejun Heo <tj@kernel.org>2009-07-03 19:10:59 -0400
committerTejun Heo <tj@kernel.org>2009-07-03 19:10:59 -0400
commitd4b95f80399471e4bce5e992700ff7f06ef91f6a (patch)
treea7b97c549629ea1032c36a41048ea847a20b8d27
parent788e5abc5441e9046dd91c995c6f1f75bbd144bf (diff)
x86,percpu: generalize 4k first chunk allocator
Generalize and move x86 setup_pcpu_4k() into pcpu_4k_first_chunk(). setup_pcpu_4k() now is a simple wrapper around the generalized version. Other than taking size parameters and using arch supplied callbacks to allocate/free memory, pcpu_4k_first_chunk() is identical to the original implementation. This simplifies arch code and will help converting more archs to dynamic percpu allocator. While at it, s/pcpu_populate_pte_fn_t/pcpu_fc_populate_pte_fn_t/ for consistency. [ Impact: code reorganization and generalization ] Signed-off-by: Tejun Heo <tj@kernel.org> Cc: Ingo Molnar <mingo@elte.hu>
-rw-r--r--arch/x86/kernel/setup_percpu.c78
-rw-r--r--include/linux/percpu.h12
-rw-r--r--mm/percpu.c85
3 files changed, 113 insertions, 62 deletions
diff --git a/arch/x86/kernel/setup_percpu.c b/arch/x86/kernel/setup_percpu.c
index 14728206fb52..ab896b31e80b 100644
--- a/arch/x86/kernel/setup_percpu.c
+++ b/arch/x86/kernel/setup_percpu.c
@@ -124,6 +124,19 @@ static void * __init pcpu_alloc_bootmem(unsigned int cpu, unsigned long size,
124} 124}
125 125
126/* 126/*
127 * Helpers for first chunk memory allocation
128 */
129static void * __init pcpu_fc_alloc(unsigned int cpu, size_t size)
130{
131 return pcpu_alloc_bootmem(cpu, size, size);
132}
133
134static void __init pcpu_fc_free(void *ptr, size_t size)
135{
136 free_bootmem(__pa(ptr), size);
137}
138
139/*
127 * Large page remap allocator 140 * Large page remap allocator
128 * 141 *
129 * This allocator uses PMD page as unit. A PMD page is allocated for 142 * This allocator uses PMD page as unit. A PMD page is allocated for
@@ -346,22 +359,11 @@ static ssize_t __init setup_pcpu_embed(size_t static_size, bool chosen)
346} 359}
347 360
348/* 361/*
349 * 4k page allocator 362 * 4k allocator
350 * 363 *
351 * This is the basic allocator. Static percpu area is allocated 364 * Boring fallback 4k allocator. This allocator puts more pressure on
352 * page-by-page and most of initialization is done by the generic 365 * PTE TLBs but other than that behaves nicely on both UMA and NUMA.
353 * setup function.
354 */ 366 */
355static struct page **pcpu4k_pages __initdata;
356static int pcpu4k_nr_static_pages __initdata;
357
358static struct page * __init pcpu4k_get_page(unsigned int cpu, int pageno)
359{
360 if (pageno < pcpu4k_nr_static_pages)
361 return pcpu4k_pages[cpu * pcpu4k_nr_static_pages + pageno];
362 return NULL;
363}
364
365static void __init pcpu4k_populate_pte(unsigned long addr) 367static void __init pcpu4k_populate_pte(unsigned long addr)
366{ 368{
367 populate_extra_pte(addr); 369 populate_extra_pte(addr);
@@ -369,51 +371,9 @@ static void __init pcpu4k_populate_pte(unsigned long addr)
369 371
370static ssize_t __init setup_pcpu_4k(size_t static_size) 372static ssize_t __init setup_pcpu_4k(size_t static_size)
371{ 373{
372 size_t pages_size; 374 return pcpu_4k_first_chunk(static_size, PERCPU_FIRST_CHUNK_RESERVE,
373 unsigned int cpu; 375 pcpu_fc_alloc, pcpu_fc_free,
374 int i, j; 376 pcpu4k_populate_pte);
375 ssize_t ret;
376
377 pcpu4k_nr_static_pages = PFN_UP(static_size);
378
379 /* unaligned allocations can't be freed, round up to page size */
380 pages_size = PFN_ALIGN(pcpu4k_nr_static_pages * num_possible_cpus()
381 * sizeof(pcpu4k_pages[0]));
382 pcpu4k_pages = alloc_bootmem(pages_size);
383
384 /* allocate and copy */
385 j = 0;
386 for_each_possible_cpu(cpu)
387 for (i = 0; i < pcpu4k_nr_static_pages; i++) {
388 void *ptr;
389
390 ptr = pcpu_alloc_bootmem(cpu, PAGE_SIZE, PAGE_SIZE);
391 if (!ptr) {
392 pr_warning("PERCPU: failed to allocate "
393 "4k page for cpu%u\n", cpu);
394 goto enomem;
395 }
396
397 memcpy(ptr, __per_cpu_load + i * PAGE_SIZE, PAGE_SIZE);
398 pcpu4k_pages[j++] = virt_to_page(ptr);
399 }
400
401 /* we're ready, commit */
402 pr_info("PERCPU: Allocated %d 4k pages, static data %zu bytes\n",
403 pcpu4k_nr_static_pages, static_size);
404
405 ret = pcpu_setup_first_chunk(pcpu4k_get_page, static_size,
406 PERCPU_FIRST_CHUNK_RESERVE, -1,
407 -1, NULL, pcpu4k_populate_pte);
408 goto out_free_ar;
409
410enomem:
411 while (--j >= 0)
412 free_bootmem(__pa(page_address(pcpu4k_pages[j])), PAGE_SIZE);
413 ret = -ENOMEM;
414out_free_ar:
415 free_bootmem(__pa(pcpu4k_pages), pages_size);
416 return ret;
417} 377}
418 378
419/* for explicit first chunk allocator selection */ 379/* for explicit first chunk allocator selection */
diff --git a/include/linux/percpu.h b/include/linux/percpu.h
index 83bff053bd1c..41b5bfab4195 100644
--- a/include/linux/percpu.h
+++ b/include/linux/percpu.h
@@ -59,18 +59,26 @@
59extern void *pcpu_base_addr; 59extern void *pcpu_base_addr;
60 60
61typedef struct page * (*pcpu_get_page_fn_t)(unsigned int cpu, int pageno); 61typedef struct page * (*pcpu_get_page_fn_t)(unsigned int cpu, int pageno);
62typedef void (*pcpu_populate_pte_fn_t)(unsigned long addr); 62typedef void * (*pcpu_fc_alloc_fn_t)(unsigned int cpu, size_t size);
63typedef void (*pcpu_fc_free_fn_t)(void *ptr, size_t size);
64typedef void (*pcpu_fc_populate_pte_fn_t)(unsigned long addr);
63 65
64extern size_t __init pcpu_setup_first_chunk(pcpu_get_page_fn_t get_page_fn, 66extern size_t __init pcpu_setup_first_chunk(pcpu_get_page_fn_t get_page_fn,
65 size_t static_size, size_t reserved_size, 67 size_t static_size, size_t reserved_size,
66 ssize_t dyn_size, ssize_t unit_size, 68 ssize_t dyn_size, ssize_t unit_size,
67 void *base_addr, 69 void *base_addr,
68 pcpu_populate_pte_fn_t populate_pte_fn); 70 pcpu_fc_populate_pte_fn_t populate_pte_fn);
69 71
70extern ssize_t __init pcpu_embed_first_chunk( 72extern ssize_t __init pcpu_embed_first_chunk(
71 size_t static_size, size_t reserved_size, 73 size_t static_size, size_t reserved_size,
72 ssize_t dyn_size); 74 ssize_t dyn_size);
73 75
76extern ssize_t __init pcpu_4k_first_chunk(
77 size_t static_size, size_t reserved_size,
78 pcpu_fc_alloc_fn_t alloc_fn,
79 pcpu_fc_free_fn_t free_fn,
80 pcpu_fc_populate_pte_fn_t populate_pte_fn);
81
74/* 82/*
75 * Use this to get to a cpu's version of the per-cpu object 83 * Use this to get to a cpu's version of the per-cpu object
76 * dynamically allocated. Non-atomic access to the current CPU's 84 * dynamically allocated. Non-atomic access to the current CPU's
diff --git a/mm/percpu.c b/mm/percpu.c
index fc6babe6e554..27b0f40a3ea8 100644
--- a/mm/percpu.c
+++ b/mm/percpu.c
@@ -1037,7 +1037,7 @@ size_t __init pcpu_setup_first_chunk(pcpu_get_page_fn_t get_page_fn,
1037 size_t static_size, size_t reserved_size, 1037 size_t static_size, size_t reserved_size,
1038 ssize_t dyn_size, ssize_t unit_size, 1038 ssize_t dyn_size, ssize_t unit_size,
1039 void *base_addr, 1039 void *base_addr,
1040 pcpu_populate_pte_fn_t populate_pte_fn) 1040 pcpu_fc_populate_pte_fn_t populate_pte_fn)
1041{ 1041{
1042 static struct vm_struct first_vm; 1042 static struct vm_struct first_vm;
1043 static int smap[2], dmap[2]; 1043 static int smap[2], dmap[2];
@@ -1271,6 +1271,89 @@ ssize_t __init pcpu_embed_first_chunk(size_t static_size, size_t reserved_size,
1271} 1271}
1272 1272
1273/* 1273/*
1274 * 4k page first chunk setup helper.
1275 */
1276static struct page **pcpu4k_pages __initdata;
1277static int pcpu4k_nr_static_pages __initdata;
1278
1279static struct page * __init pcpu4k_get_page(unsigned int cpu, int pageno)
1280{
1281 if (pageno < pcpu4k_nr_static_pages)
1282 return pcpu4k_pages[cpu * pcpu4k_nr_static_pages + pageno];
1283 return NULL;
1284}
1285
1286/**
1287 * pcpu_4k_first_chunk - map the first chunk using PAGE_SIZE pages
1288 * @static_size: the size of static percpu area in bytes
1289 * @reserved_size: the size of reserved percpu area in bytes
1290 * @alloc_fn: function to allocate percpu page, always called with PAGE_SIZE
1291 * @free_fn: funtion to free percpu page, always called with PAGE_SIZE
1292 * @populate_pte_fn: function to populate pte
1293 *
1294 * This is a helper to ease setting up embedded first percpu chunk and
1295 * can be called where pcpu_setup_first_chunk() is expected.
1296 *
1297 * This is the basic allocator. Static percpu area is allocated
1298 * page-by-page into vmalloc area.
1299 *
1300 * RETURNS:
1301 * The determined pcpu_unit_size which can be used to initialize
1302 * percpu access on success, -errno on failure.
1303 */
1304ssize_t __init pcpu_4k_first_chunk(size_t static_size, size_t reserved_size,
1305 pcpu_fc_alloc_fn_t alloc_fn,
1306 pcpu_fc_free_fn_t free_fn,
1307 pcpu_fc_populate_pte_fn_t populate_pte_fn)
1308{
1309 size_t pages_size;
1310 unsigned int cpu;
1311 int i, j;
1312 ssize_t ret;
1313
1314 pcpu4k_nr_static_pages = PFN_UP(static_size);
1315
1316 /* unaligned allocations can't be freed, round up to page size */
1317 pages_size = PFN_ALIGN(pcpu4k_nr_static_pages * num_possible_cpus() *
1318 sizeof(pcpu4k_pages[0]));
1319 pcpu4k_pages = alloc_bootmem(pages_size);
1320
1321 /* allocate and copy */
1322 j = 0;
1323 for_each_possible_cpu(cpu)
1324 for (i = 0; i < pcpu4k_nr_static_pages; i++) {
1325 void *ptr;
1326
1327 ptr = alloc_fn(cpu, PAGE_SIZE);
1328 if (!ptr) {
1329 pr_warning("PERCPU: failed to allocate "
1330 "4k page for cpu%u\n", cpu);
1331 goto enomem;
1332 }
1333
1334 memcpy(ptr, __per_cpu_load + i * PAGE_SIZE, PAGE_SIZE);
1335 pcpu4k_pages[j++] = virt_to_page(ptr);
1336 }
1337
1338 /* we're ready, commit */
1339 pr_info("PERCPU: Allocated %d 4k pages, static data %zu bytes\n",
1340 pcpu4k_nr_static_pages, static_size);
1341
1342 ret = pcpu_setup_first_chunk(pcpu4k_get_page, static_size,
1343 reserved_size, -1,
1344 -1, NULL, populate_pte_fn);
1345 goto out_free_ar;
1346
1347enomem:
1348 while (--j >= 0)
1349 free_fn(page_address(pcpu4k_pages[j]), PAGE_SIZE);
1350 ret = -ENOMEM;
1351out_free_ar:
1352 free_bootmem(__pa(pcpu4k_pages), pages_size);
1353 return ret;
1354}
1355
1356/*
1274 * Generic percpu area setup. 1357 * Generic percpu area setup.
1275 * 1358 *
1276 * The embedding helper is used because its behavior closely resembles 1359 * The embedding helper is used because its behavior closely resembles