aboutsummaryrefslogtreecommitdiffstats
path: root/arch/x86/kernel
diff options
context:
space:
mode:
authorYinghai Lu <yhlu.kernel@gmail.com>2008-03-07 18:02:50 -0500
committerIngo Molnar <mingo@elte.hu>2008-04-19 13:19:55 -0400
commit752bea4abbff5e3ffef36802b860e80d0b632990 (patch)
tree4ffb673c7b03700d3eefc3a3954d80dfd50a6ebf /arch/x86/kernel
parent6ec6e0d9f2fd7cb6ca6bc3bfab5ae7b5cdd8c36f (diff)
x86: reserve dma32 early for gart
A system with 256 GB of RAM crashes in the following way when NUMA is disabled: Your BIOS doesn't leave a aperture memory hole Please enable the IOMMU option in the BIOS setup This costs you 64 MB of RAM Cannot allocate aperture memory hole (ffff8101c0000000,65536K) Kernel panic - not syncing: Not enough memory for aperture Pid: 0, comm: swapper Not tainted 2.6.25-rc4-x86-latest.git #33 Call Trace: [<ffffffff84037c62>] panic+0xb2/0x190 [<ffffffff840381fc>] ? release_console_sem+0x7c/0x250 [<ffffffff847b1628>] ? __alloc_bootmem_nopanic+0x48/0x90 [<ffffffff847b0ac9>] ? free_bootmem+0x29/0x50 [<ffffffff847ac1f7>] gart_iommu_hole_init+0x5e7/0x680 [<ffffffff847b255b>] ? alloc_large_system_hash+0x16b/0x310 [<ffffffff84506a2f>] ? _etext+0x0/0x1 [<ffffffff847a2e8c>] pci_iommu_alloc+0x1c/0x40 [<ffffffff847ac795>] mem_init+0x45/0x1a0 [<ffffffff8479ff35>] start_kernel+0x295/0x380 [<ffffffff8479f1c2>] _sinittext+0x1c2/0x230 The root cause is: memmap PMD is too big, [ffffe200e0600000-ffffe200e07fffff] PMD ->ffff81383c000000 on node 0 almost near 4G..., and vmemmap_alloc_block will use up the RAM under 4G. Possible solutions: 1. make the memmap allocation get memory above 4G... 2. reserve some dma32 range early, before we try to set up the memmap for all memory, and release it before pci_iommu_alloc, so that gart or swiotlb can be sure to get some range under the 4G limit. This patch uses method 2, because method 1 may need more code to handle SPARSEMEM and SPARSEMEM_VMEMMAP. With the patch applied we get: Your BIOS doesn't leave a aperture memory hole Please enable the IOMMU option in the BIOS setup This costs you 64 MB of RAM Mapping aperture over 65536 KB of RAM @ 4000000 Memory: 264245736k/268959744k available (8484k kernel code, 4187464k reserved, 4004k data, 724k init) Signed-off-by: Yinghai Lu <yhlu.kernel@gmail.com> Signed-off-by: Ingo Molnar <mingo@elte.hu> Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Diffstat (limited to 'arch/x86/kernel')
-rw-r--r--arch/x86/kernel/pci-dma_64.c49
-rw-r--r--arch/x86/kernel/setup_64.c2
2 files changed, 51 insertions, 0 deletions
diff --git a/arch/x86/kernel/pci-dma_64.c b/arch/x86/kernel/pci-dma_64.c
index ada5a0604992..e4fffaabe53b 100644
--- a/arch/x86/kernel/pci-dma_64.c
+++ b/arch/x86/kernel/pci-dma_64.c
@@ -8,6 +8,8 @@
8#include <linux/pci.h> 8#include <linux/pci.h>
9#include <linux/module.h> 9#include <linux/module.h>
10#include <linux/dmar.h> 10#include <linux/dmar.h>
11#include <linux/bootmem.h>
12#include <asm/proto.h>
11#include <asm/io.h> 13#include <asm/io.h>
12#include <asm/gart.h> 14#include <asm/gart.h>
13#include <asm/calgary.h> 15#include <asm/calgary.h>
@@ -286,8 +288,55 @@ static __init int iommu_setup(char *p)
286} 288}
287early_param("iommu", iommu_setup); 289early_param("iommu", iommu_setup);
288 290
/*
 * Pointer to the bootmem block reserved by dma32_reserve_bootmem();
 * reset to NULL by dma32_free_bootmem() once the block has been released.
 */
291static __initdata void *dma32_bootmem_ptr;
/*
 * Requested size of the early reservation in bytes. Defaults to
 * 128ULL<<20 (128 MB) and can be overridden with the "dma32_size"
 * early parameter; dma32_reserve_bootmem() later rewrites it with the
 * size actually reserved (or 0 on failure).
 */
292static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
293
/*
 * Early-parameter handler for "dma32_size=".
 *
 * @p: argument string supplied for the parameter, may be NULL.
 *
 * Stores the value parsed by memparse() into dma32_bootmem_size.
 * Returns -EINVAL when no argument string is given, 0 otherwise.
 */
294static int __init parse_dma32_size_opt(char *p)
295{
296 if (!p)
297 return -EINVAL;
298 dma32_bootmem_size = memparse(p, &p);
299 return 0;
300}
301early_param("dma32_size", parse_dma32_size_opt);
302
/*
 * Reserve a block of bootmem early so that it is still available when the
 * IOMMU code (gart/swiotlb, per the commit description) needs memory below
 * the 4G limit; the block is handed back by dma32_free_bootmem().
 *
 * Does nothing when end_pfn <= MAX_DMA32_PFN (presumably: no RAM above the
 * DMA32 boundary - confirm against the MAX_DMA32_PFN definition).
 * On success dma32_bootmem_ptr/dma32_bootmem_size describe the reserved
 * block; on allocation failure the pointer is NULL and the size is set to 0.
 */
303void __init dma32_reserve_bootmem(void)
304{
305 unsigned long size, align;
306 if (end_pfn <= MAX_DMA32_PFN)
307 return;
308
/* 64 MB alignment; the requested size is rounded up to a multiple of it */
309 align = 64ULL<<20;
310 size = round_up(dma32_bootmem_size, align);
/* non-panicking allocation, with __pa(MAX_DMA_ADDRESS) passed as the goal */
311 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
312 __pa(MAX_DMA_ADDRESS));
/* remember the rounded-up size so the matching free releases all of it */
313 if (dma32_bootmem_ptr)
314 dma32_bootmem_size = size;
315 else
316 dma32_bootmem_size = 0;
317}
/*
 * Release the block reserved by dma32_reserve_bootmem() and clear the
 * bookkeeping variables. Called from pci_iommu_alloc() before the IOMMU
 * setup functions run.
 *
 * No-op when end_pfn <= MAX_DMA32_PFN or when nothing was reserved.
 */
318static void __init dma32_free_bootmem(void)
319{
320 int node;
321
322 if (end_pfn <= MAX_DMA32_PFN)
323 return;
324
325 if (!dma32_bootmem_ptr)
326 return;
327
/*
 * NOTE(review): the same physical range is passed to free_bootmem_node()
 * for every online node - this presumably relies on the call being
 * harmless for nodes that do not contain the range; confirm against the
 * bootmem implementation.
 */
328 for_each_online_node(node)
329 free_bootmem_node(NODE_DATA(node), __pa(dma32_bootmem_ptr),
330 dma32_bootmem_size);
331
/* mark the reservation as gone so a repeated call does nothing */
332 dma32_bootmem_ptr = NULL;
333 dma32_bootmem_size = 0;
334}
335
289void __init pci_iommu_alloc(void) 336void __init pci_iommu_alloc(void)
290{ 337{
338 /* free the range so iommu could get some range less than 4G */
339 dma32_free_bootmem();
291 /* 340 /*
292 * The order of these functions is important for 341 * The order of these functions is important for
293 * fall-back/fail-over reasons 342 * fall-back/fail-over reasons
diff --git a/arch/x86/kernel/setup_64.c b/arch/x86/kernel/setup_64.c
index 0aa291bff4e0..6b8e11f0c15d 100644
--- a/arch/x86/kernel/setup_64.c
+++ b/arch/x86/kernel/setup_64.c
@@ -398,6 +398,8 @@ void __init setup_arch(char **cmdline_p)
398 398
399 early_res_to_bootmem(); 399 early_res_to_bootmem();
400 400
401 dma32_reserve_bootmem();
402
401#ifdef CONFIG_ACPI_SLEEP 403#ifdef CONFIG_ACPI_SLEEP
402 /* 404 /*
403 * Reserve low memory region for sleep support. 405 * Reserve low memory region for sleep support.