diff options
author | Ken'ichi Ohmichi <oomichi@mxs.nes.nec.co.jp> | 2007-10-17 02:27:27 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@woody.linux-foundation.org> | 2007-10-17 11:42:54 -0400 |
commit | fd59d231f81cb02870b9cf15f456a897f3669b4e (patch) | |
tree | 5713c13bd678774f1ba3c42bfff5008c1812deae | |
parent | 0e647c04f665e9b3451a1ebe8252b38ffe0207c8 (diff) |
Add vmcoreinfo
This patch set removes the requirement that makedumpfile users install a
vmlinux file (including the debugging information) on each system.
The makedumpfile command is the dump filtering feature for kdump. It creates a
small dumpfile by filtering out pages that are unnecessary for the analysis. To
distinguish unnecessary pages, it needs a vmlinux file including the debugging
information. These days, the debugging package has become a huge file, and it
is hard to install it on each system.
To solve the problem, kdump developers discussed it on lkml and kexec-ml. As
a result, we reached the conclusion that the information necessary for dump
filtering (called "vmcoreinfo") should be embedded into the first kernel file
and should be accessed through /proc/vmcore while the second kernel is running.
(http://www.uwsg.iu.edu/hypermail/linux/kernel/0707.0/1806.html)
Dan Aloni created the patch set for the above implementation.
(http://www.uwsg.iu.edu/hypermail/linux/kernel/0707.1/1053.html)
And I updated it for multiple architectures and memory models.
(http://lists.infradead.org/pipermail/kexec/2007-August/000479.html)
Signed-off-by: Dan Aloni <da-x@monatomic.org>
Signed-off-by: Ken'ichi Ohmichi <oomichi@mxs.nes.nec.co.jp>
Signed-off-by: Bernhard Walle <bwalle@suse.de>
Signed-off-by: Daisuke Nishimura <nishimura@mxp.nes.nec.co.jp>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
-rw-r--r-- | arch/ia64/kernel/machine_kexec.c | 30 | ||||
-rw-r--r-- | arch/ia64/mm/discontig.c | 2 | ||||
-rw-r--r-- | arch/x86/kernel/machine_kexec_32.c | 13 | ||||
-rw-r--r-- | arch/x86/kernel/machine_kexec_64.c | 9 | ||||
-rw-r--r-- | include/asm-ia64/numa.h | 1 | ||||
-rw-r--r-- | include/linux/kexec.h | 26 | ||||
-rw-r--r-- | kernel/kexec.c | 110 | ||||
-rw-r--r-- | kernel/ksysfs.c | 10 |
8 files changed, 200 insertions, 1 deletions
diff --git a/arch/ia64/kernel/machine_kexec.c b/arch/ia64/kernel/machine_kexec.c index 58e943a5d95c..40f9c3e19220 100644 --- a/arch/ia64/kernel/machine_kexec.c +++ b/arch/ia64/kernel/machine_kexec.c | |||
@@ -15,6 +15,8 @@ | |||
15 | #include <linux/cpu.h> | 15 | #include <linux/cpu.h> |
16 | #include <linux/irq.h> | 16 | #include <linux/irq.h> |
17 | #include <linux/efi.h> | 17 | #include <linux/efi.h> |
18 | #include <linux/numa.h> | ||
19 | #include <linux/mmzone.h> | ||
18 | #include <asm/mmu_context.h> | 20 | #include <asm/mmu_context.h> |
19 | #include <asm/setup.h> | 21 | #include <asm/setup.h> |
20 | #include <asm/delay.h> | 22 | #include <asm/delay.h> |
@@ -121,3 +123,31 @@ void machine_kexec(struct kimage *image) | |||
121 | unw_init_running(ia64_machine_kexec, image); | 123 | unw_init_running(ia64_machine_kexec, image); |
122 | for(;;); | 124 | for(;;); |
123 | } | 125 | } |
126 | |||
127 | void arch_crash_save_vmcoreinfo(void) | ||
128 | { | ||
129 | #ifdef CONFIG_ARCH_DISCONTIGMEM_ENABLE | ||
130 | SYMBOL(pgdat_list); | ||
131 | LENGTH(pgdat_list, MAX_NUMNODES); | ||
132 | |||
133 | SYMBOL(node_memblk); | ||
134 | LENGTH(node_memblk, NR_NODE_MEMBLKS); | ||
135 | SIZE(node_memblk_s); | ||
136 | OFFSET(node_memblk_s, start_paddr); | ||
137 | OFFSET(node_memblk_s, size); | ||
138 | #endif | ||
139 | #ifdef CONFIG_PGTABLE_3 | ||
140 | CONFIG(PGTABLE_3); | ||
141 | #elif CONFIG_PGTABLE_4 | ||
142 | CONFIG(PGTABLE_4); | ||
143 | #endif | ||
144 | } | ||
145 | |||
146 | unsigned long paddr_vmcoreinfo_note(void) | ||
147 | { | ||
148 | unsigned long vaddr, paddr; | ||
149 | vaddr = (unsigned long)(char *)&vmcoreinfo_note; | ||
150 | asm volatile ("tpa %0 = %1" : "=r"(paddr) : "r"(vaddr) : "memory"); | ||
151 | return paddr; | ||
152 | } | ||
153 | |||
diff --git a/arch/ia64/mm/discontig.c b/arch/ia64/mm/discontig.c index 5628067a74d2..0b567398f38e 100644 --- a/arch/ia64/mm/discontig.c +++ b/arch/ia64/mm/discontig.c | |||
@@ -48,7 +48,7 @@ struct early_node_data { | |||
48 | static struct early_node_data mem_data[MAX_NUMNODES] __initdata; | 48 | static struct early_node_data mem_data[MAX_NUMNODES] __initdata; |
49 | static nodemask_t memory_less_mask __initdata; | 49 | static nodemask_t memory_less_mask __initdata; |
50 | 50 | ||
51 | static pg_data_t *pgdat_list[MAX_NUMNODES]; | 51 | pg_data_t *pgdat_list[MAX_NUMNODES]; |
52 | 52 | ||
53 | /* | 53 | /* |
54 | * To prevent cache aliasing effects, align per-node structures so that they | 54 | * To prevent cache aliasing effects, align per-node structures so that they |
diff --git a/arch/x86/kernel/machine_kexec_32.c b/arch/x86/kernel/machine_kexec_32.c index deda9a221cf2..ae20fa5afa62 100644 --- a/arch/x86/kernel/machine_kexec_32.c +++ b/arch/x86/kernel/machine_kexec_32.c | |||
@@ -10,6 +10,7 @@ | |||
10 | #include <linux/kexec.h> | 10 | #include <linux/kexec.h> |
11 | #include <linux/delay.h> | 11 | #include <linux/delay.h> |
12 | #include <linux/init.h> | 12 | #include <linux/init.h> |
13 | #include <linux/numa.h> | ||
13 | #include <asm/pgtable.h> | 14 | #include <asm/pgtable.h> |
14 | #include <asm/pgalloc.h> | 15 | #include <asm/pgalloc.h> |
15 | #include <asm/tlbflush.h> | 16 | #include <asm/tlbflush.h> |
@@ -169,3 +170,15 @@ static int __init parse_crashkernel(char *arg) | |||
169 | return 0; | 170 | return 0; |
170 | } | 171 | } |
171 | early_param("crashkernel", parse_crashkernel); | 172 | early_param("crashkernel", parse_crashkernel); |
173 | |||
174 | void arch_crash_save_vmcoreinfo(void) | ||
175 | { | ||
176 | #ifdef CONFIG_ARCH_DISCONTIGMEM_ENABLE | ||
177 | SYMBOL(node_data); | ||
178 | LENGTH(node_data, MAX_NUMNODES); | ||
179 | #endif | ||
180 | #ifdef CONFIG_X86_PAE | ||
181 | CONFIG(X86_PAE); | ||
182 | #endif | ||
183 | } | ||
184 | |||
diff --git a/arch/x86/kernel/machine_kexec_64.c b/arch/x86/kernel/machine_kexec_64.c index cd1899a2f0c5..e333ea110a58 100644 --- a/arch/x86/kernel/machine_kexec_64.c +++ b/arch/x86/kernel/machine_kexec_64.c | |||
@@ -10,6 +10,7 @@ | |||
10 | #include <linux/kexec.h> | 10 | #include <linux/kexec.h> |
11 | #include <linux/string.h> | 11 | #include <linux/string.h> |
12 | #include <linux/reboot.h> | 12 | #include <linux/reboot.h> |
13 | #include <linux/numa.h> | ||
13 | #include <asm/pgtable.h> | 14 | #include <asm/pgtable.h> |
14 | #include <asm/tlbflush.h> | 15 | #include <asm/tlbflush.h> |
15 | #include <asm/mmu_context.h> | 16 | #include <asm/mmu_context.h> |
@@ -257,3 +258,11 @@ static int __init setup_crashkernel(char *arg) | |||
257 | } | 258 | } |
258 | early_param("crashkernel", setup_crashkernel); | 259 | early_param("crashkernel", setup_crashkernel); |
259 | 260 | ||
261 | void arch_crash_save_vmcoreinfo(void) | ||
262 | { | ||
263 | #ifdef CONFIG_ARCH_DISCONTIGMEM_ENABLE | ||
264 | SYMBOL(node_data); | ||
265 | LENGTH(node_data, MAX_NUMNODES); | ||
266 | #endif | ||
267 | } | ||
268 | |||
diff --git a/include/asm-ia64/numa.h b/include/asm-ia64/numa.h index 7d5e2ccc37a0..6a8a27cfae3e 100644 --- a/include/asm-ia64/numa.h +++ b/include/asm-ia64/numa.h | |||
@@ -24,6 +24,7 @@ | |||
24 | 24 | ||
25 | extern u16 cpu_to_node_map[NR_CPUS] __cacheline_aligned; | 25 | extern u16 cpu_to_node_map[NR_CPUS] __cacheline_aligned; |
26 | extern cpumask_t node_to_cpu_mask[MAX_NUMNODES] __cacheline_aligned; | 26 | extern cpumask_t node_to_cpu_mask[MAX_NUMNODES] __cacheline_aligned; |
27 | extern pg_data_t *pgdat_list[MAX_NUMNODES]; | ||
27 | 28 | ||
28 | /* Stuff below this line could be architecture independent */ | 29 | /* Stuff below this line could be architecture independent */ |
29 | 30 | ||
diff --git a/include/linux/kexec.h b/include/linux/kexec.h index 8c2c7fcd58ce..99f2d6f0c83a 100644 --- a/include/linux/kexec.h +++ b/include/linux/kexec.h | |||
@@ -121,6 +121,23 @@ extern struct page *kimage_alloc_control_pages(struct kimage *image, | |||
121 | extern void crash_kexec(struct pt_regs *); | 121 | extern void crash_kexec(struct pt_regs *); |
122 | int kexec_should_crash(struct task_struct *); | 122 | int kexec_should_crash(struct task_struct *); |
123 | void crash_save_cpu(struct pt_regs *regs, int cpu); | 123 | void crash_save_cpu(struct pt_regs *regs, int cpu); |
124 | void crash_save_vmcoreinfo(void); | ||
125 | void arch_crash_save_vmcoreinfo(void); | ||
126 | void vmcoreinfo_append_str(const char *fmt, ...); | ||
127 | unsigned long paddr_vmcoreinfo_note(void); | ||
128 | |||
129 | #define SYMBOL(name) \ | ||
130 | vmcoreinfo_append_str("SYMBOL(%s)=%lx\n", #name, (unsigned long)&name) | ||
131 | #define SIZE(name) \ | ||
132 | vmcoreinfo_append_str("SIZE(%s)=%d\n", #name, sizeof(struct name)) | ||
133 | #define OFFSET(name, field) \ | ||
134 | vmcoreinfo_append_str("OFFSET(%s.%s)=%d\n", #name, #field, \ | ||
135 | &(((struct name *)0)->field)) | ||
136 | #define LENGTH(name, value) \ | ||
137 | vmcoreinfo_append_str("LENGTH(%s)=%d\n", #name, value) | ||
138 | #define CONFIG(name) \ | ||
139 | vmcoreinfo_append_str("CONFIG_%s=y\n", #name) | ||
140 | |||
124 | extern struct kimage *kexec_image; | 141 | extern struct kimage *kexec_image; |
125 | extern struct kimage *kexec_crash_image; | 142 | extern struct kimage *kexec_crash_image; |
126 | 143 | ||
@@ -148,11 +165,20 @@ extern struct kimage *kexec_crash_image; | |||
148 | 165 | ||
149 | #define KEXEC_FLAGS (KEXEC_ON_CRASH) /* List of defined/legal kexec flags */ | 166 | #define KEXEC_FLAGS (KEXEC_ON_CRASH) /* List of defined/legal kexec flags */ |
150 | 167 | ||
168 | #define VMCOREINFO_BYTES (4096) | ||
169 | #define VMCOREINFO_NOTE_NAME "VMCOREINFO" | ||
170 | #define VMCOREINFO_NOTE_NAME_BYTES ALIGN(sizeof(VMCOREINFO_NOTE_NAME), 4) | ||
171 | #define VMCOREINFO_NOTE_SIZE (KEXEC_NOTE_HEAD_BYTES*2 + VMCOREINFO_BYTES \ | ||
172 | + VMCOREINFO_NOTE_NAME_BYTES) | ||
173 | |||
151 | /* Location of a reserved region to hold the crash kernel. | 174 | /* Location of a reserved region to hold the crash kernel. |
152 | */ | 175 | */ |
153 | extern struct resource crashk_res; | 176 | extern struct resource crashk_res; |
154 | typedef u32 note_buf_t[KEXEC_NOTE_BYTES/4]; | 177 | typedef u32 note_buf_t[KEXEC_NOTE_BYTES/4]; |
155 | extern note_buf_t *crash_notes; | 178 | extern note_buf_t *crash_notes; |
179 | extern u32 vmcoreinfo_note[VMCOREINFO_NOTE_SIZE/4]; | ||
180 | extern unsigned int vmcoreinfo_size; | ||
181 | extern unsigned int vmcoreinfo_max_size; | ||
156 | 182 | ||
157 | 183 | ||
158 | #else /* !CONFIG_KEXEC */ | 184 | #else /* !CONFIG_KEXEC */ |
diff --git a/kernel/kexec.c b/kernel/kexec.c index d8de12e943cf..67828befbfc3 100644 --- a/kernel/kexec.c +++ b/kernel/kexec.c | |||
@@ -21,16 +21,26 @@ | |||
21 | #include <linux/hardirq.h> | 21 | #include <linux/hardirq.h> |
22 | #include <linux/elf.h> | 22 | #include <linux/elf.h> |
23 | #include <linux/elfcore.h> | 23 | #include <linux/elfcore.h> |
24 | #include <linux/utsrelease.h> | ||
25 | #include <linux/utsname.h> | ||
26 | #include <linux/numa.h> | ||
24 | 27 | ||
25 | #include <asm/page.h> | 28 | #include <asm/page.h> |
26 | #include <asm/uaccess.h> | 29 | #include <asm/uaccess.h> |
27 | #include <asm/io.h> | 30 | #include <asm/io.h> |
28 | #include <asm/system.h> | 31 | #include <asm/system.h> |
29 | #include <asm/semaphore.h> | 32 | #include <asm/semaphore.h> |
33 | #include <asm/sections.h> | ||
30 | 34 | ||
31 | /* Per cpu memory for storing cpu states in case of system crash. */ | 35 | /* Per cpu memory for storing cpu states in case of system crash. */ |
32 | note_buf_t* crash_notes; | 36 | note_buf_t* crash_notes; |
33 | 37 | ||
38 | /* vmcoreinfo stuff */ | ||
39 | unsigned char vmcoreinfo_data[VMCOREINFO_BYTES]; | ||
40 | u32 vmcoreinfo_note[VMCOREINFO_NOTE_SIZE/4]; | ||
41 | unsigned int vmcoreinfo_size = 0; | ||
42 | unsigned int vmcoreinfo_max_size = sizeof(vmcoreinfo_data); | ||
43 | |||
34 | /* Location of the reserved area for the crash kernel */ | 44 | /* Location of the reserved area for the crash kernel */ |
35 | struct resource crashk_res = { | 45 | struct resource crashk_res = { |
36 | .name = "Crash kernel", | 46 | .name = "Crash kernel", |
@@ -1060,6 +1070,7 @@ void crash_kexec(struct pt_regs *regs) | |||
1060 | if (kexec_crash_image) { | 1070 | if (kexec_crash_image) { |
1061 | struct pt_regs fixed_regs; | 1071 | struct pt_regs fixed_regs; |
1062 | crash_setup_regs(&fixed_regs, regs); | 1072 | crash_setup_regs(&fixed_regs, regs); |
1073 | crash_save_vmcoreinfo(); | ||
1063 | machine_crash_shutdown(&fixed_regs); | 1074 | machine_crash_shutdown(&fixed_regs); |
1064 | machine_kexec(kexec_crash_image); | 1075 | machine_kexec(kexec_crash_image); |
1065 | } | 1076 | } |
@@ -1134,3 +1145,102 @@ static int __init crash_notes_memory_init(void) | |||
1134 | return 0; | 1145 | return 0; |
1135 | } | 1146 | } |
1136 | module_init(crash_notes_memory_init) | 1147 | module_init(crash_notes_memory_init) |
1148 | |||
1149 | void crash_save_vmcoreinfo(void) | ||
1150 | { | ||
1151 | u32 *buf; | ||
1152 | |||
1153 | if (!vmcoreinfo_size) | ||
1154 | return; | ||
1155 | |||
1156 | vmcoreinfo_append_str("CRASHTIME=%d", xtime.tv_sec); | ||
1157 | |||
1158 | buf = (u32 *)vmcoreinfo_note; | ||
1159 | |||
1160 | buf = append_elf_note(buf, VMCOREINFO_NOTE_NAME, 0, vmcoreinfo_data, | ||
1161 | vmcoreinfo_size); | ||
1162 | |||
1163 | final_note(buf); | ||
1164 | } | ||
1165 | |||
1166 | void vmcoreinfo_append_str(const char *fmt, ...) | ||
1167 | { | ||
1168 | va_list args; | ||
1169 | char buf[0x50]; | ||
1170 | int r; | ||
1171 | |||
1172 | va_start(args, fmt); | ||
1173 | r = vsnprintf(buf, sizeof(buf), fmt, args); | ||
1174 | va_end(args); | ||
1175 | |||
1176 | if (r + vmcoreinfo_size > vmcoreinfo_max_size) | ||
1177 | r = vmcoreinfo_max_size - vmcoreinfo_size; | ||
1178 | |||
1179 | memcpy(&vmcoreinfo_data[vmcoreinfo_size], buf, r); | ||
1180 | |||
1181 | vmcoreinfo_size += r; | ||
1182 | } | ||
1183 | |||
1184 | /* | ||
1185 | * provide an empty default implementation here -- architecture | ||
1186 | * code may override this | ||
1187 | */ | ||
1188 | void __attribute__ ((weak)) arch_crash_save_vmcoreinfo(void) | ||
1189 | {} | ||
1190 | |||
1191 | unsigned long __attribute__ ((weak)) paddr_vmcoreinfo_note(void) | ||
1192 | { | ||
1193 | return __pa((unsigned long)(char *)&vmcoreinfo_note); | ||
1194 | } | ||
1195 | |||
1196 | static int __init crash_save_vmcoreinfo_init(void) | ||
1197 | { | ||
1198 | vmcoreinfo_append_str("OSRELEASE=%s\n", UTS_RELEASE); | ||
1199 | vmcoreinfo_append_str("PAGESIZE=%d\n", PAGE_SIZE); | ||
1200 | |||
1201 | SYMBOL(init_uts_ns); | ||
1202 | SYMBOL(node_online_map); | ||
1203 | SYMBOL(swapper_pg_dir); | ||
1204 | SYMBOL(_stext); | ||
1205 | |||
1206 | #ifndef CONFIG_NEED_MULTIPLE_NODES | ||
1207 | SYMBOL(mem_map); | ||
1208 | SYMBOL(contig_page_data); | ||
1209 | #endif | ||
1210 | #ifdef CONFIG_SPARSEMEM | ||
1211 | SYMBOL(mem_section); | ||
1212 | LENGTH(mem_section, NR_SECTION_ROOTS); | ||
1213 | SIZE(mem_section); | ||
1214 | OFFSET(mem_section, section_mem_map); | ||
1215 | #endif | ||
1216 | SIZE(page); | ||
1217 | SIZE(pglist_data); | ||
1218 | SIZE(zone); | ||
1219 | SIZE(free_area); | ||
1220 | SIZE(list_head); | ||
1221 | OFFSET(page, flags); | ||
1222 | OFFSET(page, _count); | ||
1223 | OFFSET(page, mapping); | ||
1224 | OFFSET(page, lru); | ||
1225 | OFFSET(pglist_data, node_zones); | ||
1226 | OFFSET(pglist_data, nr_zones); | ||
1227 | #ifdef CONFIG_FLAT_NODE_MEM_MAP | ||
1228 | OFFSET(pglist_data, node_mem_map); | ||
1229 | #endif | ||
1230 | OFFSET(pglist_data, node_start_pfn); | ||
1231 | OFFSET(pglist_data, node_spanned_pages); | ||
1232 | OFFSET(pglist_data, node_id); | ||
1233 | OFFSET(zone, free_area); | ||
1234 | OFFSET(zone, vm_stat); | ||
1235 | OFFSET(zone, spanned_pages); | ||
1236 | OFFSET(free_area, free_list); | ||
1237 | OFFSET(list_head, next); | ||
1238 | OFFSET(list_head, prev); | ||
1239 | LENGTH(zone.free_area, MAX_ORDER); | ||
1240 | |||
1241 | arch_crash_save_vmcoreinfo(); | ||
1242 | |||
1243 | return 0; | ||
1244 | } | ||
1245 | |||
1246 | module_init(crash_save_vmcoreinfo_init) | ||
diff --git a/kernel/ksysfs.c b/kernel/ksysfs.c index 6046939d0804..38b38f957ef0 100644 --- a/kernel/ksysfs.c +++ b/kernel/ksysfs.c | |||
@@ -61,6 +61,15 @@ static ssize_t kexec_crash_loaded_show(struct kset *kset, char *page) | |||
61 | return sprintf(page, "%d\n", !!kexec_crash_image); | 61 | return sprintf(page, "%d\n", !!kexec_crash_image); |
62 | } | 62 | } |
63 | KERNEL_ATTR_RO(kexec_crash_loaded); | 63 | KERNEL_ATTR_RO(kexec_crash_loaded); |
64 | |||
65 | static ssize_t vmcoreinfo_show(struct kset *kset, char *page) | ||
66 | { | ||
67 | return sprintf(page, "%lx %x\n", | ||
68 | paddr_vmcoreinfo_note(), | ||
69 | vmcoreinfo_max_size); | ||
70 | } | ||
71 | KERNEL_ATTR_RO(vmcoreinfo); | ||
72 | |||
64 | #endif /* CONFIG_KEXEC */ | 73 | #endif /* CONFIG_KEXEC */ |
65 | 74 | ||
66 | /* | 75 | /* |
@@ -96,6 +105,7 @@ static struct attribute * kernel_attrs[] = { | |||
96 | #ifdef CONFIG_KEXEC | 105 | #ifdef CONFIG_KEXEC |
97 | &kexec_loaded_attr.attr, | 106 | &kexec_loaded_attr.attr, |
98 | &kexec_crash_loaded_attr.attr, | 107 | &kexec_crash_loaded_attr.attr, |
108 | &vmcoreinfo_attr.attr, | ||
99 | #endif | 109 | #endif |
100 | NULL | 110 | NULL |
101 | }; | 111 | }; |