diff options
author | Steven Whitehouse <swhiteho@redhat.com> | 2006-07-17 09:25:26 -0400 |
---|---|---|
committer | Steven Whitehouse <swhiteho@redhat.com> | 2006-07-17 09:25:26 -0400 |
commit | 4bf311ddfbffe12d41ad1a3c311ab727db6f72cb (patch) | |
tree | 9d19a2774e83637d86dc876f3af22af1dacf0bec /fs | |
parent | 597d0cae0f99f62501e229bed50e8149604015bb (diff) | |
parent | 82d6897fefca6206bca7153805b4c5359ce97fc4 (diff) |
Merge branch 'master'
Diffstat (limited to 'fs')
-rw-r--r-- | fs/Kconfig | 1 | ||||
-rw-r--r-- | fs/binfmt_elf.c | 2 | ||||
-rw-r--r-- | fs/binfmt_elf_fdpic.c | 980 | ||||
-rw-r--r-- | fs/char_dev.c | 22 | ||||
-rw-r--r-- | fs/ext3/acl.h | 3 | ||||
-rw-r--r-- | fs/file.c | 14 | ||||
-rw-r--r-- | fs/hugetlbfs/inode.c | 4 | ||||
-rw-r--r-- | fs/jfs/jfs_txnmgr.c | 2 | ||||
-rw-r--r-- | fs/jfs/namei.c | 33 | ||||
-rw-r--r-- | fs/namei.c | 8 | ||||
-rw-r--r-- | fs/nfsd/nfs4proc.c | 8 | ||||
-rw-r--r-- | fs/nfsd/stats.c | 10 | ||||
-rw-r--r-- | fs/partitions/check.c | 1 | ||||
-rw-r--r-- | fs/proc/array.c | 6 | ||||
-rw-r--r-- | fs/proc/base.c | 33 | ||||
-rw-r--r-- | fs/proc/inode.c | 2 | ||||
-rw-r--r-- | fs/proc/kcore.c | 4 | ||||
-rw-r--r-- | fs/ramfs/file-nommu.c | 4 | ||||
-rw-r--r-- | fs/read_write.c | 2 | ||||
-rw-r--r-- | fs/reiserfs/file.c | 6 | ||||
-rw-r--r-- | fs/reiserfs/procfs.c | 25 | ||||
-rw-r--r-- | fs/splice.c | 238 | ||||
-rw-r--r-- | fs/sysfs/inode.c | 12 | ||||
-rw-r--r-- | fs/xfs/linux-2.6/xfs_linux.h | 1 |
24 files changed, 1127 insertions, 294 deletions
diff --git a/fs/Kconfig b/fs/Kconfig index a7cd7db5e533..ddc7462ddb56 100644 --- a/fs/Kconfig +++ b/fs/Kconfig | |||
@@ -1802,6 +1802,7 @@ config CIFS_POSIX | |||
1802 | 1802 | ||
1803 | config CIFS_DEBUG2 | 1803 | config CIFS_DEBUG2 |
1804 | bool "Enable additional CIFS debugging routines" | 1804 | bool "Enable additional CIFS debugging routines" |
1805 | depends on CIFS | ||
1805 | help | 1806 | help |
1806 | Enabling this option adds a few more debugging routines | 1807 | Enabling this option adds a few more debugging routines |
1807 | to the cifs code which slightly increases the size of | 1808 | to the cifs code which slightly increases the size of |
diff --git a/fs/binfmt_elf.c b/fs/binfmt_elf.c index f42e64210ee5..672a3b90bc55 100644 --- a/fs/binfmt_elf.c +++ b/fs/binfmt_elf.c | |||
@@ -1185,8 +1185,6 @@ static int maydump(struct vm_area_struct *vma) | |||
1185 | return 1; | 1185 | return 1; |
1186 | } | 1186 | } |
1187 | 1187 | ||
1188 | #define roundup(x, y) ((((x) + ((y) - 1)) / (y)) * (y)) | ||
1189 | |||
1190 | /* An ELF note in memory */ | 1188 | /* An ELF note in memory */ |
1191 | struct memelfnote | 1189 | struct memelfnote |
1192 | { | 1190 | { |
diff --git a/fs/binfmt_elf_fdpic.c b/fs/binfmt_elf_fdpic.c index eba4e23b9ca0..2f3365829229 100644 --- a/fs/binfmt_elf_fdpic.c +++ b/fs/binfmt_elf_fdpic.c | |||
@@ -1,6 +1,6 @@ | |||
1 | /* binfmt_elf_fdpic.c: FDPIC ELF binary format | 1 | /* binfmt_elf_fdpic.c: FDPIC ELF binary format |
2 | * | 2 | * |
3 | * Copyright (C) 2003, 2004 Red Hat, Inc. All Rights Reserved. | 3 | * Copyright (C) 2003, 2004, 2006 Red Hat, Inc. All Rights Reserved. |
4 | * Written by David Howells (dhowells@redhat.com) | 4 | * Written by David Howells (dhowells@redhat.com) |
5 | * Derived from binfmt_elf.c | 5 | * Derived from binfmt_elf.c |
6 | * | 6 | * |
@@ -24,7 +24,9 @@ | |||
24 | #include <linux/file.h> | 24 | #include <linux/file.h> |
25 | #include <linux/fcntl.h> | 25 | #include <linux/fcntl.h> |
26 | #include <linux/slab.h> | 26 | #include <linux/slab.h> |
27 | #include <linux/pagemap.h> | ||
27 | #include <linux/highmem.h> | 28 | #include <linux/highmem.h> |
29 | #include <linux/highuid.h> | ||
28 | #include <linux/personality.h> | 30 | #include <linux/personality.h> |
29 | #include <linux/ptrace.h> | 31 | #include <linux/ptrace.h> |
30 | #include <linux/init.h> | 32 | #include <linux/init.h> |
@@ -48,45 +50,59 @@ typedef char *elf_caddr_t; | |||
48 | #define kdebug(fmt, ...) do {} while(0) | 50 | #define kdebug(fmt, ...) do {} while(0) |
49 | #endif | 51 | #endif |
50 | 52 | ||
53 | #if 0 | ||
54 | #define kdcore(fmt, ...) printk("FDPIC "fmt"\n" ,##__VA_ARGS__ ) | ||
55 | #else | ||
56 | #define kdcore(fmt, ...) do {} while(0) | ||
57 | #endif | ||
58 | |||
51 | MODULE_LICENSE("GPL"); | 59 | MODULE_LICENSE("GPL"); |
52 | 60 | ||
53 | static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs); | 61 | static int load_elf_fdpic_binary(struct linux_binprm *, struct pt_regs *); |
54 | //static int load_elf_fdpic_library(struct file *); | 62 | static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *, struct file *); |
55 | static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params, struct file *file); | 63 | static int elf_fdpic_map_file(struct elf_fdpic_params *, struct file *, |
56 | static int elf_fdpic_map_file(struct elf_fdpic_params *params, | 64 | struct mm_struct *, const char *); |
57 | struct file *file, | ||
58 | struct mm_struct *mm, | ||
59 | const char *what); | ||
60 | 65 | ||
61 | static int create_elf_fdpic_tables(struct linux_binprm *bprm, | 66 | static int create_elf_fdpic_tables(struct linux_binprm *, struct mm_struct *, |
62 | struct mm_struct *mm, | 67 | struct elf_fdpic_params *, |
63 | struct elf_fdpic_params *exec_params, | 68 | struct elf_fdpic_params *); |
64 | struct elf_fdpic_params *interp_params); | ||
65 | 69 | ||
66 | #ifndef CONFIG_MMU | 70 | #ifndef CONFIG_MMU |
67 | static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *bprm, unsigned long *_sp); | 71 | static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *, |
68 | static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *params, | 72 | unsigned long *); |
69 | struct file *file, | 73 | static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *, |
70 | struct mm_struct *mm); | 74 | struct file *, |
75 | struct mm_struct *); | ||
71 | #endif | 76 | #endif |
72 | 77 | ||
73 | static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | 78 | static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *, |
74 | struct file *file, | 79 | struct file *, struct mm_struct *); |
75 | struct mm_struct *mm); | 80 | |
81 | #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE) | ||
82 | static int elf_fdpic_core_dump(long, struct pt_regs *, struct file *); | ||
83 | #endif | ||
76 | 84 | ||
77 | static struct linux_binfmt elf_fdpic_format = { | 85 | static struct linux_binfmt elf_fdpic_format = { |
78 | .module = THIS_MODULE, | 86 | .module = THIS_MODULE, |
79 | .load_binary = load_elf_fdpic_binary, | 87 | .load_binary = load_elf_fdpic_binary, |
80 | // .load_shlib = load_elf_fdpic_library, | 88 | #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE) |
81 | // .core_dump = elf_fdpic_core_dump, | 89 | .core_dump = elf_fdpic_core_dump, |
90 | #endif | ||
82 | .min_coredump = ELF_EXEC_PAGESIZE, | 91 | .min_coredump = ELF_EXEC_PAGESIZE, |
83 | }; | 92 | }; |
84 | 93 | ||
85 | static int __init init_elf_fdpic_binfmt(void) { return register_binfmt(&elf_fdpic_format); } | 94 | static int __init init_elf_fdpic_binfmt(void) |
86 | static void __exit exit_elf_fdpic_binfmt(void) { unregister_binfmt(&elf_fdpic_format); } | 95 | { |
96 | return register_binfmt(&elf_fdpic_format); | ||
97 | } | ||
98 | |||
99 | static void __exit exit_elf_fdpic_binfmt(void) | ||
100 | { | ||
101 | unregister_binfmt(&elf_fdpic_format); | ||
102 | } | ||
87 | 103 | ||
88 | module_init(init_elf_fdpic_binfmt) | 104 | core_initcall(init_elf_fdpic_binfmt); |
89 | module_exit(exit_elf_fdpic_binfmt) | 105 | module_exit(exit_elf_fdpic_binfmt); |
90 | 106 | ||
91 | static int is_elf_fdpic(struct elfhdr *hdr, struct file *file) | 107 | static int is_elf_fdpic(struct elfhdr *hdr, struct file *file) |
92 | { | 108 | { |
@@ -105,7 +121,8 @@ static int is_elf_fdpic(struct elfhdr *hdr, struct file *file) | |||
105 | /* | 121 | /* |
106 | * read the program headers table into memory | 122 | * read the program headers table into memory |
107 | */ | 123 | */ |
108 | static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params, struct file *file) | 124 | static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params, |
125 | struct file *file) | ||
109 | { | 126 | { |
110 | struct elf32_phdr *phdr; | 127 | struct elf32_phdr *phdr; |
111 | unsigned long size; | 128 | unsigned long size; |
@@ -121,7 +138,8 @@ static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params, struct file *f | |||
121 | if (!params->phdrs) | 138 | if (!params->phdrs) |
122 | return -ENOMEM; | 139 | return -ENOMEM; |
123 | 140 | ||
124 | retval = kernel_read(file, params->hdr.e_phoff, (char *) params->phdrs, size); | 141 | retval = kernel_read(file, params->hdr.e_phoff, |
142 | (char *) params->phdrs, size); | ||
125 | if (retval < 0) | 143 | if (retval < 0) |
126 | return retval; | 144 | return retval; |
127 | 145 | ||
@@ -141,17 +159,24 @@ static int elf_fdpic_fetch_phdrs(struct elf_fdpic_params *params, struct file *f | |||
141 | } | 159 | } |
142 | 160 | ||
143 | return 0; | 161 | return 0; |
144 | } /* end elf_fdpic_fetch_phdrs() */ | 162 | } |
145 | 163 | ||
146 | /*****************************************************************************/ | 164 | /*****************************************************************************/ |
147 | /* | 165 | /* |
148 | * load an fdpic binary into various bits of memory | 166 | * load an fdpic binary into various bits of memory |
149 | */ | 167 | */ |
150 | static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs) | 168 | static int load_elf_fdpic_binary(struct linux_binprm *bprm, |
169 | struct pt_regs *regs) | ||
151 | { | 170 | { |
152 | struct elf_fdpic_params exec_params, interp_params; | 171 | struct elf_fdpic_params exec_params, interp_params; |
153 | struct elf_phdr *phdr; | 172 | struct elf_phdr *phdr; |
154 | unsigned long stack_size; | 173 | unsigned long stack_size, entryaddr; |
174 | #ifndef CONFIG_MMU | ||
175 | unsigned long fullsize; | ||
176 | #endif | ||
177 | #ifdef ELF_FDPIC_PLAT_INIT | ||
178 | unsigned long dynaddr; | ||
179 | #endif | ||
155 | struct file *interpreter = NULL; /* to shut gcc up */ | 180 | struct file *interpreter = NULL; /* to shut gcc up */ |
156 | char *interpreter_name = NULL; | 181 | char *interpreter_name = NULL; |
157 | int executable_stack; | 182 | int executable_stack; |
@@ -212,7 +237,8 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
212 | goto error; | 237 | goto error; |
213 | } | 238 | } |
214 | 239 | ||
215 | retval = kernel_read(interpreter, 0, bprm->buf, BINPRM_BUF_SIZE); | 240 | retval = kernel_read(interpreter, 0, bprm->buf, |
241 | BINPRM_BUF_SIZE); | ||
216 | if (retval < 0) | 242 | if (retval < 0) |
217 | goto error; | 243 | goto error; |
218 | 244 | ||
@@ -295,7 +321,8 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
295 | ¤t->mm->start_stack, | 321 | ¤t->mm->start_stack, |
296 | ¤t->mm->start_brk); | 322 | ¤t->mm->start_brk); |
297 | 323 | ||
298 | retval = setup_arg_pages(bprm, current->mm->start_stack, executable_stack); | 324 | retval = setup_arg_pages(bprm, current->mm->start_stack, |
325 | executable_stack); | ||
299 | if (retval < 0) { | 326 | if (retval < 0) { |
300 | send_sig(SIGKILL, current, 0); | 327 | send_sig(SIGKILL, current, 0); |
301 | goto error_kill; | 328 | goto error_kill; |
@@ -303,7 +330,8 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
303 | #endif | 330 | #endif |
304 | 331 | ||
305 | /* load the executable and interpreter into memory */ | 332 | /* load the executable and interpreter into memory */ |
306 | retval = elf_fdpic_map_file(&exec_params, bprm->file, current->mm, "executable"); | 333 | retval = elf_fdpic_map_file(&exec_params, bprm->file, current->mm, |
334 | "executable"); | ||
307 | if (retval < 0) | 335 | if (retval < 0) |
308 | goto error_kill; | 336 | goto error_kill; |
309 | 337 | ||
@@ -324,7 +352,8 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
324 | if (!current->mm->start_brk) | 352 | if (!current->mm->start_brk) |
325 | current->mm->start_brk = current->mm->end_data; | 353 | current->mm->start_brk = current->mm->end_data; |
326 | 354 | ||
327 | current->mm->brk = current->mm->start_brk = PAGE_ALIGN(current->mm->start_brk); | 355 | current->mm->brk = current->mm->start_brk = |
356 | PAGE_ALIGN(current->mm->start_brk); | ||
328 | 357 | ||
329 | #else | 358 | #else |
330 | /* create a stack and brk area big enough for everyone | 359 | /* create a stack and brk area big enough for everyone |
@@ -336,47 +365,45 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
336 | stack_size = PAGE_SIZE * 2; | 365 | stack_size = PAGE_SIZE * 2; |
337 | 366 | ||
338 | down_write(¤t->mm->mmap_sem); | 367 | down_write(¤t->mm->mmap_sem); |
339 | current->mm->start_brk = do_mmap(NULL, | 368 | current->mm->start_brk = do_mmap(NULL, 0, stack_size, |
340 | 0, | ||
341 | stack_size, | ||
342 | PROT_READ | PROT_WRITE | PROT_EXEC, | 369 | PROT_READ | PROT_WRITE | PROT_EXEC, |
343 | MAP_PRIVATE | MAP_ANON | MAP_GROWSDOWN, | 370 | MAP_PRIVATE | MAP_ANON | MAP_GROWSDOWN, |
344 | 0); | 371 | 0); |
345 | 372 | ||
346 | if (IS_ERR((void *) current->mm->start_brk)) { | 373 | if (IS_ERR_VALUE(current->mm->start_brk)) { |
347 | up_write(¤t->mm->mmap_sem); | 374 | up_write(¤t->mm->mmap_sem); |
348 | retval = current->mm->start_brk; | 375 | retval = current->mm->start_brk; |
349 | current->mm->start_brk = 0; | 376 | current->mm->start_brk = 0; |
350 | goto error_kill; | 377 | goto error_kill; |
351 | } | 378 | } |
352 | 379 | ||
353 | if (do_mremap(current->mm->start_brk, | 380 | /* expand the stack mapping to use up the entire allocation granule */ |
354 | stack_size, | 381 | fullsize = ksize((char *) current->mm->start_brk); |
355 | ksize((char *) current->mm->start_brk), | 382 | if (!IS_ERR_VALUE(do_mremap(current->mm->start_brk, stack_size, |
356 | 0, 0 | 383 | fullsize, 0, 0))) |
357 | ) == current->mm->start_brk | 384 | stack_size = fullsize; |
358 | ) | ||
359 | stack_size = ksize((char *) current->mm->start_brk); | ||
360 | up_write(¤t->mm->mmap_sem); | 385 | up_write(¤t->mm->mmap_sem); |
361 | 386 | ||
362 | current->mm->brk = current->mm->start_brk; | 387 | current->mm->brk = current->mm->start_brk; |
363 | current->mm->context.end_brk = current->mm->start_brk; | 388 | current->mm->context.end_brk = current->mm->start_brk; |
364 | current->mm->context.end_brk += (stack_size > PAGE_SIZE) ? (stack_size - PAGE_SIZE) : 0; | 389 | current->mm->context.end_brk += |
390 | (stack_size > PAGE_SIZE) ? (stack_size - PAGE_SIZE) : 0; | ||
365 | current->mm->start_stack = current->mm->start_brk + stack_size; | 391 | current->mm->start_stack = current->mm->start_brk + stack_size; |
366 | #endif | 392 | #endif |
367 | 393 | ||
368 | compute_creds(bprm); | 394 | compute_creds(bprm); |
369 | current->flags &= ~PF_FORKNOEXEC; | 395 | current->flags &= ~PF_FORKNOEXEC; |
370 | if (create_elf_fdpic_tables(bprm, current->mm, &exec_params, &interp_params) < 0) | 396 | if (create_elf_fdpic_tables(bprm, current->mm, |
397 | &exec_params, &interp_params) < 0) | ||
371 | goto error_kill; | 398 | goto error_kill; |
372 | 399 | ||
373 | kdebug("- start_code %lx", (long) current->mm->start_code); | 400 | kdebug("- start_code %lx", current->mm->start_code); |
374 | kdebug("- end_code %lx", (long) current->mm->end_code); | 401 | kdebug("- end_code %lx", current->mm->end_code); |
375 | kdebug("- start_data %lx", (long) current->mm->start_data); | 402 | kdebug("- start_data %lx", current->mm->start_data); |
376 | kdebug("- end_data %lx", (long) current->mm->end_data); | 403 | kdebug("- end_data %lx", current->mm->end_data); |
377 | kdebug("- start_brk %lx", (long) current->mm->start_brk); | 404 | kdebug("- start_brk %lx", current->mm->start_brk); |
378 | kdebug("- brk %lx", (long) current->mm->brk); | 405 | kdebug("- brk %lx", current->mm->brk); |
379 | kdebug("- start_stack %lx", (long) current->mm->start_stack); | 406 | kdebug("- start_stack %lx", current->mm->start_stack); |
380 | 407 | ||
381 | #ifdef ELF_FDPIC_PLAT_INIT | 408 | #ifdef ELF_FDPIC_PLAT_INIT |
382 | /* | 409 | /* |
@@ -385,21 +412,18 @@ static int load_elf_fdpic_binary(struct linux_binprm *bprm, struct pt_regs *regs | |||
385 | * example. This macro performs whatever initialization to | 412 | * example. This macro performs whatever initialization to |
386 | * the regs structure is required. | 413 | * the regs structure is required. |
387 | */ | 414 | */ |
388 | ELF_FDPIC_PLAT_INIT(regs, | 415 | dynaddr = interp_params.dynamic_addr ?: exec_params.dynamic_addr; |
389 | exec_params.map_addr, | 416 | ELF_FDPIC_PLAT_INIT(regs, exec_params.map_addr, interp_params.map_addr, |
390 | interp_params.map_addr, | 417 | dynaddr); |
391 | interp_params.dynamic_addr ?: exec_params.dynamic_addr | ||
392 | ); | ||
393 | #endif | 418 | #endif |
394 | 419 | ||
395 | /* everything is now ready... get the userspace context ready to roll */ | 420 | /* everything is now ready... get the userspace context ready to roll */ |
396 | start_thread(regs, | 421 | entryaddr = interp_params.entry_addr ?: exec_params.entry_addr; |
397 | interp_params.entry_addr ?: exec_params.entry_addr, | 422 | start_thread(regs, entryaddr, current->mm->start_stack); |
398 | current->mm->start_stack); | ||
399 | 423 | ||
400 | if (unlikely(current->ptrace & PT_PTRACED)) { | 424 | if (unlikely(current->ptrace & PT_PTRACED)) { |
401 | if (current->ptrace & PT_TRACE_EXEC) | 425 | if (current->ptrace & PT_TRACE_EXEC) |
402 | ptrace_notify ((PTRACE_EVENT_EXEC << 8) | SIGTRAP); | 426 | ptrace_notify((PTRACE_EVENT_EXEC << 8) | SIGTRAP); |
403 | else | 427 | else |
404 | send_sig(SIGTRAP, current, 0); | 428 | send_sig(SIGTRAP, current, 0); |
405 | } | 429 | } |
@@ -419,11 +443,11 @@ error: | |||
419 | return retval; | 443 | return retval; |
420 | 444 | ||
421 | /* unrecoverable error - kill the process */ | 445 | /* unrecoverable error - kill the process */ |
422 | error_kill: | 446 | error_kill: |
423 | send_sig(SIGSEGV, current, 0); | 447 | send_sig(SIGSEGV, current, 0); |
424 | goto error; | 448 | goto error; |
425 | 449 | ||
426 | } /* end load_elf_fdpic_binary() */ | 450 | } |
427 | 451 | ||
428 | /*****************************************************************************/ | 452 | /*****************************************************************************/ |
429 | /* | 453 | /* |
@@ -459,6 +483,7 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
459 | */ | 483 | */ |
460 | hwcap = ELF_HWCAP; | 484 | hwcap = ELF_HWCAP; |
461 | k_platform = ELF_PLATFORM; | 485 | k_platform = ELF_PLATFORM; |
486 | u_platform = NULL; | ||
462 | 487 | ||
463 | if (k_platform) { | 488 | if (k_platform) { |
464 | platform_len = strlen(k_platform) + 1; | 489 | platform_len = strlen(k_platform) + 1; |
@@ -470,11 +495,11 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
470 | 495 | ||
471 | #if defined(__i386__) && defined(CONFIG_SMP) | 496 | #if defined(__i386__) && defined(CONFIG_SMP) |
472 | /* in some cases (e.g. Hyper-Threading), we want to avoid L1 evictions | 497 | /* in some cases (e.g. Hyper-Threading), we want to avoid L1 evictions |
473 | * by the processes running on the same package. One thing we can do | 498 | * by the processes running on the same package. One thing we can do is |
474 | * is to shuffle the initial stack for them. | 499 | * to shuffle the initial stack for them. |
475 | * | 500 | * |
476 | * the conditionals here are unneeded, but kept in to make the | 501 | * the conditionals here are unneeded, but kept in to make the code |
477 | * code behaviour the same as pre change unless we have hyperthreaded | 502 | * behaviour the same as pre change unless we have hyperthreaded |
478 | * processors. This keeps Mr Marcelo Person happier but should be | 503 | * processors. This keeps Mr Marcelo Person happier but should be |
479 | * removed for 2.5 | 504 | * removed for 2.5 |
480 | */ | 505 | */ |
@@ -497,11 +522,13 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
497 | 522 | ||
498 | if (interp_params->loadmap) { | 523 | if (interp_params->loadmap) { |
499 | len = sizeof(struct elf32_fdpic_loadmap); | 524 | len = sizeof(struct elf32_fdpic_loadmap); |
500 | len += sizeof(struct elf32_fdpic_loadseg) * interp_params->loadmap->nsegs; | 525 | len += sizeof(struct elf32_fdpic_loadseg) * |
526 | interp_params->loadmap->nsegs; | ||
501 | sp = (sp - len) & ~7UL; | 527 | sp = (sp - len) & ~7UL; |
502 | interp_params->map_addr = sp; | 528 | interp_params->map_addr = sp; |
503 | 529 | ||
504 | if (copy_to_user((void __user *) sp, interp_params->loadmap, len) != 0) | 530 | if (copy_to_user((void __user *) sp, interp_params->loadmap, |
531 | len) != 0) | ||
505 | return -EFAULT; | 532 | return -EFAULT; |
506 | 533 | ||
507 | current->mm->context.interp_fdpic_loadmap = (unsigned long) sp; | 534 | current->mm->context.interp_fdpic_loadmap = (unsigned long) sp; |
@@ -525,34 +552,37 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
525 | sp -= sp & 15UL; | 552 | sp -= sp & 15UL; |
526 | 553 | ||
527 | /* put the ELF interpreter info on the stack */ | 554 | /* put the ELF interpreter info on the stack */ |
528 | #define NEW_AUX_ENT(nr, id, val) \ | 555 | #define NEW_AUX_ENT(nr, id, val) \ |
529 | do { \ | 556 | do { \ |
530 | struct { unsigned long _id, _val; } __user *ent = (void __user *) csp; \ | 557 | struct { unsigned long _id, _val; } __user *ent; \ |
531 | __put_user((id), &ent[nr]._id); \ | 558 | \ |
532 | __put_user((val), &ent[nr]._val); \ | 559 | ent = (void __user *) csp; \ |
560 | __put_user((id), &ent[nr]._id); \ | ||
561 | __put_user((val), &ent[nr]._val); \ | ||
533 | } while (0) | 562 | } while (0) |
534 | 563 | ||
535 | csp -= 2 * sizeof(unsigned long); | 564 | csp -= 2 * sizeof(unsigned long); |
536 | NEW_AUX_ENT(0, AT_NULL, 0); | 565 | NEW_AUX_ENT(0, AT_NULL, 0); |
537 | if (k_platform) { | 566 | if (k_platform) { |
538 | csp -= 2 * sizeof(unsigned long); | 567 | csp -= 2 * sizeof(unsigned long); |
539 | NEW_AUX_ENT(0, AT_PLATFORM, (elf_addr_t)(unsigned long) u_platform); | 568 | NEW_AUX_ENT(0, AT_PLATFORM, |
569 | (elf_addr_t) (unsigned long) u_platform); | ||
540 | } | 570 | } |
541 | 571 | ||
542 | csp -= DLINFO_ITEMS * 2 * sizeof(unsigned long); | 572 | csp -= DLINFO_ITEMS * 2 * sizeof(unsigned long); |
543 | NEW_AUX_ENT( 0, AT_HWCAP, hwcap); | 573 | NEW_AUX_ENT( 0, AT_HWCAP, hwcap); |
544 | NEW_AUX_ENT( 1, AT_PAGESZ, PAGE_SIZE); | 574 | NEW_AUX_ENT( 1, AT_PAGESZ, PAGE_SIZE); |
545 | NEW_AUX_ENT( 2, AT_CLKTCK, CLOCKS_PER_SEC); | 575 | NEW_AUX_ENT( 2, AT_CLKTCK, CLOCKS_PER_SEC); |
546 | NEW_AUX_ENT( 3, AT_PHDR, exec_params->ph_addr); | 576 | NEW_AUX_ENT( 3, AT_PHDR, exec_params->ph_addr); |
547 | NEW_AUX_ENT( 4, AT_PHENT, sizeof(struct elf_phdr)); | 577 | NEW_AUX_ENT( 4, AT_PHENT, sizeof(struct elf_phdr)); |
548 | NEW_AUX_ENT( 5, AT_PHNUM, exec_params->hdr.e_phnum); | 578 | NEW_AUX_ENT( 5, AT_PHNUM, exec_params->hdr.e_phnum); |
549 | NEW_AUX_ENT( 6, AT_BASE, interp_params->elfhdr_addr); | 579 | NEW_AUX_ENT( 6, AT_BASE, interp_params->elfhdr_addr); |
550 | NEW_AUX_ENT( 7, AT_FLAGS, 0); | 580 | NEW_AUX_ENT( 7, AT_FLAGS, 0); |
551 | NEW_AUX_ENT( 8, AT_ENTRY, exec_params->entry_addr); | 581 | NEW_AUX_ENT( 8, AT_ENTRY, exec_params->entry_addr); |
552 | NEW_AUX_ENT( 9, AT_UID, (elf_addr_t) current->uid); | 582 | NEW_AUX_ENT( 9, AT_UID, (elf_addr_t) current->uid); |
553 | NEW_AUX_ENT(10, AT_EUID, (elf_addr_t) current->euid); | 583 | NEW_AUX_ENT(10, AT_EUID, (elf_addr_t) current->euid); |
554 | NEW_AUX_ENT(11, AT_GID, (elf_addr_t) current->gid); | 584 | NEW_AUX_ENT(11, AT_GID, (elf_addr_t) current->gid); |
555 | NEW_AUX_ENT(12, AT_EGID, (elf_addr_t) current->egid); | 585 | NEW_AUX_ENT(12, AT_EGID, (elf_addr_t) current->egid); |
556 | 586 | ||
557 | #ifdef ARCH_DLINFO | 587 | #ifdef ARCH_DLINFO |
558 | /* ARCH_DLINFO must come last so platform specific code can enforce | 588 | /* ARCH_DLINFO must come last so platform specific code can enforce |
@@ -578,7 +608,8 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
578 | #ifdef CONFIG_MMU | 608 | #ifdef CONFIG_MMU |
579 | current->mm->arg_start = bprm->p; | 609 | current->mm->arg_start = bprm->p; |
580 | #else | 610 | #else |
581 | current->mm->arg_start = current->mm->start_stack - (MAX_ARG_PAGES * PAGE_SIZE - bprm->p); | 611 | current->mm->arg_start = current->mm->start_stack - |
612 | (MAX_ARG_PAGES * PAGE_SIZE - bprm->p); | ||
582 | #endif | 613 | #endif |
583 | 614 | ||
584 | p = (char __user *) current->mm->arg_start; | 615 | p = (char __user *) current->mm->arg_start; |
@@ -606,7 +637,7 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
606 | 637 | ||
607 | mm->start_stack = (unsigned long) sp; | 638 | mm->start_stack = (unsigned long) sp; |
608 | return 0; | 639 | return 0; |
609 | } /* end create_elf_fdpic_tables() */ | 640 | } |
610 | 641 | ||
611 | /*****************************************************************************/ | 642 | /*****************************************************************************/ |
612 | /* | 643 | /* |
@@ -614,7 +645,8 @@ static int create_elf_fdpic_tables(struct linux_binprm *bprm, | |||
614 | * the stack | 645 | * the stack |
615 | */ | 646 | */ |
616 | #ifndef CONFIG_MMU | 647 | #ifndef CONFIG_MMU |
617 | static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *bprm, unsigned long *_sp) | 648 | static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *bprm, |
649 | unsigned long *_sp) | ||
618 | { | 650 | { |
619 | unsigned long index, stop, sp; | 651 | unsigned long index, stop, sp; |
620 | char *src; | 652 | char *src; |
@@ -635,9 +667,9 @@ static int elf_fdpic_transfer_args_to_stack(struct linux_binprm *bprm, unsigned | |||
635 | 667 | ||
636 | *_sp = (*_sp - (MAX_ARG_PAGES * PAGE_SIZE - bprm->p)) & ~15; | 668 | *_sp = (*_sp - (MAX_ARG_PAGES * PAGE_SIZE - bprm->p)) & ~15; |
637 | 669 | ||
638 | out: | 670 | out: |
639 | return ret; | 671 | return ret; |
640 | } /* end elf_fdpic_transfer_args_to_stack() */ | 672 | } |
641 | #endif | 673 | #endif |
642 | 674 | ||
643 | /*****************************************************************************/ | 675 | /*****************************************************************************/ |
@@ -712,17 +744,18 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
712 | seg = loadmap->segs; | 744 | seg = loadmap->segs; |
713 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { | 745 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { |
714 | if (params->hdr.e_entry >= seg->p_vaddr && | 746 | if (params->hdr.e_entry >= seg->p_vaddr && |
715 | params->hdr.e_entry < seg->p_vaddr + seg->p_memsz | 747 | params->hdr.e_entry < seg->p_vaddr + seg->p_memsz) { |
716 | ) { | ||
717 | params->entry_addr = | 748 | params->entry_addr = |
718 | (params->hdr.e_entry - seg->p_vaddr) + seg->addr; | 749 | (params->hdr.e_entry - seg->p_vaddr) + |
750 | seg->addr; | ||
719 | break; | 751 | break; |
720 | } | 752 | } |
721 | } | 753 | } |
722 | } | 754 | } |
723 | 755 | ||
724 | /* determine where the program header table has wound up if mapped */ | 756 | /* determine where the program header table has wound up if mapped */ |
725 | stop = params->hdr.e_phoff + params->hdr.e_phnum * sizeof (struct elf_phdr); | 757 | stop = params->hdr.e_phoff; |
758 | stop += params->hdr.e_phnum * sizeof (struct elf_phdr); | ||
726 | phdr = params->phdrs; | 759 | phdr = params->phdrs; |
727 | 760 | ||
728 | for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) { | 761 | for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) { |
@@ -736,9 +769,11 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
736 | seg = loadmap->segs; | 769 | seg = loadmap->segs; |
737 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { | 770 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { |
738 | if (phdr->p_vaddr >= seg->p_vaddr && | 771 | if (phdr->p_vaddr >= seg->p_vaddr && |
739 | phdr->p_vaddr + phdr->p_filesz <= seg->p_vaddr + seg->p_memsz | 772 | phdr->p_vaddr + phdr->p_filesz <= |
740 | ) { | 773 | seg->p_vaddr + seg->p_memsz) { |
741 | params->ph_addr = (phdr->p_vaddr - seg->p_vaddr) + seg->addr + | 774 | params->ph_addr = |
775 | (phdr->p_vaddr - seg->p_vaddr) + | ||
776 | seg->addr + | ||
742 | params->hdr.e_phoff - phdr->p_offset; | 777 | params->hdr.e_phoff - phdr->p_offset; |
743 | break; | 778 | break; |
744 | } | 779 | } |
@@ -755,18 +790,22 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
755 | seg = loadmap->segs; | 790 | seg = loadmap->segs; |
756 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { | 791 | for (loop = loadmap->nsegs; loop > 0; loop--, seg++) { |
757 | if (phdr->p_vaddr >= seg->p_vaddr && | 792 | if (phdr->p_vaddr >= seg->p_vaddr && |
758 | phdr->p_vaddr + phdr->p_memsz <= seg->p_vaddr + seg->p_memsz | 793 | phdr->p_vaddr + phdr->p_memsz <= |
759 | ) { | 794 | seg->p_vaddr + seg->p_memsz) { |
760 | params->dynamic_addr = (phdr->p_vaddr - seg->p_vaddr) + seg->addr; | 795 | params->dynamic_addr = |
761 | 796 | (phdr->p_vaddr - seg->p_vaddr) + | |
762 | /* check the dynamic section contains at least one item, and that | 797 | seg->addr; |
763 | * the last item is a NULL entry */ | 798 | |
799 | /* check the dynamic section contains at least | ||
800 | * one item, and that the last item is a NULL | ||
801 | * entry */ | ||
764 | if (phdr->p_memsz == 0 || | 802 | if (phdr->p_memsz == 0 || |
765 | phdr->p_memsz % sizeof(Elf32_Dyn) != 0) | 803 | phdr->p_memsz % sizeof(Elf32_Dyn) != 0) |
766 | goto dynamic_error; | 804 | goto dynamic_error; |
767 | 805 | ||
768 | tmp = phdr->p_memsz / sizeof(Elf32_Dyn); | 806 | tmp = phdr->p_memsz / sizeof(Elf32_Dyn); |
769 | if (((Elf32_Dyn *) params->dynamic_addr)[tmp - 1].d_tag != 0) | 807 | if (((Elf32_Dyn *) |
808 | params->dynamic_addr)[tmp - 1].d_tag != 0) | ||
770 | goto dynamic_error; | 809 | goto dynamic_error; |
771 | break; | 810 | break; |
772 | } | 811 | } |
@@ -775,8 +814,8 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
775 | } | 814 | } |
776 | 815 | ||
777 | /* now elide adjacent segments in the load map on MMU linux | 816 | /* now elide adjacent segments in the load map on MMU linux |
778 | * - on uClinux the holes between may actually be filled with system stuff or stuff from | 817 | * - on uClinux the holes between may actually be filled with system |
779 | * other processes | 818 | * stuff or stuff from other processes |
780 | */ | 819 | */ |
781 | #ifdef CONFIG_MMU | 820 | #ifdef CONFIG_MMU |
782 | nloads = loadmap->nsegs; | 821 | nloads = loadmap->nsegs; |
@@ -787,7 +826,9 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
787 | if (seg->p_vaddr - mseg->p_vaddr == seg->addr - mseg->addr) { | 826 | if (seg->p_vaddr - mseg->p_vaddr == seg->addr - mseg->addr) { |
788 | load_addr = PAGE_ALIGN(mseg->addr + mseg->p_memsz); | 827 | load_addr = PAGE_ALIGN(mseg->addr + mseg->p_memsz); |
789 | if (load_addr == (seg->addr & PAGE_MASK)) { | 828 | if (load_addr == (seg->addr & PAGE_MASK)) { |
790 | mseg->p_memsz += load_addr - (mseg->addr + mseg->p_memsz); | 829 | mseg->p_memsz += |
830 | load_addr - | ||
831 | (mseg->addr + mseg->p_memsz); | ||
791 | mseg->p_memsz += seg->addr & ~PAGE_MASK; | 832 | mseg->p_memsz += seg->addr & ~PAGE_MASK; |
792 | mseg->p_memsz += seg->p_memsz; | 833 | mseg->p_memsz += seg->p_memsz; |
793 | loadmap->nsegs--; | 834 | loadmap->nsegs--; |
@@ -815,20 +856,21 @@ static int elf_fdpic_map_file(struct elf_fdpic_params *params, | |||
815 | 856 | ||
816 | return 0; | 857 | return 0; |
817 | 858 | ||
818 | dynamic_error: | 859 | dynamic_error: |
819 | printk("ELF FDPIC %s with invalid DYNAMIC section (inode=%lu)\n", | 860 | printk("ELF FDPIC %s with invalid DYNAMIC section (inode=%lu)\n", |
820 | what, file->f_dentry->d_inode->i_ino); | 861 | what, file->f_dentry->d_inode->i_ino); |
821 | return -ELIBBAD; | 862 | return -ELIBBAD; |
822 | } /* end elf_fdpic_map_file() */ | 863 | } |
823 | 864 | ||
824 | /*****************************************************************************/ | 865 | /*****************************************************************************/ |
825 | /* | 866 | /* |
826 | * map a file with constant displacement under uClinux | 867 | * map a file with constant displacement under uClinux |
827 | */ | 868 | */ |
828 | #ifndef CONFIG_MMU | 869 | #ifndef CONFIG_MMU |
829 | static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *params, | 870 | static int elf_fdpic_map_file_constdisp_on_uclinux( |
830 | struct file *file, | 871 | struct elf_fdpic_params *params, |
831 | struct mm_struct *mm) | 872 | struct file *file, |
873 | struct mm_struct *mm) | ||
832 | { | 874 | { |
833 | struct elf32_fdpic_loadseg *seg; | 875 | struct elf32_fdpic_loadseg *seg; |
834 | struct elf32_phdr *phdr; | 876 | struct elf32_phdr *phdr; |
@@ -839,7 +881,8 @@ static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *para | |||
839 | load_addr = params->load_addr; | 881 | load_addr = params->load_addr; |
840 | seg = params->loadmap->segs; | 882 | seg = params->loadmap->segs; |
841 | 883 | ||
842 | /* determine the bounds of the contiguous overall allocation we must make */ | 884 | /* determine the bounds of the contiguous overall allocation we must |
885 | * make */ | ||
843 | phdr = params->phdrs; | 886 | phdr = params->phdrs; |
844 | for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) { | 887 | for (loop = 0; loop < params->hdr.e_phnum; loop++, phdr++) { |
845 | if (params->phdrs[loop].p_type != PT_LOAD) | 888 | if (params->phdrs[loop].p_type != PT_LOAD) |
@@ -860,7 +903,7 @@ static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *para | |||
860 | maddr = do_mmap(NULL, load_addr, top - base, | 903 | maddr = do_mmap(NULL, load_addr, top - base, |
861 | PROT_READ | PROT_WRITE | PROT_EXEC, mflags, 0); | 904 | PROT_READ | PROT_WRITE | PROT_EXEC, mflags, 0); |
862 | up_write(&mm->mmap_sem); | 905 | up_write(&mm->mmap_sem); |
863 | if (IS_ERR((void *) maddr)) | 906 | if (IS_ERR_VALUE(maddr)) |
864 | return (int) maddr; | 907 | return (int) maddr; |
865 | 908 | ||
866 | if (load_addr != 0) | 909 | if (load_addr != 0) |
@@ -878,7 +921,8 @@ static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *para | |||
878 | seg->p_vaddr = phdr->p_vaddr; | 921 | seg->p_vaddr = phdr->p_vaddr; |
879 | seg->p_memsz = phdr->p_memsz; | 922 | seg->p_memsz = phdr->p_memsz; |
880 | 923 | ||
881 | ret = file->f_op->read(file, (void *) seg->addr, phdr->p_filesz, &fpos); | 924 | ret = file->f_op->read(file, (void *) seg->addr, |
925 | phdr->p_filesz, &fpos); | ||
882 | if (ret < 0) | 926 | if (ret < 0) |
883 | return ret; | 927 | return ret; |
884 | 928 | ||
@@ -895,8 +939,7 @@ static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *para | |||
895 | if (phdr->p_flags & PF_X) { | 939 | if (phdr->p_flags & PF_X) { |
896 | mm->start_code = seg->addr; | 940 | mm->start_code = seg->addr; |
897 | mm->end_code = seg->addr + phdr->p_memsz; | 941 | mm->end_code = seg->addr + phdr->p_memsz; |
898 | } | 942 | } else if (!mm->start_data) { |
899 | else if (!mm->start_data) { | ||
900 | mm->start_data = seg->addr; | 943 | mm->start_data = seg->addr; |
901 | #ifndef CONFIG_MMU | 944 | #ifndef CONFIG_MMU |
902 | mm->end_data = seg->addr + phdr->p_memsz; | 945 | mm->end_data = seg->addr + phdr->p_memsz; |
@@ -913,7 +956,7 @@ static int elf_fdpic_map_file_constdisp_on_uclinux(struct elf_fdpic_params *para | |||
913 | } | 956 | } |
914 | 957 | ||
915 | return 0; | 958 | return 0; |
916 | } /* end elf_fdpic_map_file_constdisp_on_uclinux() */ | 959 | } |
917 | #endif | 960 | #endif |
918 | 961 | ||
919 | /*****************************************************************************/ | 962 | /*****************************************************************************/ |
@@ -974,14 +1017,14 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
974 | 1017 | ||
975 | case ELF_FDPIC_FLAG_CONSTDISP: | 1018 | case ELF_FDPIC_FLAG_CONSTDISP: |
976 | /* constant displacement | 1019 | /* constant displacement |
977 | * - can be mapped anywhere, but must be mapped as a unit | 1020 | * - can be mapped anywhere, but must be mapped as a |
1021 | * unit | ||
978 | */ | 1022 | */ |
979 | if (!dvset) { | 1023 | if (!dvset) { |
980 | maddr = load_addr; | 1024 | maddr = load_addr; |
981 | delta_vaddr = phdr->p_vaddr; | 1025 | delta_vaddr = phdr->p_vaddr; |
982 | dvset = 1; | 1026 | dvset = 1; |
983 | } | 1027 | } else { |
984 | else { | ||
985 | maddr = load_addr + phdr->p_vaddr - delta_vaddr; | 1028 | maddr = load_addr + phdr->p_vaddr - delta_vaddr; |
986 | flags |= MAP_FIXED; | 1029 | flags |= MAP_FIXED; |
987 | } | 1030 | } |
@@ -1005,13 +1048,14 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1005 | up_write(&mm->mmap_sem); | 1048 | up_write(&mm->mmap_sem); |
1006 | 1049 | ||
1007 | kdebug("mmap[%d] <file> sz=%lx pr=%x fl=%x of=%lx --> %08lx", | 1050 | kdebug("mmap[%d] <file> sz=%lx pr=%x fl=%x of=%lx --> %08lx", |
1008 | loop, phdr->p_memsz + disp, prot, flags, phdr->p_offset - disp, | 1051 | loop, phdr->p_memsz + disp, prot, flags, |
1009 | maddr); | 1052 | phdr->p_offset - disp, maddr); |
1010 | 1053 | ||
1011 | if (IS_ERR((void *) maddr)) | 1054 | if (IS_ERR_VALUE(maddr)) |
1012 | return (int) maddr; | 1055 | return (int) maddr; |
1013 | 1056 | ||
1014 | if ((params->flags & ELF_FDPIC_FLAG_ARRANGEMENT) == ELF_FDPIC_FLAG_CONTIGUOUS) | 1057 | if ((params->flags & ELF_FDPIC_FLAG_ARRANGEMENT) == |
1058 | ELF_FDPIC_FLAG_CONTIGUOUS) | ||
1015 | load_addr += PAGE_ALIGN(phdr->p_memsz + disp); | 1059 | load_addr += PAGE_ALIGN(phdr->p_memsz + disp); |
1016 | 1060 | ||
1017 | seg->addr = maddr + disp; | 1061 | seg->addr = maddr + disp; |
@@ -1022,7 +1066,8 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1022 | if (phdr->p_offset == 0) | 1066 | if (phdr->p_offset == 0) |
1023 | params->elfhdr_addr = seg->addr; | 1067 | params->elfhdr_addr = seg->addr; |
1024 | 1068 | ||
1025 | /* clear the bit between beginning of mapping and beginning of PT_LOAD */ | 1069 | /* clear the bit between beginning of mapping and beginning of |
1070 | * PT_LOAD */ | ||
1026 | if (prot & PROT_WRITE && disp > 0) { | 1071 | if (prot & PROT_WRITE && disp > 0) { |
1027 | kdebug("clear[%d] ad=%lx sz=%lx", loop, maddr, disp); | 1072 | kdebug("clear[%d] ad=%lx sz=%lx", loop, maddr, disp); |
1028 | clear_user((void __user *) maddr, disp); | 1073 | clear_user((void __user *) maddr, disp); |
@@ -1038,19 +1083,20 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1038 | excess1 = PAGE_SIZE - ((maddr + phdr->p_filesz) & ~PAGE_MASK); | 1083 | excess1 = PAGE_SIZE - ((maddr + phdr->p_filesz) & ~PAGE_MASK); |
1039 | 1084 | ||
1040 | #ifdef CONFIG_MMU | 1085 | #ifdef CONFIG_MMU |
1041 | |||
1042 | if (excess > excess1) { | 1086 | if (excess > excess1) { |
1043 | unsigned long xaddr = maddr + phdr->p_filesz + excess1; | 1087 | unsigned long xaddr = maddr + phdr->p_filesz + excess1; |
1044 | unsigned long xmaddr; | 1088 | unsigned long xmaddr; |
1045 | 1089 | ||
1046 | flags |= MAP_FIXED | MAP_ANONYMOUS; | 1090 | flags |= MAP_FIXED | MAP_ANONYMOUS; |
1047 | down_write(&mm->mmap_sem); | 1091 | down_write(&mm->mmap_sem); |
1048 | xmaddr = do_mmap(NULL, xaddr, excess - excess1, prot, flags, 0); | 1092 | xmaddr = do_mmap(NULL, xaddr, excess - excess1, |
1093 | prot, flags, 0); | ||
1049 | up_write(&mm->mmap_sem); | 1094 | up_write(&mm->mmap_sem); |
1050 | 1095 | ||
1051 | kdebug("mmap[%d] <anon>" | 1096 | kdebug("mmap[%d] <anon>" |
1052 | " ad=%lx sz=%lx pr=%x fl=%x of=0 --> %08lx", | 1097 | " ad=%lx sz=%lx pr=%x fl=%x of=0 --> %08lx", |
1053 | loop, xaddr, excess - excess1, prot, flags, xmaddr); | 1098 | loop, xaddr, excess - excess1, prot, flags, |
1099 | xmaddr); | ||
1054 | 1100 | ||
1055 | if (xmaddr != xaddr) | 1101 | if (xmaddr != xaddr) |
1056 | return -ENOMEM; | 1102 | return -ENOMEM; |
@@ -1059,7 +1105,8 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1059 | if (prot & PROT_WRITE && excess1 > 0) { | 1105 | if (prot & PROT_WRITE && excess1 > 0) { |
1060 | kdebug("clear[%d] ad=%lx sz=%lx", | 1106 | kdebug("clear[%d] ad=%lx sz=%lx", |
1061 | loop, maddr + phdr->p_filesz, excess1); | 1107 | loop, maddr + phdr->p_filesz, excess1); |
1062 | clear_user((void __user *) maddr + phdr->p_filesz, excess1); | 1108 | clear_user((void __user *) maddr + phdr->p_filesz, |
1109 | excess1); | ||
1063 | } | 1110 | } |
1064 | 1111 | ||
1065 | #else | 1112 | #else |
@@ -1074,8 +1121,7 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1074 | if (phdr->p_flags & PF_X) { | 1121 | if (phdr->p_flags & PF_X) { |
1075 | mm->start_code = maddr; | 1122 | mm->start_code = maddr; |
1076 | mm->end_code = maddr + phdr->p_memsz; | 1123 | mm->end_code = maddr + phdr->p_memsz; |
1077 | } | 1124 | } else if (!mm->start_data) { |
1078 | else if (!mm->start_data) { | ||
1079 | mm->start_data = maddr; | 1125 | mm->start_data = maddr; |
1080 | mm->end_data = maddr + phdr->p_memsz; | 1126 | mm->end_data = maddr + phdr->p_memsz; |
1081 | } | 1127 | } |
@@ -1085,4 +1131,662 @@ static int elf_fdpic_map_file_by_direct_mmap(struct elf_fdpic_params *params, | |||
1085 | } | 1131 | } |
1086 | 1132 | ||
1087 | return 0; | 1133 | return 0; |
1088 | } /* end elf_fdpic_map_file_by_direct_mmap() */ | 1134 | } |
1135 | |||
1136 | /*****************************************************************************/ | ||
1137 | /* | ||
1138 | * ELF-FDPIC core dumper | ||
1139 | * | ||
1140 | * Modelled on fs/exec.c:aout_core_dump() | ||
1141 | * Jeremy Fitzhardinge <jeremy@sw.oz.au> | ||
1142 | * | ||
1143 | * Modelled on fs/binfmt_elf.c core dumper | ||
1144 | */ | ||
1145 | #if defined(USE_ELF_CORE_DUMP) && defined(CONFIG_ELF_CORE) | ||
1146 | |||
1147 | /* | ||
1148 | * These are the only things you should do on a core-file: use only these | ||
1149 | * functions to write out all the necessary info. | ||
1150 | */ | ||
1151 | static int dump_write(struct file *file, const void *addr, int nr) | ||
1152 | { | ||
1153 | return file->f_op->write(file, addr, nr, &file->f_pos) == nr; | ||
1154 | } | ||
1155 | |||
1156 | static int dump_seek(struct file *file, loff_t off) | ||
1157 | { | ||
1158 | if (file->f_op->llseek) { | ||
1159 | if (file->f_op->llseek(file, off, SEEK_SET) != off) | ||
1160 | return 0; | ||
1161 | } else { | ||
1162 | file->f_pos = off; | ||
1163 | } | ||
1164 | return 1; | ||
1165 | } | ||
1166 | |||
1167 | /* | ||
1168 | * Decide whether a segment is worth dumping; default is yes to be | ||
1169 | * sure (missing info is worse than too much; etc). | ||
1170 | * Personally I'd include everything, and use the coredump limit... | ||
1171 | * | ||
1172 | * I think we should skip something. But I am not sure how. H.J. | ||
1173 | */ | ||
1174 | static int maydump(struct vm_area_struct *vma) | ||
1175 | { | ||
1176 | /* Do not dump I/O mapped devices or special mappings */ | ||
1177 | if (vma->vm_flags & (VM_IO | VM_RESERVED)) { | ||
1178 | kdcore("%08lx: %08lx: no (IO)", vma->vm_start, vma->vm_flags); | ||
1179 | return 0; | ||
1180 | } | ||
1181 | |||
1182 | /* If we may not read the contents, don't allow us to dump | ||
1183 | * them either. "dump_write()" can't handle it anyway. | ||
1184 | */ | ||
1185 | if (!(vma->vm_flags & VM_READ)) { | ||
1186 | kdcore("%08lx: %08lx: no (!read)", vma->vm_start, vma->vm_flags); | ||
1187 | return 0; | ||
1188 | } | ||
1189 | |||
1190 | /* Dump shared memory only if mapped from an anonymous file. */ | ||
1191 | if (vma->vm_flags & VM_SHARED) { | ||
1192 | if (vma->vm_file->f_dentry->d_inode->i_nlink == 0) { | ||
1193 | kdcore("%08lx: %08lx: no (share)", vma->vm_start, vma->vm_flags); | ||
1194 | return 1; | ||
1195 | } | ||
1196 | |||
1197 | kdcore("%08lx: %08lx: no (share)", vma->vm_start, vma->vm_flags); | ||
1198 | return 0; | ||
1199 | } | ||
1200 | |||
1201 | #ifdef CONFIG_MMU | ||
1202 | /* If it hasn't been written to, don't write it out */ | ||
1203 | if (!vma->anon_vma) { | ||
1204 | kdcore("%08lx: %08lx: no (!anon)", vma->vm_start, vma->vm_flags); | ||
1205 | return 0; | ||
1206 | } | ||
1207 | #endif | ||
1208 | |||
1209 | kdcore("%08lx: %08lx: yes", vma->vm_start, vma->vm_flags); | ||
1210 | return 1; | ||
1211 | } | ||
1212 | |||
1213 | /* An ELF note in memory */ | ||
1214 | struct memelfnote | ||
1215 | { | ||
1216 | const char *name; | ||
1217 | int type; | ||
1218 | unsigned int datasz; | ||
1219 | void *data; | ||
1220 | }; | ||
1221 | |||
1222 | static int notesize(struct memelfnote *en) | ||
1223 | { | ||
1224 | int sz; | ||
1225 | |||
1226 | sz = sizeof(struct elf_note); | ||
1227 | sz += roundup(strlen(en->name) + 1, 4); | ||
1228 | sz += roundup(en->datasz, 4); | ||
1229 | |||
1230 | return sz; | ||
1231 | } | ||
1232 | |||
1233 | /* #define DEBUG */ | ||
1234 | |||
1235 | #define DUMP_WRITE(addr, nr) \ | ||
1236 | do { if (!dump_write(file, (addr), (nr))) return 0; } while(0) | ||
1237 | #define DUMP_SEEK(off) \ | ||
1238 | do { if (!dump_seek(file, (off))) return 0; } while(0) | ||
1239 | |||
1240 | static int writenote(struct memelfnote *men, struct file *file) | ||
1241 | { | ||
1242 | struct elf_note en; | ||
1243 | |||
1244 | en.n_namesz = strlen(men->name) + 1; | ||
1245 | en.n_descsz = men->datasz; | ||
1246 | en.n_type = men->type; | ||
1247 | |||
1248 | DUMP_WRITE(&en, sizeof(en)); | ||
1249 | DUMP_WRITE(men->name, en.n_namesz); | ||
1250 | /* XXX - cast from long long to long to avoid need for libgcc.a */ | ||
1251 | DUMP_SEEK(roundup((unsigned long)file->f_pos, 4)); /* XXX */ | ||
1252 | DUMP_WRITE(men->data, men->datasz); | ||
1253 | DUMP_SEEK(roundup((unsigned long)file->f_pos, 4)); /* XXX */ | ||
1254 | |||
1255 | return 1; | ||
1256 | } | ||
1257 | #undef DUMP_WRITE | ||
1258 | #undef DUMP_SEEK | ||
1259 | |||
1260 | #define DUMP_WRITE(addr, nr) \ | ||
1261 | if ((size += (nr)) > limit || !dump_write(file, (addr), (nr))) \ | ||
1262 | goto end_coredump; | ||
1263 | #define DUMP_SEEK(off) \ | ||
1264 | if (!dump_seek(file, (off))) \ | ||
1265 | goto end_coredump; | ||
1266 | |||
1267 | static inline void fill_elf_fdpic_header(struct elfhdr *elf, int segs) | ||
1268 | { | ||
1269 | memcpy(elf->e_ident, ELFMAG, SELFMAG); | ||
1270 | elf->e_ident[EI_CLASS] = ELF_CLASS; | ||
1271 | elf->e_ident[EI_DATA] = ELF_DATA; | ||
1272 | elf->e_ident[EI_VERSION] = EV_CURRENT; | ||
1273 | elf->e_ident[EI_OSABI] = ELF_OSABI; | ||
1274 | memset(elf->e_ident+EI_PAD, 0, EI_NIDENT-EI_PAD); | ||
1275 | |||
1276 | elf->e_type = ET_CORE; | ||
1277 | elf->e_machine = ELF_ARCH; | ||
1278 | elf->e_version = EV_CURRENT; | ||
1279 | elf->e_entry = 0; | ||
1280 | elf->e_phoff = sizeof(struct elfhdr); | ||
1281 | elf->e_shoff = 0; | ||
1282 | elf->e_flags = ELF_FDPIC_CORE_EFLAGS; | ||
1283 | elf->e_ehsize = sizeof(struct elfhdr); | ||
1284 | elf->e_phentsize = sizeof(struct elf_phdr); | ||
1285 | elf->e_phnum = segs; | ||
1286 | elf->e_shentsize = 0; | ||
1287 | elf->e_shnum = 0; | ||
1288 | elf->e_shstrndx = 0; | ||
1289 | return; | ||
1290 | } | ||
1291 | |||
1292 | static inline void fill_elf_note_phdr(struct elf_phdr *phdr, int sz, loff_t offset) | ||
1293 | { | ||
1294 | phdr->p_type = PT_NOTE; | ||
1295 | phdr->p_offset = offset; | ||
1296 | phdr->p_vaddr = 0; | ||
1297 | phdr->p_paddr = 0; | ||
1298 | phdr->p_filesz = sz; | ||
1299 | phdr->p_memsz = 0; | ||
1300 | phdr->p_flags = 0; | ||
1301 | phdr->p_align = 0; | ||
1302 | return; | ||
1303 | } | ||
1304 | |||
1305 | static inline void fill_note(struct memelfnote *note, const char *name, int type, | ||
1306 | unsigned int sz, void *data) | ||
1307 | { | ||
1308 | note->name = name; | ||
1309 | note->type = type; | ||
1310 | note->datasz = sz; | ||
1311 | note->data = data; | ||
1312 | return; | ||
1313 | } | ||
1314 | |||
1315 | /* | ||
1316 | * fill up all the fields in prstatus from the given task struct, except | ||
1317 | * registers which need to be filled up seperately. | ||
1318 | */ | ||
1319 | static void fill_prstatus(struct elf_prstatus *prstatus, | ||
1320 | struct task_struct *p, long signr) | ||
1321 | { | ||
1322 | prstatus->pr_info.si_signo = prstatus->pr_cursig = signr; | ||
1323 | prstatus->pr_sigpend = p->pending.signal.sig[0]; | ||
1324 | prstatus->pr_sighold = p->blocked.sig[0]; | ||
1325 | prstatus->pr_pid = p->pid; | ||
1326 | prstatus->pr_ppid = p->parent->pid; | ||
1327 | prstatus->pr_pgrp = process_group(p); | ||
1328 | prstatus->pr_sid = p->signal->session; | ||
1329 | if (thread_group_leader(p)) { | ||
1330 | /* | ||
1331 | * This is the record for the group leader. Add in the | ||
1332 | * cumulative times of previous dead threads. This total | ||
1333 | * won't include the time of each live thread whose state | ||
1334 | * is included in the core dump. The final total reported | ||
1335 | * to our parent process when it calls wait4 will include | ||
1336 | * those sums as well as the little bit more time it takes | ||
1337 | * this and each other thread to finish dying after the | ||
1338 | * core dump synchronization phase. | ||
1339 | */ | ||
1340 | cputime_to_timeval(cputime_add(p->utime, p->signal->utime), | ||
1341 | &prstatus->pr_utime); | ||
1342 | cputime_to_timeval(cputime_add(p->stime, p->signal->stime), | ||
1343 | &prstatus->pr_stime); | ||
1344 | } else { | ||
1345 | cputime_to_timeval(p->utime, &prstatus->pr_utime); | ||
1346 | cputime_to_timeval(p->stime, &prstatus->pr_stime); | ||
1347 | } | ||
1348 | cputime_to_timeval(p->signal->cutime, &prstatus->pr_cutime); | ||
1349 | cputime_to_timeval(p->signal->cstime, &prstatus->pr_cstime); | ||
1350 | |||
1351 | prstatus->pr_exec_fdpic_loadmap = p->mm->context.exec_fdpic_loadmap; | ||
1352 | prstatus->pr_interp_fdpic_loadmap = p->mm->context.interp_fdpic_loadmap; | ||
1353 | } | ||
1354 | |||
1355 | static int fill_psinfo(struct elf_prpsinfo *psinfo, struct task_struct *p, | ||
1356 | struct mm_struct *mm) | ||
1357 | { | ||
1358 | unsigned int i, len; | ||
1359 | |||
1360 | /* first copy the parameters from user space */ | ||
1361 | memset(psinfo, 0, sizeof(struct elf_prpsinfo)); | ||
1362 | |||
1363 | len = mm->arg_end - mm->arg_start; | ||
1364 | if (len >= ELF_PRARGSZ) | ||
1365 | len = ELF_PRARGSZ - 1; | ||
1366 | if (copy_from_user(&psinfo->pr_psargs, | ||
1367 | (const char __user *) mm->arg_start, len)) | ||
1368 | return -EFAULT; | ||
1369 | for (i = 0; i < len; i++) | ||
1370 | if (psinfo->pr_psargs[i] == 0) | ||
1371 | psinfo->pr_psargs[i] = ' '; | ||
1372 | psinfo->pr_psargs[len] = 0; | ||
1373 | |||
1374 | psinfo->pr_pid = p->pid; | ||
1375 | psinfo->pr_ppid = p->parent->pid; | ||
1376 | psinfo->pr_pgrp = process_group(p); | ||
1377 | psinfo->pr_sid = p->signal->session; | ||
1378 | |||
1379 | i = p->state ? ffz(~p->state) + 1 : 0; | ||
1380 | psinfo->pr_state = i; | ||
1381 | psinfo->pr_sname = (i > 5) ? '.' : "RSDTZW"[i]; | ||
1382 | psinfo->pr_zomb = psinfo->pr_sname == 'Z'; | ||
1383 | psinfo->pr_nice = task_nice(p); | ||
1384 | psinfo->pr_flag = p->flags; | ||
1385 | SET_UID(psinfo->pr_uid, p->uid); | ||
1386 | SET_GID(psinfo->pr_gid, p->gid); | ||
1387 | strncpy(psinfo->pr_fname, p->comm, sizeof(psinfo->pr_fname)); | ||
1388 | |||
1389 | return 0; | ||
1390 | } | ||
1391 | |||
1392 | /* Here is the structure in which status of each thread is captured. */ | ||
1393 | struct elf_thread_status | ||
1394 | { | ||
1395 | struct list_head list; | ||
1396 | struct elf_prstatus prstatus; /* NT_PRSTATUS */ | ||
1397 | elf_fpregset_t fpu; /* NT_PRFPREG */ | ||
1398 | struct task_struct *thread; | ||
1399 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1400 | elf_fpxregset_t xfpu; /* NT_PRXFPREG */ | ||
1401 | #endif | ||
1402 | struct memelfnote notes[3]; | ||
1403 | int num_notes; | ||
1404 | }; | ||
1405 | |||
1406 | /* | ||
1407 | * In order to add the specific thread information for the elf file format, | ||
1408 | * we need to keep a linked list of every thread's pr_status and then create | ||
1409 | * a single section for them in the final core file. | ||
1410 | */ | ||
1411 | static int elf_dump_thread_status(long signr, struct elf_thread_status *t) | ||
1412 | { | ||
1413 | struct task_struct *p = t->thread; | ||
1414 | int sz = 0; | ||
1415 | |||
1416 | t->num_notes = 0; | ||
1417 | |||
1418 | fill_prstatus(&t->prstatus, p, signr); | ||
1419 | elf_core_copy_task_regs(p, &t->prstatus.pr_reg); | ||
1420 | |||
1421 | fill_note(&t->notes[0], "CORE", NT_PRSTATUS, sizeof(t->prstatus), | ||
1422 | &t->prstatus); | ||
1423 | t->num_notes++; | ||
1424 | sz += notesize(&t->notes[0]); | ||
1425 | |||
1426 | t->prstatus.pr_fpvalid = elf_core_copy_task_fpregs(p, NULL, &t->fpu); | ||
1427 | if (t->prstatus.pr_fpvalid) { | ||
1428 | fill_note(&t->notes[1], "CORE", NT_PRFPREG, sizeof(t->fpu), | ||
1429 | &t->fpu); | ||
1430 | t->num_notes++; | ||
1431 | sz += notesize(&t->notes[1]); | ||
1432 | } | ||
1433 | |||
1434 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1435 | if (elf_core_copy_task_xfpregs(p, &t->xfpu)) { | ||
1436 | fill_note(&t->notes[2], "LINUX", NT_PRXFPREG, sizeof(t->xfpu), | ||
1437 | &t->xfpu); | ||
1438 | t->num_notes++; | ||
1439 | sz += notesize(&t->notes[2]); | ||
1440 | } | ||
1441 | #endif | ||
1442 | return sz; | ||
1443 | } | ||
1444 | |||
1445 | /* | ||
1446 | * dump the segments for an MMU process | ||
1447 | */ | ||
1448 | #ifdef CONFIG_MMU | ||
1449 | static int elf_fdpic_dump_segments(struct file *file, struct mm_struct *mm, | ||
1450 | size_t *size, unsigned long *limit) | ||
1451 | { | ||
1452 | struct vm_area_struct *vma; | ||
1453 | |||
1454 | for (vma = current->mm->mmap; vma; vma = vma->vm_next) { | ||
1455 | unsigned long addr; | ||
1456 | |||
1457 | if (!maydump(vma)) | ||
1458 | continue; | ||
1459 | |||
1460 | for (addr = vma->vm_start; | ||
1461 | addr < vma->vm_end; | ||
1462 | addr += PAGE_SIZE | ||
1463 | ) { | ||
1464 | struct vm_area_struct *vma; | ||
1465 | struct page *page; | ||
1466 | |||
1467 | if (get_user_pages(current, current->mm, addr, 1, 0, 1, | ||
1468 | &page, &vma) <= 0) { | ||
1469 | DUMP_SEEK(file->f_pos + PAGE_SIZE); | ||
1470 | } | ||
1471 | else if (page == ZERO_PAGE(addr)) { | ||
1472 | DUMP_SEEK(file->f_pos + PAGE_SIZE); | ||
1473 | page_cache_release(page); | ||
1474 | } | ||
1475 | else { | ||
1476 | void *kaddr; | ||
1477 | |||
1478 | flush_cache_page(vma, addr, page_to_pfn(page)); | ||
1479 | kaddr = kmap(page); | ||
1480 | if ((*size += PAGE_SIZE) > *limit || | ||
1481 | !dump_write(file, kaddr, PAGE_SIZE) | ||
1482 | ) { | ||
1483 | kunmap(page); | ||
1484 | page_cache_release(page); | ||
1485 | return -EIO; | ||
1486 | } | ||
1487 | kunmap(page); | ||
1488 | page_cache_release(page); | ||
1489 | } | ||
1490 | } | ||
1491 | } | ||
1492 | |||
1493 | return 0; | ||
1494 | |||
1495 | end_coredump: | ||
1496 | return -EFBIG; | ||
1497 | } | ||
1498 | #endif | ||
1499 | |||
1500 | /* | ||
1501 | * dump the segments for a NOMMU process | ||
1502 | */ | ||
1503 | #ifndef CONFIG_MMU | ||
1504 | static int elf_fdpic_dump_segments(struct file *file, struct mm_struct *mm, | ||
1505 | size_t *size, unsigned long *limit) | ||
1506 | { | ||
1507 | struct vm_list_struct *vml; | ||
1508 | |||
1509 | for (vml = current->mm->context.vmlist; vml; vml = vml->next) { | ||
1510 | struct vm_area_struct *vma = vml->vma; | ||
1511 | |||
1512 | if (!maydump(vma)) | ||
1513 | continue; | ||
1514 | |||
1515 | if ((*size += PAGE_SIZE) > *limit) | ||
1516 | return -EFBIG; | ||
1517 | |||
1518 | if (!dump_write(file, (void *) vma->vm_start, | ||
1519 | vma->vm_end - vma->vm_start)) | ||
1520 | return -EIO; | ||
1521 | } | ||
1522 | |||
1523 | return 0; | ||
1524 | } | ||
1525 | #endif | ||
1526 | |||
1527 | /* | ||
1528 | * Actual dumper | ||
1529 | * | ||
1530 | * This is a two-pass process; first we find the offsets of the bits, | ||
1531 | * and then they are actually written out. If we run out of core limit | ||
1532 | * we just truncate. | ||
1533 | */ | ||
1534 | static int elf_fdpic_core_dump(long signr, struct pt_regs *regs, | ||
1535 | struct file *file) | ||
1536 | { | ||
1537 | #define NUM_NOTES 6 | ||
1538 | int has_dumped = 0; | ||
1539 | mm_segment_t fs; | ||
1540 | int segs; | ||
1541 | size_t size = 0; | ||
1542 | int i; | ||
1543 | struct vm_area_struct *vma; | ||
1544 | struct elfhdr *elf = NULL; | ||
1545 | loff_t offset = 0, dataoff; | ||
1546 | unsigned long limit = current->signal->rlim[RLIMIT_CORE].rlim_cur; | ||
1547 | int numnote; | ||
1548 | struct memelfnote *notes = NULL; | ||
1549 | struct elf_prstatus *prstatus = NULL; /* NT_PRSTATUS */ | ||
1550 | struct elf_prpsinfo *psinfo = NULL; /* NT_PRPSINFO */ | ||
1551 | struct task_struct *g, *p; | ||
1552 | LIST_HEAD(thread_list); | ||
1553 | struct list_head *t; | ||
1554 | elf_fpregset_t *fpu = NULL; | ||
1555 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1556 | elf_fpxregset_t *xfpu = NULL; | ||
1557 | #endif | ||
1558 | int thread_status_size = 0; | ||
1559 | #ifndef CONFIG_MMU | ||
1560 | struct vm_list_struct *vml; | ||
1561 | #endif | ||
1562 | elf_addr_t *auxv; | ||
1563 | |||
1564 | /* | ||
1565 | * We no longer stop all VM operations. | ||
1566 | * | ||
1567 | * This is because those proceses that could possibly change map_count | ||
1568 | * or the mmap / vma pages are now blocked in do_exit on current | ||
1569 | * finishing this core dump. | ||
1570 | * | ||
1571 | * Only ptrace can touch these memory addresses, but it doesn't change | ||
1572 | * the map_count or the pages allocated. So no possibility of crashing | ||
1573 | * exists while dumping the mm->vm_next areas to the core file. | ||
1574 | */ | ||
1575 | |||
1576 | /* alloc memory for large data structures: too large to be on stack */ | ||
1577 | elf = kmalloc(sizeof(*elf), GFP_KERNEL); | ||
1578 | if (!elf) | ||
1579 | goto cleanup; | ||
1580 | prstatus = kzalloc(sizeof(*prstatus), GFP_KERNEL); | ||
1581 | if (!prstatus) | ||
1582 | goto cleanup; | ||
1583 | psinfo = kmalloc(sizeof(*psinfo), GFP_KERNEL); | ||
1584 | if (!psinfo) | ||
1585 | goto cleanup; | ||
1586 | notes = kmalloc(NUM_NOTES * sizeof(struct memelfnote), GFP_KERNEL); | ||
1587 | if (!notes) | ||
1588 | goto cleanup; | ||
1589 | fpu = kmalloc(sizeof(*fpu), GFP_KERNEL); | ||
1590 | if (!fpu) | ||
1591 | goto cleanup; | ||
1592 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1593 | xfpu = kmalloc(sizeof(*xfpu), GFP_KERNEL); | ||
1594 | if (!xfpu) | ||
1595 | goto cleanup; | ||
1596 | #endif | ||
1597 | |||
1598 | if (signr) { | ||
1599 | struct elf_thread_status *tmp; | ||
1600 | read_lock(&tasklist_lock); | ||
1601 | do_each_thread(g,p) | ||
1602 | if (current->mm == p->mm && current != p) { | ||
1603 | tmp = kzalloc(sizeof(*tmp), GFP_ATOMIC); | ||
1604 | if (!tmp) { | ||
1605 | read_unlock(&tasklist_lock); | ||
1606 | goto cleanup; | ||
1607 | } | ||
1608 | INIT_LIST_HEAD(&tmp->list); | ||
1609 | tmp->thread = p; | ||
1610 | list_add(&tmp->list, &thread_list); | ||
1611 | } | ||
1612 | while_each_thread(g,p); | ||
1613 | read_unlock(&tasklist_lock); | ||
1614 | list_for_each(t, &thread_list) { | ||
1615 | struct elf_thread_status *tmp; | ||
1616 | int sz; | ||
1617 | |||
1618 | tmp = list_entry(t, struct elf_thread_status, list); | ||
1619 | sz = elf_dump_thread_status(signr, tmp); | ||
1620 | thread_status_size += sz; | ||
1621 | } | ||
1622 | } | ||
1623 | |||
1624 | /* now collect the dump for the current */ | ||
1625 | fill_prstatus(prstatus, current, signr); | ||
1626 | elf_core_copy_regs(&prstatus->pr_reg, regs); | ||
1627 | |||
1628 | #ifdef CONFIG_MMU | ||
1629 | segs = current->mm->map_count; | ||
1630 | #else | ||
1631 | segs = 0; | ||
1632 | for (vml = current->mm->context.vmlist; vml; vml = vml->next) | ||
1633 | segs++; | ||
1634 | #endif | ||
1635 | #ifdef ELF_CORE_EXTRA_PHDRS | ||
1636 | segs += ELF_CORE_EXTRA_PHDRS; | ||
1637 | #endif | ||
1638 | |||
1639 | /* Set up header */ | ||
1640 | fill_elf_fdpic_header(elf, segs + 1); /* including notes section */ | ||
1641 | |||
1642 | has_dumped = 1; | ||
1643 | current->flags |= PF_DUMPCORE; | ||
1644 | |||
1645 | /* | ||
1646 | * Set up the notes in similar form to SVR4 core dumps made | ||
1647 | * with info from their /proc. | ||
1648 | */ | ||
1649 | |||
1650 | fill_note(notes + 0, "CORE", NT_PRSTATUS, sizeof(*prstatus), prstatus); | ||
1651 | fill_psinfo(psinfo, current->group_leader, current->mm); | ||
1652 | fill_note(notes + 1, "CORE", NT_PRPSINFO, sizeof(*psinfo), psinfo); | ||
1653 | |||
1654 | numnote = 2; | ||
1655 | |||
1656 | auxv = (elf_addr_t *) current->mm->saved_auxv; | ||
1657 | |||
1658 | i = 0; | ||
1659 | do | ||
1660 | i += 2; | ||
1661 | while (auxv[i - 2] != AT_NULL); | ||
1662 | fill_note(¬es[numnote++], "CORE", NT_AUXV, | ||
1663 | i * sizeof(elf_addr_t), auxv); | ||
1664 | |||
1665 | /* Try to dump the FPU. */ | ||
1666 | if ((prstatus->pr_fpvalid = | ||
1667 | elf_core_copy_task_fpregs(current, regs, fpu))) | ||
1668 | fill_note(notes + numnote++, | ||
1669 | "CORE", NT_PRFPREG, sizeof(*fpu), fpu); | ||
1670 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1671 | if (elf_core_copy_task_xfpregs(current, xfpu)) | ||
1672 | fill_note(notes + numnote++, | ||
1673 | "LINUX", NT_PRXFPREG, sizeof(*xfpu), xfpu); | ||
1674 | #endif | ||
1675 | |||
1676 | fs = get_fs(); | ||
1677 | set_fs(KERNEL_DS); | ||
1678 | |||
1679 | DUMP_WRITE(elf, sizeof(*elf)); | ||
1680 | offset += sizeof(*elf); /* Elf header */ | ||
1681 | offset += (segs+1) * sizeof(struct elf_phdr); /* Program headers */ | ||
1682 | |||
1683 | /* Write notes phdr entry */ | ||
1684 | { | ||
1685 | struct elf_phdr phdr; | ||
1686 | int sz = 0; | ||
1687 | |||
1688 | for (i = 0; i < numnote; i++) | ||
1689 | sz += notesize(notes + i); | ||
1690 | |||
1691 | sz += thread_status_size; | ||
1692 | |||
1693 | fill_elf_note_phdr(&phdr, sz, offset); | ||
1694 | offset += sz; | ||
1695 | DUMP_WRITE(&phdr, sizeof(phdr)); | ||
1696 | } | ||
1697 | |||
1698 | /* Page-align dumped data */ | ||
1699 | dataoff = offset = roundup(offset, ELF_EXEC_PAGESIZE); | ||
1700 | |||
1701 | /* write program headers for segments dump */ | ||
1702 | for ( | ||
1703 | #ifdef CONFIG_MMU | ||
1704 | vma = current->mm->mmap; vma; vma = vma->vm_next | ||
1705 | #else | ||
1706 | vml = current->mm->context.vmlist; vml; vml = vml->next | ||
1707 | #endif | ||
1708 | ) { | ||
1709 | struct elf_phdr phdr; | ||
1710 | size_t sz; | ||
1711 | |||
1712 | #ifndef CONFIG_MMU | ||
1713 | vma = vml->vma; | ||
1714 | #endif | ||
1715 | |||
1716 | sz = vma->vm_end - vma->vm_start; | ||
1717 | |||
1718 | phdr.p_type = PT_LOAD; | ||
1719 | phdr.p_offset = offset; | ||
1720 | phdr.p_vaddr = vma->vm_start; | ||
1721 | phdr.p_paddr = 0; | ||
1722 | phdr.p_filesz = maydump(vma) ? sz : 0; | ||
1723 | phdr.p_memsz = sz; | ||
1724 | offset += phdr.p_filesz; | ||
1725 | phdr.p_flags = vma->vm_flags & VM_READ ? PF_R : 0; | ||
1726 | if (vma->vm_flags & VM_WRITE) | ||
1727 | phdr.p_flags |= PF_W; | ||
1728 | if (vma->vm_flags & VM_EXEC) | ||
1729 | phdr.p_flags |= PF_X; | ||
1730 | phdr.p_align = ELF_EXEC_PAGESIZE; | ||
1731 | |||
1732 | DUMP_WRITE(&phdr, sizeof(phdr)); | ||
1733 | } | ||
1734 | |||
1735 | #ifdef ELF_CORE_WRITE_EXTRA_PHDRS | ||
1736 | ELF_CORE_WRITE_EXTRA_PHDRS; | ||
1737 | #endif | ||
1738 | |||
1739 | /* write out the notes section */ | ||
1740 | for (i = 0; i < numnote; i++) | ||
1741 | if (!writenote(notes + i, file)) | ||
1742 | goto end_coredump; | ||
1743 | |||
1744 | /* write out the thread status notes section */ | ||
1745 | list_for_each(t, &thread_list) { | ||
1746 | struct elf_thread_status *tmp = | ||
1747 | list_entry(t, struct elf_thread_status, list); | ||
1748 | |||
1749 | for (i = 0; i < tmp->num_notes; i++) | ||
1750 | if (!writenote(&tmp->notes[i], file)) | ||
1751 | goto end_coredump; | ||
1752 | } | ||
1753 | |||
1754 | DUMP_SEEK(dataoff); | ||
1755 | |||
1756 | if (elf_fdpic_dump_segments(file, current->mm, &size, &limit) < 0) | ||
1757 | goto end_coredump; | ||
1758 | |||
1759 | #ifdef ELF_CORE_WRITE_EXTRA_DATA | ||
1760 | ELF_CORE_WRITE_EXTRA_DATA; | ||
1761 | #endif | ||
1762 | |||
1763 | if (file->f_pos != offset) { | ||
1764 | /* Sanity check */ | ||
1765 | printk(KERN_WARNING | ||
1766 | "elf_core_dump: file->f_pos (%lld) != offset (%lld)\n", | ||
1767 | file->f_pos, offset); | ||
1768 | } | ||
1769 | |||
1770 | end_coredump: | ||
1771 | set_fs(fs); | ||
1772 | |||
1773 | cleanup: | ||
1774 | while (!list_empty(&thread_list)) { | ||
1775 | struct list_head *tmp = thread_list.next; | ||
1776 | list_del(tmp); | ||
1777 | kfree(list_entry(tmp, struct elf_thread_status, list)); | ||
1778 | } | ||
1779 | |||
1780 | kfree(elf); | ||
1781 | kfree(prstatus); | ||
1782 | kfree(psinfo); | ||
1783 | kfree(notes); | ||
1784 | kfree(fpu); | ||
1785 | #ifdef ELF_CORE_COPY_XFPREGS | ||
1786 | kfree(xfpu); | ||
1787 | #endif | ||
1788 | return has_dumped; | ||
1789 | #undef NUM_NOTES | ||
1790 | } | ||
1791 | |||
1792 | #endif /* USE_ELF_CORE_DUMP */ | ||
diff --git a/fs/char_dev.c b/fs/char_dev.c index a4cbc6706ef0..3483d3cf8087 100644 --- a/fs/char_dev.c +++ b/fs/char_dev.c | |||
@@ -182,6 +182,28 @@ int alloc_chrdev_region(dev_t *dev, unsigned baseminor, unsigned count, | |||
182 | return 0; | 182 | return 0; |
183 | } | 183 | } |
184 | 184 | ||
185 | /** | ||
186 | * register_chrdev() - Register a major number for character devices. | ||
187 | * @major: major device number or 0 for dynamic allocation | ||
188 | * @name: name of this range of devices | ||
189 | * @fops: file operations associated with this devices | ||
190 | * | ||
191 | * If @major == 0 this functions will dynamically allocate a major and return | ||
192 | * its number. | ||
193 | * | ||
194 | * If @major > 0 this function will attempt to reserve a device with the given | ||
195 | * major number and will return zero on success. | ||
196 | * | ||
197 | * Returns a -ve errno on failure. | ||
198 | * | ||
199 | * The name of this device has nothing to do with the name of the device in | ||
200 | * /dev. It only helps to keep track of the different owners of devices. If | ||
201 | * your module name has only one type of devices it's ok to use e.g. the name | ||
202 | * of the module here. | ||
203 | * | ||
204 | * This function registers a range of 256 minor numbers. The first minor number | ||
205 | * is 0. | ||
206 | */ | ||
185 | int register_chrdev(unsigned int major, const char *name, | 207 | int register_chrdev(unsigned int major, const char *name, |
186 | const struct file_operations *fops) | 208 | const struct file_operations *fops) |
187 | { | 209 | { |
diff --git a/fs/ext3/acl.h b/fs/ext3/acl.h index 92d50b53a933..0d1e6279cbfd 100644 --- a/fs/ext3/acl.h +++ b/fs/ext3/acl.h | |||
@@ -62,9 +62,6 @@ extern int ext3_permission (struct inode *, int, struct nameidata *); | |||
62 | extern int ext3_acl_chmod (struct inode *); | 62 | extern int ext3_acl_chmod (struct inode *); |
63 | extern int ext3_init_acl (handle_t *, struct inode *, struct inode *); | 63 | extern int ext3_init_acl (handle_t *, struct inode *, struct inode *); |
64 | 64 | ||
65 | extern int init_ext3_acl(void); | ||
66 | extern void exit_ext3_acl(void); | ||
67 | |||
68 | #else /* CONFIG_EXT3_FS_POSIX_ACL */ | 65 | #else /* CONFIG_EXT3_FS_POSIX_ACL */ |
69 | #include <linux/sched.h> | 66 | #include <linux/sched.h> |
70 | #define ext3_permission NULL | 67 | #define ext3_permission NULL |
@@ -240,13 +240,9 @@ static struct fdtable *alloc_fdtable(int nr) | |||
240 | if (!fdt) | 240 | if (!fdt) |
241 | goto out; | 241 | goto out; |
242 | 242 | ||
243 | nfds = 8 * L1_CACHE_BYTES; | 243 | nfds = max_t(int, 8 * L1_CACHE_BYTES, roundup_pow_of_two(nr + 1)); |
244 | /* Expand to the max in easy steps */ | 244 | if (nfds > NR_OPEN) |
245 | while (nfds <= nr) { | 245 | nfds = NR_OPEN; |
246 | nfds = nfds * 2; | ||
247 | if (nfds > NR_OPEN) | ||
248 | nfds = NR_OPEN; | ||
249 | } | ||
250 | 246 | ||
251 | new_openset = alloc_fdset(nfds); | 247 | new_openset = alloc_fdset(nfds); |
252 | new_execset = alloc_fdset(nfds); | 248 | new_execset = alloc_fdset(nfds); |
@@ -277,11 +273,13 @@ static struct fdtable *alloc_fdtable(int nr) | |||
277 | } while (nfds <= nr); | 273 | } while (nfds <= nr); |
278 | new_fds = alloc_fd_array(nfds); | 274 | new_fds = alloc_fd_array(nfds); |
279 | if (!new_fds) | 275 | if (!new_fds) |
280 | goto out; | 276 | goto out2; |
281 | fdt->fd = new_fds; | 277 | fdt->fd = new_fds; |
282 | fdt->max_fds = nfds; | 278 | fdt->max_fds = nfds; |
283 | fdt->free_files = NULL; | 279 | fdt->free_files = NULL; |
284 | return fdt; | 280 | return fdt; |
281 | out2: | ||
282 | nfds = fdt->max_fdset; | ||
285 | out: | 283 | out: |
286 | if (new_openset) | 284 | if (new_openset) |
287 | free_fdset(new_openset, nfds); | 285 | free_fdset(new_openset, nfds); |
diff --git a/fs/hugetlbfs/inode.c b/fs/hugetlbfs/inode.c index 6449cb697967..c3920c96dadf 100644 --- a/fs/hugetlbfs/inode.c +++ b/fs/hugetlbfs/inode.c | |||
@@ -83,8 +83,6 @@ static int hugetlbfs_file_mmap(struct file *file, struct vm_area_struct *vma) | |||
83 | 83 | ||
84 | ret = -ENOMEM; | 84 | ret = -ENOMEM; |
85 | len = vma_len + ((loff_t)vma->vm_pgoff << PAGE_SHIFT); | 85 | len = vma_len + ((loff_t)vma->vm_pgoff << PAGE_SHIFT); |
86 | if (!(vma->vm_flags & VM_WRITE) && len > inode->i_size) | ||
87 | goto out; | ||
88 | 86 | ||
89 | if (vma->vm_flags & VM_MAYSHARE && | 87 | if (vma->vm_flags & VM_MAYSHARE && |
90 | hugetlb_reserve_pages(inode, vma->vm_pgoff >> (HPAGE_SHIFT-PAGE_SHIFT), | 88 | hugetlb_reserve_pages(inode, vma->vm_pgoff >> (HPAGE_SHIFT-PAGE_SHIFT), |
@@ -93,7 +91,7 @@ static int hugetlbfs_file_mmap(struct file *file, struct vm_area_struct *vma) | |||
93 | 91 | ||
94 | ret = 0; | 92 | ret = 0; |
95 | hugetlb_prefault_arch_hook(vma->vm_mm); | 93 | hugetlb_prefault_arch_hook(vma->vm_mm); |
96 | if (inode->i_size < len) | 94 | if (vma->vm_flags & VM_WRITE && inode->i_size < len) |
97 | inode->i_size = len; | 95 | inode->i_size = len; |
98 | out: | 96 | out: |
99 | mutex_unlock(&inode->i_mutex); | 97 | mutex_unlock(&inode->i_mutex); |
diff --git a/fs/jfs/jfs_txnmgr.c b/fs/jfs/jfs_txnmgr.c index 10c46231ce15..efbb586bed4b 100644 --- a/fs/jfs/jfs_txnmgr.c +++ b/fs/jfs/jfs_txnmgr.c | |||
@@ -2944,7 +2944,7 @@ int jfs_sync(void *arg) | |||
2944 | * Inode is being freed | 2944 | * Inode is being freed |
2945 | */ | 2945 | */ |
2946 | list_del_init(&jfs_ip->anon_inode_list); | 2946 | list_del_init(&jfs_ip->anon_inode_list); |
2947 | } else if (! !mutex_trylock(&jfs_ip->commit_mutex)) { | 2947 | } else if (mutex_trylock(&jfs_ip->commit_mutex)) { |
2948 | /* | 2948 | /* |
2949 | * inode will be removed from anonymous list | 2949 | * inode will be removed from anonymous list |
2950 | * when it is committed | 2950 | * when it is committed |
diff --git a/fs/jfs/namei.c b/fs/jfs/namei.c index 09ea03f62277..295268ad231b 100644 --- a/fs/jfs/namei.c +++ b/fs/jfs/namei.c | |||
@@ -165,8 +165,8 @@ static int jfs_create(struct inode *dip, struct dentry *dentry, int mode, | |||
165 | 165 | ||
166 | out3: | 166 | out3: |
167 | txEnd(tid); | 167 | txEnd(tid); |
168 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
169 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 168 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
169 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
170 | if (rc) { | 170 | if (rc) { |
171 | free_ea_wmap(ip); | 171 | free_ea_wmap(ip); |
172 | ip->i_nlink = 0; | 172 | ip->i_nlink = 0; |
@@ -300,8 +300,8 @@ static int jfs_mkdir(struct inode *dip, struct dentry *dentry, int mode) | |||
300 | 300 | ||
301 | out3: | 301 | out3: |
302 | txEnd(tid); | 302 | txEnd(tid); |
303 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
304 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 303 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
304 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
305 | if (rc) { | 305 | if (rc) { |
306 | free_ea_wmap(ip); | 306 | free_ea_wmap(ip); |
307 | ip->i_nlink = 0; | 307 | ip->i_nlink = 0; |
@@ -384,8 +384,8 @@ static int jfs_rmdir(struct inode *dip, struct dentry *dentry) | |||
384 | if (rc == -EIO) | 384 | if (rc == -EIO) |
385 | txAbort(tid, 1); | 385 | txAbort(tid, 1); |
386 | txEnd(tid); | 386 | txEnd(tid); |
387 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
388 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 387 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
388 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
389 | 389 | ||
390 | goto out2; | 390 | goto out2; |
391 | } | 391 | } |
@@ -422,8 +422,8 @@ static int jfs_rmdir(struct inode *dip, struct dentry *dentry) | |||
422 | 422 | ||
423 | txEnd(tid); | 423 | txEnd(tid); |
424 | 424 | ||
425 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
426 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 425 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
426 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
427 | 427 | ||
428 | /* | 428 | /* |
429 | * Truncating the directory index table is not guaranteed. It | 429 | * Truncating the directory index table is not guaranteed. It |
@@ -503,8 +503,8 @@ static int jfs_unlink(struct inode *dip, struct dentry *dentry) | |||
503 | if (rc == -EIO) | 503 | if (rc == -EIO) |
504 | txAbort(tid, 1); /* Marks FS Dirty */ | 504 | txAbort(tid, 1); /* Marks FS Dirty */ |
505 | txEnd(tid); | 505 | txEnd(tid); |
506 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
507 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 506 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
507 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
508 | IWRITE_UNLOCK(ip); | 508 | IWRITE_UNLOCK(ip); |
509 | goto out1; | 509 | goto out1; |
510 | } | 510 | } |
@@ -527,8 +527,8 @@ static int jfs_unlink(struct inode *dip, struct dentry *dentry) | |||
527 | if ((new_size = commitZeroLink(tid, ip)) < 0) { | 527 | if ((new_size = commitZeroLink(tid, ip)) < 0) { |
528 | txAbort(tid, 1); /* Marks FS Dirty */ | 528 | txAbort(tid, 1); /* Marks FS Dirty */ |
529 | txEnd(tid); | 529 | txEnd(tid); |
530 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
531 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 530 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
531 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
532 | IWRITE_UNLOCK(ip); | 532 | IWRITE_UNLOCK(ip); |
533 | rc = new_size; | 533 | rc = new_size; |
534 | goto out1; | 534 | goto out1; |
@@ -556,9 +556,8 @@ static int jfs_unlink(struct inode *dip, struct dentry *dentry) | |||
556 | 556 | ||
557 | txEnd(tid); | 557 | txEnd(tid); |
558 | 558 | ||
559 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
560 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 559 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
561 | 560 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | |
562 | 561 | ||
563 | while (new_size && (rc == 0)) { | 562 | while (new_size && (rc == 0)) { |
564 | tid = txBegin(dip->i_sb, 0); | 563 | tid = txBegin(dip->i_sb, 0); |
@@ -847,8 +846,8 @@ static int jfs_link(struct dentry *old_dentry, | |||
847 | out: | 846 | out: |
848 | txEnd(tid); | 847 | txEnd(tid); |
849 | 848 | ||
850 | mutex_unlock(&JFS_IP(dir)->commit_mutex); | ||
851 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 849 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
850 | mutex_unlock(&JFS_IP(dir)->commit_mutex); | ||
852 | 851 | ||
853 | jfs_info("jfs_link: rc:%d", rc); | 852 | jfs_info("jfs_link: rc:%d", rc); |
854 | return rc; | 853 | return rc; |
@@ -1037,8 +1036,8 @@ static int jfs_symlink(struct inode *dip, struct dentry *dentry, | |||
1037 | 1036 | ||
1038 | out3: | 1037 | out3: |
1039 | txEnd(tid); | 1038 | txEnd(tid); |
1040 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
1041 | mutex_unlock(&JFS_IP(ip)->commit_mutex); | 1039 | mutex_unlock(&JFS_IP(ip)->commit_mutex); |
1040 | mutex_unlock(&JFS_IP(dip)->commit_mutex); | ||
1042 | if (rc) { | 1041 | if (rc) { |
1043 | free_ea_wmap(ip); | 1042 | free_ea_wmap(ip); |
1044 | ip->i_nlink = 0; | 1043 | ip->i_nlink = 0; |
@@ -1160,10 +1159,11 @@ static int jfs_rename(struct inode *old_dir, struct dentry *old_dentry, | |||
1160 | if (S_ISDIR(new_ip->i_mode)) { | 1159 | if (S_ISDIR(new_ip->i_mode)) { |
1161 | new_ip->i_nlink--; | 1160 | new_ip->i_nlink--; |
1162 | if (new_ip->i_nlink) { | 1161 | if (new_ip->i_nlink) { |
1163 | mutex_unlock(&JFS_IP(new_dir)->commit_mutex); | 1162 | mutex_unlock(&JFS_IP(new_ip)->commit_mutex); |
1164 | mutex_unlock(&JFS_IP(old_ip)->commit_mutex); | ||
1165 | if (old_dir != new_dir) | 1163 | if (old_dir != new_dir) |
1166 | mutex_unlock(&JFS_IP(old_dir)->commit_mutex); | 1164 | mutex_unlock(&JFS_IP(old_dir)->commit_mutex); |
1165 | mutex_unlock(&JFS_IP(old_ip)->commit_mutex); | ||
1166 | mutex_unlock(&JFS_IP(new_dir)->commit_mutex); | ||
1167 | if (!S_ISDIR(old_ip->i_mode) && new_ip) | 1167 | if (!S_ISDIR(old_ip->i_mode) && new_ip) |
1168 | IWRITE_UNLOCK(new_ip); | 1168 | IWRITE_UNLOCK(new_ip); |
1169 | jfs_error(new_ip->i_sb, | 1169 | jfs_error(new_ip->i_sb, |
@@ -1281,13 +1281,12 @@ static int jfs_rename(struct inode *old_dir, struct dentry *old_dentry, | |||
1281 | 1281 | ||
1282 | out4: | 1282 | out4: |
1283 | txEnd(tid); | 1283 | txEnd(tid); |
1284 | |||
1285 | mutex_unlock(&JFS_IP(new_dir)->commit_mutex); | ||
1286 | mutex_unlock(&JFS_IP(old_ip)->commit_mutex); | ||
1287 | if (old_dir != new_dir) | ||
1288 | mutex_unlock(&JFS_IP(old_dir)->commit_mutex); | ||
1289 | if (new_ip) | 1284 | if (new_ip) |
1290 | mutex_unlock(&JFS_IP(new_ip)->commit_mutex); | 1285 | mutex_unlock(&JFS_IP(new_ip)->commit_mutex); |
1286 | if (old_dir != new_dir) | ||
1287 | mutex_unlock(&JFS_IP(old_dir)->commit_mutex); | ||
1288 | mutex_unlock(&JFS_IP(old_ip)->commit_mutex); | ||
1289 | mutex_unlock(&JFS_IP(new_dir)->commit_mutex); | ||
1291 | 1290 | ||
1292 | while (new_size && (rc == 0)) { | 1291 | while (new_size && (rc == 0)) { |
1293 | tid = txBegin(new_ip->i_sb, 0); | 1292 | tid = txBegin(new_ip->i_sb, 0); |
diff --git a/fs/namei.c b/fs/namei.c index c9750d755aff..e01070d7bf58 100644 --- a/fs/namei.c +++ b/fs/namei.c | |||
@@ -1712,8 +1712,14 @@ do_link: | |||
1712 | if (error) | 1712 | if (error) |
1713 | goto exit_dput; | 1713 | goto exit_dput; |
1714 | error = __do_follow_link(&path, nd); | 1714 | error = __do_follow_link(&path, nd); |
1715 | if (error) | 1715 | if (error) { |
1716 | /* Does someone understand code flow here? Or it is only | ||
1717 | * me so stupid? Anathema to whoever designed this non-sense | ||
1718 | * with "intent.open". | ||
1719 | */ | ||
1720 | release_open_intent(nd); | ||
1716 | return error; | 1721 | return error; |
1722 | } | ||
1717 | nd->flags &= ~LOOKUP_PARENT; | 1723 | nd->flags &= ~LOOKUP_PARENT; |
1718 | if (nd->last_type == LAST_BIND) | 1724 | if (nd->last_type == LAST_BIND) |
1719 | goto ok; | 1725 | goto ok; |
diff --git a/fs/nfsd/nfs4proc.c b/fs/nfsd/nfs4proc.c index b0e095ea0c03..ee4eff27aedc 100644 --- a/fs/nfsd/nfs4proc.c +++ b/fs/nfsd/nfs4proc.c | |||
@@ -721,6 +721,12 @@ nfsd4_proc_null(struct svc_rqst *rqstp, void *argp, void *resp) | |||
721 | return nfs_ok; | 721 | return nfs_ok; |
722 | } | 722 | } |
723 | 723 | ||
724 | static inline void nfsd4_increment_op_stats(u32 opnum) | ||
725 | { | ||
726 | if (opnum >= FIRST_NFS4_OP && opnum <= LAST_NFS4_OP) | ||
727 | nfsdstats.nfs4_opcount[opnum]++; | ||
728 | } | ||
729 | |||
724 | 730 | ||
725 | /* | 731 | /* |
726 | * COMPOUND call. | 732 | * COMPOUND call. |
@@ -930,6 +936,8 @@ encode_op: | |||
930 | /* XXX Ugh, we need to get rid of this kind of special case: */ | 936 | /* XXX Ugh, we need to get rid of this kind of special case: */ |
931 | if (op->opnum == OP_READ && op->u.read.rd_filp) | 937 | if (op->opnum == OP_READ && op->u.read.rd_filp) |
932 | fput(op->u.read.rd_filp); | 938 | fput(op->u.read.rd_filp); |
939 | |||
940 | nfsd4_increment_op_stats(op->opnum); | ||
933 | } | 941 | } |
934 | 942 | ||
935 | out: | 943 | out: |
diff --git a/fs/nfsd/stats.c b/fs/nfsd/stats.c index 57265d563804..71944cddf680 100644 --- a/fs/nfsd/stats.c +++ b/fs/nfsd/stats.c | |||
@@ -72,6 +72,16 @@ static int nfsd_proc_show(struct seq_file *seq, void *v) | |||
72 | /* show my rpc info */ | 72 | /* show my rpc info */ |
73 | svc_seq_show(seq, &nfsd_svcstats); | 73 | svc_seq_show(seq, &nfsd_svcstats); |
74 | 74 | ||
75 | #ifdef CONFIG_NFSD_V4 | ||
76 | /* Show count for individual nfsv4 operations */ | ||
77 | /* Writing operation numbers 0 1 2 also for maintaining uniformity */ | ||
78 | seq_printf(seq,"proc4ops %u", LAST_NFS4_OP + 1); | ||
79 | for (i = 0; i <= LAST_NFS4_OP; i++) | ||
80 | seq_printf(seq, " %u", nfsdstats.nfs4_opcount[i]); | ||
81 | |||
82 | seq_putc(seq, '\n'); | ||
83 | #endif | ||
84 | |||
75 | return 0; | 85 | return 0; |
76 | } | 86 | } |
77 | 87 | ||
diff --git a/fs/partitions/check.c b/fs/partitions/check.c index 839634026eb5..51c6a748df49 100644 --- a/fs/partitions/check.c +++ b/fs/partitions/check.c | |||
@@ -339,6 +339,7 @@ void add_partition(struct gendisk *disk, int part, sector_t start, sector_t len) | |||
339 | p->start_sect = start; | 339 | p->start_sect = start; |
340 | p->nr_sects = len; | 340 | p->nr_sects = len; |
341 | p->partno = part; | 341 | p->partno = part; |
342 | p->policy = disk->policy; | ||
342 | 343 | ||
343 | if (isdigit(disk->kobj.name[strlen(disk->kobj.name)-1])) | 344 | if (isdigit(disk->kobj.name[strlen(disk->kobj.name)-1])) |
344 | snprintf(p->kobj.name,KOBJ_NAME_LEN,"%sp%d",disk->kobj.name,part); | 345 | snprintf(p->kobj.name,KOBJ_NAME_LEN,"%sp%d",disk->kobj.name,part); |
diff --git a/fs/proc/array.c b/fs/proc/array.c index 7495d3e20775..0b615d62a159 100644 --- a/fs/proc/array.c +++ b/fs/proc/array.c | |||
@@ -74,6 +74,7 @@ | |||
74 | #include <linux/times.h> | 74 | #include <linux/times.h> |
75 | #include <linux/cpuset.h> | 75 | #include <linux/cpuset.h> |
76 | #include <linux/rcupdate.h> | 76 | #include <linux/rcupdate.h> |
77 | #include <linux/delayacct.h> | ||
77 | 78 | ||
78 | #include <asm/uaccess.h> | 79 | #include <asm/uaccess.h> |
79 | #include <asm/pgtable.h> | 80 | #include <asm/pgtable.h> |
@@ -411,7 +412,7 @@ static int do_task_stat(struct task_struct *task, char * buffer, int whole) | |||
411 | 412 | ||
412 | res = sprintf(buffer,"%d (%s) %c %d %d %d %d %d %lu %lu \ | 413 | res = sprintf(buffer,"%d (%s) %c %d %d %d %d %d %lu %lu \ |
413 | %lu %lu %lu %lu %lu %ld %ld %ld %ld %d 0 %llu %lu %ld %lu %lu %lu %lu %lu \ | 414 | %lu %lu %lu %lu %lu %ld %ld %ld %ld %d 0 %llu %lu %ld %lu %lu %lu %lu %lu \ |
414 | %lu %lu %lu %lu %lu %lu %lu %lu %d %d %lu %lu\n", | 415 | %lu %lu %lu %lu %lu %lu %lu %lu %d %d %lu %lu %llu\n", |
415 | task->pid, | 416 | task->pid, |
416 | tcomm, | 417 | tcomm, |
417 | state, | 418 | state, |
@@ -455,7 +456,8 @@ static int do_task_stat(struct task_struct *task, char * buffer, int whole) | |||
455 | task->exit_signal, | 456 | task->exit_signal, |
456 | task_cpu(task), | 457 | task_cpu(task), |
457 | task->rt_priority, | 458 | task->rt_priority, |
458 | task->policy); | 459 | task->policy, |
460 | (unsigned long long)delayacct_blkio_ticks(task)); | ||
459 | if(mm) | 461 | if(mm) |
460 | mmput(mm); | 462 | mmput(mm); |
461 | return res; | 463 | return res; |
diff --git a/fs/proc/base.c b/fs/proc/base.c index 243a94af0427..fe8d55fb17cc 100644 --- a/fs/proc/base.c +++ b/fs/proc/base.c | |||
@@ -551,6 +551,27 @@ static int proc_fd_access_allowed(struct inode *inode) | |||
551 | return allowed; | 551 | return allowed; |
552 | } | 552 | } |
553 | 553 | ||
554 | static int proc_setattr(struct dentry *dentry, struct iattr *attr) | ||
555 | { | ||
556 | int error; | ||
557 | struct inode *inode = dentry->d_inode; | ||
558 | |||
559 | if (attr->ia_valid & ATTR_MODE) | ||
560 | return -EPERM; | ||
561 | |||
562 | error = inode_change_ok(inode, attr); | ||
563 | if (!error) { | ||
564 | error = security_inode_setattr(dentry, attr); | ||
565 | if (!error) | ||
566 | error = inode_setattr(inode, attr); | ||
567 | } | ||
568 | return error; | ||
569 | } | ||
570 | |||
571 | static struct inode_operations proc_def_inode_operations = { | ||
572 | .setattr = proc_setattr, | ||
573 | }; | ||
574 | |||
554 | extern struct seq_operations mounts_op; | 575 | extern struct seq_operations mounts_op; |
555 | struct proc_mounts { | 576 | struct proc_mounts { |
556 | struct seq_file m; | 577 | struct seq_file m; |
@@ -1111,7 +1132,8 @@ out: | |||
1111 | 1132 | ||
1112 | static struct inode_operations proc_pid_link_inode_operations = { | 1133 | static struct inode_operations proc_pid_link_inode_operations = { |
1113 | .readlink = proc_pid_readlink, | 1134 | .readlink = proc_pid_readlink, |
1114 | .follow_link = proc_pid_follow_link | 1135 | .follow_link = proc_pid_follow_link, |
1136 | .setattr = proc_setattr, | ||
1115 | }; | 1137 | }; |
1116 | 1138 | ||
1117 | static int proc_readfd(struct file * filp, void * dirent, filldir_t filldir) | 1139 | static int proc_readfd(struct file * filp, void * dirent, filldir_t filldir) |
@@ -1285,6 +1307,7 @@ static struct inode *proc_pid_make_inode(struct super_block * sb, struct task_st | |||
1285 | ei = PROC_I(inode); | 1307 | ei = PROC_I(inode); |
1286 | inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME; | 1308 | inode->i_mtime = inode->i_atime = inode->i_ctime = CURRENT_TIME; |
1287 | inode->i_ino = fake_ino(task->pid, ino); | 1309 | inode->i_ino = fake_ino(task->pid, ino); |
1310 | inode->i_op = &proc_def_inode_operations; | ||
1288 | 1311 | ||
1289 | /* | 1312 | /* |
1290 | * grab the reference to task. | 1313 | * grab the reference to task. |
@@ -1339,6 +1362,7 @@ static int pid_revalidate(struct dentry *dentry, struct nameidata *nd) | |||
1339 | inode->i_uid = 0; | 1362 | inode->i_uid = 0; |
1340 | inode->i_gid = 0; | 1363 | inode->i_gid = 0; |
1341 | } | 1364 | } |
1365 | inode->i_mode &= ~(S_ISUID | S_ISGID); | ||
1342 | security_task_to_inode(task, inode); | 1366 | security_task_to_inode(task, inode); |
1343 | put_task_struct(task); | 1367 | put_task_struct(task); |
1344 | return 1; | 1368 | return 1; |
@@ -1389,6 +1413,7 @@ static int tid_fd_revalidate(struct dentry *dentry, struct nameidata *nd) | |||
1389 | inode->i_uid = 0; | 1413 | inode->i_uid = 0; |
1390 | inode->i_gid = 0; | 1414 | inode->i_gid = 0; |
1391 | } | 1415 | } |
1416 | inode->i_mode &= ~(S_ISUID | S_ISGID); | ||
1392 | security_task_to_inode(task, inode); | 1417 | security_task_to_inode(task, inode); |
1393 | put_task_struct(task); | 1418 | put_task_struct(task); |
1394 | return 1; | 1419 | return 1; |
@@ -1527,11 +1552,13 @@ static struct file_operations proc_task_operations = { | |||
1527 | */ | 1552 | */ |
1528 | static struct inode_operations proc_fd_inode_operations = { | 1553 | static struct inode_operations proc_fd_inode_operations = { |
1529 | .lookup = proc_lookupfd, | 1554 | .lookup = proc_lookupfd, |
1555 | .setattr = proc_setattr, | ||
1530 | }; | 1556 | }; |
1531 | 1557 | ||
1532 | static struct inode_operations proc_task_inode_operations = { | 1558 | static struct inode_operations proc_task_inode_operations = { |
1533 | .lookup = proc_task_lookup, | 1559 | .lookup = proc_task_lookup, |
1534 | .getattr = proc_task_getattr, | 1560 | .getattr = proc_task_getattr, |
1561 | .setattr = proc_setattr, | ||
1535 | }; | 1562 | }; |
1536 | 1563 | ||
1537 | #ifdef CONFIG_SECURITY | 1564 | #ifdef CONFIG_SECURITY |
@@ -1845,11 +1872,13 @@ static struct file_operations proc_tid_base_operations = { | |||
1845 | static struct inode_operations proc_tgid_base_inode_operations = { | 1872 | static struct inode_operations proc_tgid_base_inode_operations = { |
1846 | .lookup = proc_tgid_base_lookup, | 1873 | .lookup = proc_tgid_base_lookup, |
1847 | .getattr = pid_getattr, | 1874 | .getattr = pid_getattr, |
1875 | .setattr = proc_setattr, | ||
1848 | }; | 1876 | }; |
1849 | 1877 | ||
1850 | static struct inode_operations proc_tid_base_inode_operations = { | 1878 | static struct inode_operations proc_tid_base_inode_operations = { |
1851 | .lookup = proc_tid_base_lookup, | 1879 | .lookup = proc_tid_base_lookup, |
1852 | .getattr = pid_getattr, | 1880 | .getattr = pid_getattr, |
1881 | .setattr = proc_setattr, | ||
1853 | }; | 1882 | }; |
1854 | 1883 | ||
1855 | #ifdef CONFIG_SECURITY | 1884 | #ifdef CONFIG_SECURITY |
@@ -1892,11 +1921,13 @@ static struct dentry *proc_tid_attr_lookup(struct inode *dir, | |||
1892 | static struct inode_operations proc_tgid_attr_inode_operations = { | 1921 | static struct inode_operations proc_tgid_attr_inode_operations = { |
1893 | .lookup = proc_tgid_attr_lookup, | 1922 | .lookup = proc_tgid_attr_lookup, |
1894 | .getattr = pid_getattr, | 1923 | .getattr = pid_getattr, |
1924 | .setattr = proc_setattr, | ||
1895 | }; | 1925 | }; |
1896 | 1926 | ||
1897 | static struct inode_operations proc_tid_attr_inode_operations = { | 1927 | static struct inode_operations proc_tid_attr_inode_operations = { |
1898 | .lookup = proc_tid_attr_lookup, | 1928 | .lookup = proc_tid_attr_lookup, |
1899 | .getattr = pid_getattr, | 1929 | .getattr = pid_getattr, |
1930 | .setattr = proc_setattr, | ||
1900 | }; | 1931 | }; |
1901 | #endif | 1932 | #endif |
1902 | 1933 | ||
diff --git a/fs/proc/inode.c b/fs/proc/inode.c index 6dcef089e18e..49dfb2ab783e 100644 --- a/fs/proc/inode.c +++ b/fs/proc/inode.c | |||
@@ -192,7 +192,7 @@ int proc_fill_super(struct super_block *s, void *data, int silent) | |||
192 | { | 192 | { |
193 | struct inode * root_inode; | 193 | struct inode * root_inode; |
194 | 194 | ||
195 | s->s_flags |= MS_NODIRATIME; | 195 | s->s_flags |= MS_NODIRATIME | MS_NOSUID | MS_NOEXEC; |
196 | s->s_blocksize = 1024; | 196 | s->s_blocksize = 1024; |
197 | s->s_blocksize_bits = 10; | 197 | s->s_blocksize_bits = 10; |
198 | s->s_magic = PROC_SUPER_MAGIC; | 198 | s->s_magic = PROC_SUPER_MAGIC; |
diff --git a/fs/proc/kcore.c b/fs/proc/kcore.c index 036d14d83627..6a984f64edd7 100644 --- a/fs/proc/kcore.c +++ b/fs/proc/kcore.c | |||
@@ -42,8 +42,6 @@ const struct file_operations proc_kcore_operations = { | |||
42 | #define kc_offset_to_vaddr(o) ((o) + PAGE_OFFSET) | 42 | #define kc_offset_to_vaddr(o) ((o) + PAGE_OFFSET) |
43 | #endif | 43 | #endif |
44 | 44 | ||
45 | #define roundup(x, y) ((((x)+((y)-1))/(y))*(y)) | ||
46 | |||
47 | /* An ELF note in memory */ | 45 | /* An ELF note in memory */ |
48 | struct memelfnote | 46 | struct memelfnote |
49 | { | 47 | { |
@@ -384,7 +382,7 @@ read_kcore(struct file *file, char __user *buffer, size_t buflen, loff_t *fpos) | |||
384 | */ | 382 | */ |
385 | if (n) { | 383 | if (n) { |
386 | if (clear_user(buffer + tsz - n, | 384 | if (clear_user(buffer + tsz - n, |
387 | tsz - n)) | 385 | n)) |
388 | return -EFAULT; | 386 | return -EFAULT; |
389 | } | 387 | } |
390 | } else { | 388 | } else { |
diff --git a/fs/ramfs/file-nommu.c b/fs/ramfs/file-nommu.c index 99fffc9e1bfd..677139b48e00 100644 --- a/fs/ramfs/file-nommu.c +++ b/fs/ramfs/file-nommu.c | |||
@@ -283,9 +283,9 @@ unsigned long ramfs_nommu_get_unmapped_area(struct file *file, | |||
283 | 283 | ||
284 | /*****************************************************************************/ | 284 | /*****************************************************************************/ |
285 | /* | 285 | /* |
286 | * set up a mapping | 286 | * set up a mapping for shared memory segments |
287 | */ | 287 | */ |
288 | int ramfs_nommu_mmap(struct file *file, struct vm_area_struct *vma) | 288 | int ramfs_nommu_mmap(struct file *file, struct vm_area_struct *vma) |
289 | { | 289 | { |
290 | return 0; | 290 | return vma->vm_flags & VM_SHARED ? 0 : -ENOSYS; |
291 | } | 291 | } |
diff --git a/fs/read_write.c b/fs/read_write.c index 5bc0e9234f9d..d4cb3183c99c 100644 --- a/fs/read_write.c +++ b/fs/read_write.c | |||
@@ -436,7 +436,7 @@ unsigned long iov_shorten(struct iovec *iov, unsigned long nr_segs, size_t to) | |||
436 | return seg; | 436 | return seg; |
437 | } | 437 | } |
438 | 438 | ||
439 | EXPORT_SYMBOL(iov_shorten); | 439 | EXPORT_UNUSED_SYMBOL(iov_shorten); /* June 2006 */ |
440 | 440 | ||
441 | /* A write operation does a read from user space and vice versa */ | 441 | /* A write operation does a read from user space and vice versa */ |
442 | #define vrfy_dir(type) ((type) == READ ? VERIFY_WRITE : VERIFY_READ) | 442 | #define vrfy_dir(type) ((type) == READ ? VERIFY_WRITE : VERIFY_READ) |
diff --git a/fs/reiserfs/file.c b/fs/reiserfs/file.c index 752cea12e30f..f318b58510fd 100644 --- a/fs/reiserfs/file.c +++ b/fs/reiserfs/file.c | |||
@@ -860,8 +860,12 @@ static int reiserfs_submit_file_region_for_write(struct reiserfs_transaction_han | |||
860 | // this sets the proper flags for O_SYNC to trigger a commit | 860 | // this sets the proper flags for O_SYNC to trigger a commit |
861 | mark_inode_dirty(inode); | 861 | mark_inode_dirty(inode); |
862 | reiserfs_write_unlock(inode->i_sb); | 862 | reiserfs_write_unlock(inode->i_sb); |
863 | } else | 863 | } else { |
864 | reiserfs_write_lock(inode->i_sb); | ||
865 | reiserfs_update_inode_transaction(inode); | ||
864 | mark_inode_dirty(inode); | 866 | mark_inode_dirty(inode); |
867 | reiserfs_write_unlock(inode->i_sb); | ||
868 | } | ||
865 | 869 | ||
866 | sd_update = 1; | 870 | sd_update = 1; |
867 | } | 871 | } |
diff --git a/fs/reiserfs/procfs.c b/fs/reiserfs/procfs.c index 5d8a8cfebc70..c533ec1bcaec 100644 --- a/fs/reiserfs/procfs.c +++ b/fs/reiserfs/procfs.c | |||
@@ -492,9 +492,17 @@ static void add_file(struct super_block *sb, char *name, | |||
492 | 492 | ||
493 | int reiserfs_proc_info_init(struct super_block *sb) | 493 | int reiserfs_proc_info_init(struct super_block *sb) |
494 | { | 494 | { |
495 | char b[BDEVNAME_SIZE]; | ||
496 | char *s; | ||
497 | |||
498 | /* Some block devices use /'s */ | ||
499 | strlcpy(b, reiserfs_bdevname(sb), BDEVNAME_SIZE); | ||
500 | s = strchr(b, '/'); | ||
501 | if (s) | ||
502 | *s = '!'; | ||
503 | |||
495 | spin_lock_init(&__PINFO(sb).lock); | 504 | spin_lock_init(&__PINFO(sb).lock); |
496 | REISERFS_SB(sb)->procdir = | 505 | REISERFS_SB(sb)->procdir = proc_mkdir(b, proc_info_root); |
497 | proc_mkdir(reiserfs_bdevname(sb), proc_info_root); | ||
498 | if (REISERFS_SB(sb)->procdir) { | 506 | if (REISERFS_SB(sb)->procdir) { |
499 | REISERFS_SB(sb)->procdir->owner = THIS_MODULE; | 507 | REISERFS_SB(sb)->procdir->owner = THIS_MODULE; |
500 | REISERFS_SB(sb)->procdir->data = sb; | 508 | REISERFS_SB(sb)->procdir->data = sb; |
@@ -508,13 +516,22 @@ int reiserfs_proc_info_init(struct super_block *sb) | |||
508 | return 0; | 516 | return 0; |
509 | } | 517 | } |
510 | reiserfs_warning(sb, "reiserfs: cannot create /proc/%s/%s", | 518 | reiserfs_warning(sb, "reiserfs: cannot create /proc/%s/%s", |
511 | proc_info_root_name, reiserfs_bdevname(sb)); | 519 | proc_info_root_name, b); |
512 | return 1; | 520 | return 1; |
513 | } | 521 | } |
514 | 522 | ||
515 | int reiserfs_proc_info_done(struct super_block *sb) | 523 | int reiserfs_proc_info_done(struct super_block *sb) |
516 | { | 524 | { |
517 | struct proc_dir_entry *de = REISERFS_SB(sb)->procdir; | 525 | struct proc_dir_entry *de = REISERFS_SB(sb)->procdir; |
526 | char b[BDEVNAME_SIZE]; | ||
527 | char *s; | ||
528 | |||
529 | /* Some block devices use /'s */ | ||
530 | strlcpy(b, reiserfs_bdevname(sb), BDEVNAME_SIZE); | ||
531 | s = strchr(b, '/'); | ||
532 | if (s) | ||
533 | *s = '!'; | ||
534 | |||
518 | if (de) { | 535 | if (de) { |
519 | remove_proc_entry("journal", de); | 536 | remove_proc_entry("journal", de); |
520 | remove_proc_entry("oidmap", de); | 537 | remove_proc_entry("oidmap", de); |
@@ -528,7 +545,7 @@ int reiserfs_proc_info_done(struct super_block *sb) | |||
528 | __PINFO(sb).exiting = 1; | 545 | __PINFO(sb).exiting = 1; |
529 | spin_unlock(&__PINFO(sb).lock); | 546 | spin_unlock(&__PINFO(sb).lock); |
530 | if (proc_info_root) { | 547 | if (proc_info_root) { |
531 | remove_proc_entry(reiserfs_bdevname(sb), proc_info_root); | 548 | remove_proc_entry(b, proc_info_root); |
532 | REISERFS_SB(sb)->procdir = NULL; | 549 | REISERFS_SB(sb)->procdir = NULL; |
533 | } | 550 | } |
534 | return 0; | 551 | return 0; |
diff --git a/fs/splice.c b/fs/splice.c index 05fd2787be98..684bca3d3a10 100644 --- a/fs/splice.c +++ b/fs/splice.c | |||
@@ -1307,6 +1307,85 @@ asmlinkage long sys_splice(int fd_in, loff_t __user *off_in, | |||
1307 | } | 1307 | } |
1308 | 1308 | ||
1309 | /* | 1309 | /* |
1310 | * Make sure there's data to read. Wait for input if we can, otherwise | ||
1311 | * return an appropriate error. | ||
1312 | */ | ||
1313 | static int link_ipipe_prep(struct pipe_inode_info *pipe, unsigned int flags) | ||
1314 | { | ||
1315 | int ret; | ||
1316 | |||
1317 | /* | ||
1318 | * Check ->nrbufs without the inode lock first. This function | ||
1319 | * is speculative anyways, so missing one is ok. | ||
1320 | */ | ||
1321 | if (pipe->nrbufs) | ||
1322 | return 0; | ||
1323 | |||
1324 | ret = 0; | ||
1325 | mutex_lock(&pipe->inode->i_mutex); | ||
1326 | |||
1327 | while (!pipe->nrbufs) { | ||
1328 | if (signal_pending(current)) { | ||
1329 | ret = -ERESTARTSYS; | ||
1330 | break; | ||
1331 | } | ||
1332 | if (!pipe->writers) | ||
1333 | break; | ||
1334 | if (!pipe->waiting_writers) { | ||
1335 | if (flags & SPLICE_F_NONBLOCK) { | ||
1336 | ret = -EAGAIN; | ||
1337 | break; | ||
1338 | } | ||
1339 | } | ||
1340 | pipe_wait(pipe); | ||
1341 | } | ||
1342 | |||
1343 | mutex_unlock(&pipe->inode->i_mutex); | ||
1344 | return ret; | ||
1345 | } | ||
1346 | |||
1347 | /* | ||
1348 | * Make sure there's writeable room. Wait for room if we can, otherwise | ||
1349 | * return an appropriate error. | ||
1350 | */ | ||
1351 | static int link_opipe_prep(struct pipe_inode_info *pipe, unsigned int flags) | ||
1352 | { | ||
1353 | int ret; | ||
1354 | |||
1355 | /* | ||
1356 | * Check ->nrbufs without the inode lock first. This function | ||
1357 | * is speculative anyways, so missing one is ok. | ||
1358 | */ | ||
1359 | if (pipe->nrbufs < PIPE_BUFFERS) | ||
1360 | return 0; | ||
1361 | |||
1362 | ret = 0; | ||
1363 | mutex_lock(&pipe->inode->i_mutex); | ||
1364 | |||
1365 | while (pipe->nrbufs >= PIPE_BUFFERS) { | ||
1366 | if (!pipe->readers) { | ||
1367 | send_sig(SIGPIPE, current, 0); | ||
1368 | ret = -EPIPE; | ||
1369 | break; | ||
1370 | } | ||
1371 | if (flags & SPLICE_F_NONBLOCK) { | ||
1372 | ret = -EAGAIN; | ||
1373 | break; | ||
1374 | } | ||
1375 | if (signal_pending(current)) { | ||
1376 | ret = -ERESTARTSYS; | ||
1377 | break; | ||
1378 | } | ||
1379 | pipe->waiting_writers++; | ||
1380 | pipe_wait(pipe); | ||
1381 | pipe->waiting_writers--; | ||
1382 | } | ||
1383 | |||
1384 | mutex_unlock(&pipe->inode->i_mutex); | ||
1385 | return ret; | ||
1386 | } | ||
1387 | |||
1388 | /* | ||
1310 | * Link contents of ipipe to opipe. | 1389 | * Link contents of ipipe to opipe. |
1311 | */ | 1390 | */ |
1312 | static int link_pipe(struct pipe_inode_info *ipipe, | 1391 | static int link_pipe(struct pipe_inode_info *ipipe, |
@@ -1314,9 +1393,7 @@ static int link_pipe(struct pipe_inode_info *ipipe, | |||
1314 | size_t len, unsigned int flags) | 1393 | size_t len, unsigned int flags) |
1315 | { | 1394 | { |
1316 | struct pipe_buffer *ibuf, *obuf; | 1395 | struct pipe_buffer *ibuf, *obuf; |
1317 | int ret, do_wakeup, i, ipipe_first; | 1396 | int ret = 0, i = 0, nbuf; |
1318 | |||
1319 | ret = do_wakeup = ipipe_first = 0; | ||
1320 | 1397 | ||
1321 | /* | 1398 | /* |
1322 | * Potential ABBA deadlock, work around it by ordering lock | 1399 | * Potential ABBA deadlock, work around it by ordering lock |
@@ -1324,126 +1401,62 @@ static int link_pipe(struct pipe_inode_info *ipipe, | |||
1324 | * could deadlock (one doing tee from A -> B, the other from B -> A). | 1401 | * could deadlock (one doing tee from A -> B, the other from B -> A). |
1325 | */ | 1402 | */ |
1326 | if (ipipe->inode < opipe->inode) { | 1403 | if (ipipe->inode < opipe->inode) { |
1327 | ipipe_first = 1; | 1404 | mutex_lock_nested(&ipipe->inode->i_mutex, I_MUTEX_PARENT); |
1328 | mutex_lock(&ipipe->inode->i_mutex); | 1405 | mutex_lock_nested(&opipe->inode->i_mutex, I_MUTEX_CHILD); |
1329 | mutex_lock(&opipe->inode->i_mutex); | ||
1330 | } else { | 1406 | } else { |
1331 | mutex_lock(&opipe->inode->i_mutex); | 1407 | mutex_lock_nested(&opipe->inode->i_mutex, I_MUTEX_PARENT); |
1332 | mutex_lock(&ipipe->inode->i_mutex); | 1408 | mutex_lock_nested(&ipipe->inode->i_mutex, I_MUTEX_CHILD); |
1333 | } | 1409 | } |
1334 | 1410 | ||
1335 | for (i = 0;; i++) { | 1411 | do { |
1336 | if (!opipe->readers) { | 1412 | if (!opipe->readers) { |
1337 | send_sig(SIGPIPE, current, 0); | 1413 | send_sig(SIGPIPE, current, 0); |
1338 | if (!ret) | 1414 | if (!ret) |
1339 | ret = -EPIPE; | 1415 | ret = -EPIPE; |
1340 | break; | 1416 | break; |
1341 | } | 1417 | } |
1342 | if (ipipe->nrbufs - i) { | ||
1343 | ibuf = ipipe->bufs + ((ipipe->curbuf + i) & (PIPE_BUFFERS - 1)); | ||
1344 | 1418 | ||
1345 | /* | 1419 | /* |
1346 | * If we have room, fill this buffer | 1420 | * If we have iterated all input buffers or ran out of |
1347 | */ | 1421 | * output room, break. |
1348 | if (opipe->nrbufs < PIPE_BUFFERS) { | 1422 | */ |
1349 | int nbuf = (opipe->curbuf + opipe->nrbufs) & (PIPE_BUFFERS - 1); | 1423 | if (i >= ipipe->nrbufs || opipe->nrbufs >= PIPE_BUFFERS) |
1350 | 1424 | break; | |
1351 | /* | ||
1352 | * Get a reference to this pipe buffer, | ||
1353 | * so we can copy the contents over. | ||
1354 | */ | ||
1355 | ibuf->ops->get(ipipe, ibuf); | ||
1356 | |||
1357 | obuf = opipe->bufs + nbuf; | ||
1358 | *obuf = *ibuf; | ||
1359 | |||
1360 | /* | ||
1361 | * Don't inherit the gift flag, we need to | ||
1362 | * prevent multiple steals of this page. | ||
1363 | */ | ||
1364 | obuf->flags &= ~PIPE_BUF_FLAG_GIFT; | ||
1365 | |||
1366 | if (obuf->len > len) | ||
1367 | obuf->len = len; | ||
1368 | |||
1369 | opipe->nrbufs++; | ||
1370 | do_wakeup = 1; | ||
1371 | ret += obuf->len; | ||
1372 | len -= obuf->len; | ||
1373 | |||
1374 | if (!len) | ||
1375 | break; | ||
1376 | if (opipe->nrbufs < PIPE_BUFFERS) | ||
1377 | continue; | ||
1378 | } | ||
1379 | |||
1380 | /* | ||
1381 | * We have input available, but no output room. | ||
1382 | * If we already copied data, return that. If we | ||
1383 | * need to drop the opipe lock, it must be ordered | ||
1384 | * last to avoid deadlocks. | ||
1385 | */ | ||
1386 | if ((flags & SPLICE_F_NONBLOCK) || !ipipe_first) { | ||
1387 | if (!ret) | ||
1388 | ret = -EAGAIN; | ||
1389 | break; | ||
1390 | } | ||
1391 | if (signal_pending(current)) { | ||
1392 | if (!ret) | ||
1393 | ret = -ERESTARTSYS; | ||
1394 | break; | ||
1395 | } | ||
1396 | if (do_wakeup) { | ||
1397 | smp_mb(); | ||
1398 | if (waitqueue_active(&opipe->wait)) | ||
1399 | wake_up_interruptible(&opipe->wait); | ||
1400 | kill_fasync(&opipe->fasync_readers, SIGIO, POLL_IN); | ||
1401 | do_wakeup = 0; | ||
1402 | } | ||
1403 | 1425 | ||
1404 | opipe->waiting_writers++; | 1426 | ibuf = ipipe->bufs + ((ipipe->curbuf + i) & (PIPE_BUFFERS - 1)); |
1405 | pipe_wait(opipe); | 1427 | nbuf = (opipe->curbuf + opipe->nrbufs) & (PIPE_BUFFERS - 1); |
1406 | opipe->waiting_writers--; | ||
1407 | continue; | ||
1408 | } | ||
1409 | 1428 | ||
1410 | /* | 1429 | /* |
1411 | * No input buffers, do the usual checks for available | 1430 | * Get a reference to this pipe buffer, |
1412 | * writers and blocking and wait if necessary | 1431 | * so we can copy the contents over. |
1413 | */ | 1432 | */ |
1414 | if (!ipipe->writers) | 1433 | ibuf->ops->get(ipipe, ibuf); |
1415 | break; | 1434 | |
1416 | if (!ipipe->waiting_writers) { | 1435 | obuf = opipe->bufs + nbuf; |
1417 | if (ret) | 1436 | *obuf = *ibuf; |
1418 | break; | 1437 | |
1419 | } | ||
1420 | /* | 1438 | /* |
1421 | * pipe_wait() drops the ipipe mutex. To avoid deadlocks | 1439 | * Don't inherit the gift flag, we need to |
1422 | * with another process, we can only safely do that if | 1440 | * prevent multiple steals of this page. |
1423 | * the ipipe lock is ordered last. | ||
1424 | */ | 1441 | */ |
1425 | if ((flags & SPLICE_F_NONBLOCK) || ipipe_first) { | 1442 | obuf->flags &= ~PIPE_BUF_FLAG_GIFT; |
1426 | if (!ret) | ||
1427 | ret = -EAGAIN; | ||
1428 | break; | ||
1429 | } | ||
1430 | if (signal_pending(current)) { | ||
1431 | if (!ret) | ||
1432 | ret = -ERESTARTSYS; | ||
1433 | break; | ||
1434 | } | ||
1435 | 1443 | ||
1436 | if (waitqueue_active(&ipipe->wait)) | 1444 | if (obuf->len > len) |
1437 | wake_up_interruptible_sync(&ipipe->wait); | 1445 | obuf->len = len; |
1438 | kill_fasync(&ipipe->fasync_writers, SIGIO, POLL_OUT); | ||
1439 | 1446 | ||
1440 | pipe_wait(ipipe); | 1447 | opipe->nrbufs++; |
1441 | } | 1448 | ret += obuf->len; |
1449 | len -= obuf->len; | ||
1450 | i++; | ||
1451 | } while (len); | ||
1442 | 1452 | ||
1443 | mutex_unlock(&ipipe->inode->i_mutex); | 1453 | mutex_unlock(&ipipe->inode->i_mutex); |
1444 | mutex_unlock(&opipe->inode->i_mutex); | 1454 | mutex_unlock(&opipe->inode->i_mutex); |
1445 | 1455 | ||
1446 | if (do_wakeup) { | 1456 | /* |
1457 | * If we put data in the output pipe, wakeup any potential readers. | ||
1458 | */ | ||
1459 | if (ret > 0) { | ||
1447 | smp_mb(); | 1460 | smp_mb(); |
1448 | if (waitqueue_active(&opipe->wait)) | 1461 | if (waitqueue_active(&opipe->wait)) |
1449 | wake_up_interruptible(&opipe->wait); | 1462 | wake_up_interruptible(&opipe->wait); |
@@ -1464,14 +1477,29 @@ static long do_tee(struct file *in, struct file *out, size_t len, | |||
1464 | { | 1477 | { |
1465 | struct pipe_inode_info *ipipe = in->f_dentry->d_inode->i_pipe; | 1478 | struct pipe_inode_info *ipipe = in->f_dentry->d_inode->i_pipe; |
1466 | struct pipe_inode_info *opipe = out->f_dentry->d_inode->i_pipe; | 1479 | struct pipe_inode_info *opipe = out->f_dentry->d_inode->i_pipe; |
1480 | int ret = -EINVAL; | ||
1467 | 1481 | ||
1468 | /* | 1482 | /* |
1469 | * Link ipipe to the two output pipes, consuming as we go along. | 1483 | * Duplicate the contents of ipipe to opipe without actually |
1484 | * copying the data. | ||
1470 | */ | 1485 | */ |
1471 | if (ipipe && opipe) | 1486 | if (ipipe && opipe && ipipe != opipe) { |
1472 | return link_pipe(ipipe, opipe, len, flags); | 1487 | /* |
1488 | * Keep going, unless we encounter an error. The ipipe/opipe | ||
1489 | * ordering doesn't really matter. | ||
1490 | */ | ||
1491 | ret = link_ipipe_prep(ipipe, flags); | ||
1492 | if (!ret) { | ||
1493 | ret = link_opipe_prep(opipe, flags); | ||
1494 | if (!ret) { | ||
1495 | ret = link_pipe(ipipe, opipe, len, flags); | ||
1496 | if (!ret && (flags & SPLICE_F_NONBLOCK)) | ||
1497 | ret = -EAGAIN; | ||
1498 | } | ||
1499 | } | ||
1500 | } | ||
1473 | 1501 | ||
1474 | return -EINVAL; | 1502 | return ret; |
1475 | } | 1503 | } |
1476 | 1504 | ||
1477 | asmlinkage long sys_tee(int fdin, int fdout, size_t len, unsigned int flags) | 1505 | asmlinkage long sys_tee(int fdin, int fdout, size_t len, unsigned int flags) |
diff --git a/fs/sysfs/inode.c b/fs/sysfs/inode.c index 5e0e31cc46f5..9889e54e1f13 100644 --- a/fs/sysfs/inode.c +++ b/fs/sysfs/inode.c | |||
@@ -109,6 +109,17 @@ static inline void set_inode_attr(struct inode * inode, struct iattr * iattr) | |||
109 | inode->i_ctime = iattr->ia_ctime; | 109 | inode->i_ctime = iattr->ia_ctime; |
110 | } | 110 | } |
111 | 111 | ||
112 | |||
113 | /* | ||
114 | * sysfs has a different i_mutex lock order behavior for i_mutex than other | ||
115 | * filesystems; sysfs i_mutex is called in many places with subsystem locks | ||
116 | * held. At the same time, many of the VFS locking rules do not apply to | ||
117 | * sysfs at all (cross directory rename for example). To untangle this mess | ||
118 | * (which gives false positives in lockdep), we're giving sysfs inodes their | ||
119 | * own class for i_mutex. | ||
120 | */ | ||
121 | static struct lock_class_key sysfs_inode_imutex_key; | ||
122 | |||
112 | struct inode * sysfs_new_inode(mode_t mode, struct sysfs_dirent * sd) | 123 | struct inode * sysfs_new_inode(mode_t mode, struct sysfs_dirent * sd) |
113 | { | 124 | { |
114 | struct inode * inode = new_inode(sysfs_sb); | 125 | struct inode * inode = new_inode(sysfs_sb); |
@@ -118,6 +129,7 @@ struct inode * sysfs_new_inode(mode_t mode, struct sysfs_dirent * sd) | |||
118 | inode->i_mapping->a_ops = &sysfs_aops; | 129 | inode->i_mapping->a_ops = &sysfs_aops; |
119 | inode->i_mapping->backing_dev_info = &sysfs_backing_dev_info; | 130 | inode->i_mapping->backing_dev_info = &sysfs_backing_dev_info; |
120 | inode->i_op = &sysfs_inode_operations; | 131 | inode->i_op = &sysfs_inode_operations; |
132 | lockdep_set_class(&inode->i_mutex, &sysfs_inode_imutex_key); | ||
121 | 133 | ||
122 | if (sd->s_iattr) { | 134 | if (sd->s_iattr) { |
123 | /* sysfs_dirent has non-default attributes | 135 | /* sysfs_dirent has non-default attributes |
diff --git a/fs/xfs/linux-2.6/xfs_linux.h b/fs/xfs/linux-2.6/xfs_linux.h index 8c021dc57d1f..a13f75c1a936 100644 --- a/fs/xfs/linux-2.6/xfs_linux.h +++ b/fs/xfs/linux-2.6/xfs_linux.h | |||
@@ -215,7 +215,6 @@ BUFFER_FNS(PrivateStart, unwritten); | |||
215 | #define MIN(a,b) (min(a,b)) | 215 | #define MIN(a,b) (min(a,b)) |
216 | #define MAX(a,b) (max(a,b)) | 216 | #define MAX(a,b) (max(a,b)) |
217 | #define howmany(x, y) (((x)+((y)-1))/(y)) | 217 | #define howmany(x, y) (((x)+((y)-1))/(y)) |
218 | #define roundup(x, y) ((((x)+((y)-1))/(y))*(y)) | ||
219 | 218 | ||
220 | /* | 219 | /* |
221 | * Various platform dependent calls that don't fit anywhere else | 220 | * Various platform dependent calls that don't fit anywhere else |