diff options
Diffstat (limited to 'mm/mmap.c')
-rw-r--r-- | mm/mmap.c | 117 |
1 files changed, 60 insertions, 57 deletions
@@ -3,7 +3,7 @@ | |||
3 | * | 3 | * |
4 | * Written by obz. | 4 | * Written by obz. |
5 | * | 5 | * |
6 | * Address space accounting code <alan@redhat.com> | 6 | * Address space accounting code <alan@lxorguk.ukuu.org.uk> |
7 | */ | 7 | */ |
8 | 8 | ||
9 | #include <linux/slab.h> | 9 | #include <linux/slab.h> |
@@ -246,7 +246,7 @@ static struct vm_area_struct *remove_vma(struct vm_area_struct *vma) | |||
246 | return next; | 246 | return next; |
247 | } | 247 | } |
248 | 248 | ||
249 | asmlinkage unsigned long sys_brk(unsigned long brk) | 249 | SYSCALL_DEFINE1(brk, unsigned long, brk) |
250 | { | 250 | { |
251 | unsigned long rlim, retval; | 251 | unsigned long rlim, retval; |
252 | unsigned long newbrk, oldbrk; | 252 | unsigned long newbrk, oldbrk; |
@@ -414,7 +414,7 @@ void __vma_link_rb(struct mm_struct *mm, struct vm_area_struct *vma, | |||
414 | 414 | ||
415 | static void __vma_link_file(struct vm_area_struct *vma) | 415 | static void __vma_link_file(struct vm_area_struct *vma) |
416 | { | 416 | { |
417 | struct file * file; | 417 | struct file *file; |
418 | 418 | ||
419 | file = vma->vm_file; | 419 | file = vma->vm_file; |
420 | if (file) { | 420 | if (file) { |
@@ -475,11 +475,10 @@ static void vma_link(struct mm_struct *mm, struct vm_area_struct *vma, | |||
475 | * insert vm structure into list and rbtree and anon_vma, | 475 | * insert vm structure into list and rbtree and anon_vma, |
476 | * but it has already been inserted into prio_tree earlier. | 476 | * but it has already been inserted into prio_tree earlier. |
477 | */ | 477 | */ |
478 | static void | 478 | static void __insert_vm_struct(struct mm_struct *mm, struct vm_area_struct *vma) |
479 | __insert_vm_struct(struct mm_struct * mm, struct vm_area_struct * vma) | ||
480 | { | 479 | { |
481 | struct vm_area_struct * __vma, * prev; | 480 | struct vm_area_struct *__vma, *prev; |
482 | struct rb_node ** rb_link, * rb_parent; | 481 | struct rb_node **rb_link, *rb_parent; |
483 | 482 | ||
484 | __vma = find_vma_prepare(mm, vma->vm_start,&prev, &rb_link, &rb_parent); | 483 | __vma = find_vma_prepare(mm, vma->vm_start,&prev, &rb_link, &rb_parent); |
485 | BUG_ON(__vma && __vma->vm_start < vma->vm_end); | 484 | BUG_ON(__vma && __vma->vm_start < vma->vm_end); |
@@ -660,6 +659,9 @@ again: remove_next = 1 + (end > next->vm_end); | |||
660 | validate_mm(mm); | 659 | validate_mm(mm); |
661 | } | 660 | } |
662 | 661 | ||
662 | /* Flags that can be inherited from an existing mapping when merging */ | ||
663 | #define VM_MERGEABLE_FLAGS (VM_CAN_NONLINEAR) | ||
664 | |||
663 | /* | 665 | /* |
664 | * If the vma has a ->close operation then the driver probably needs to release | 666 | * If the vma has a ->close operation then the driver probably needs to release |
665 | * per-vma resources, so we don't attempt to merge those. | 667 | * per-vma resources, so we don't attempt to merge those. |
@@ -667,7 +669,7 @@ again: remove_next = 1 + (end > next->vm_end); | |||
667 | static inline int is_mergeable_vma(struct vm_area_struct *vma, | 669 | static inline int is_mergeable_vma(struct vm_area_struct *vma, |
668 | struct file *file, unsigned long vm_flags) | 670 | struct file *file, unsigned long vm_flags) |
669 | { | 671 | { |
670 | if (vma->vm_flags != vm_flags) | 672 | if ((vma->vm_flags ^ vm_flags) & ~VM_MERGEABLE_FLAGS) |
671 | return 0; | 673 | return 0; |
672 | if (vma->vm_file != file) | 674 | if (vma->vm_file != file) |
673 | return 0; | 675 | return 0; |
@@ -909,7 +911,7 @@ void vm_stat_account(struct mm_struct *mm, unsigned long flags, | |||
909 | * The caller must hold down_write(current->mm->mmap_sem). | 911 | * The caller must hold down_write(current->mm->mmap_sem). |
910 | */ | 912 | */ |
911 | 913 | ||
912 | unsigned long do_mmap_pgoff(struct file * file, unsigned long addr, | 914 | unsigned long do_mmap_pgoff(struct file *file, unsigned long addr, |
913 | unsigned long len, unsigned long prot, | 915 | unsigned long len, unsigned long prot, |
914 | unsigned long flags, unsigned long pgoff) | 916 | unsigned long flags, unsigned long pgoff) |
915 | { | 917 | { |
@@ -1092,6 +1094,15 @@ int vma_wants_writenotify(struct vm_area_struct *vma) | |||
1092 | mapping_cap_account_dirty(vma->vm_file->f_mapping); | 1094 | mapping_cap_account_dirty(vma->vm_file->f_mapping); |
1093 | } | 1095 | } |
1094 | 1096 | ||
1097 | /* | ||
1098 | * We account for memory if it's a private writeable mapping, | ||
1099 | * and VM_NORESERVE wasn't set. | ||
1100 | */ | ||
1101 | static inline int accountable_mapping(unsigned int vm_flags) | ||
1102 | { | ||
1103 | return (vm_flags & (VM_NORESERVE | VM_SHARED | VM_WRITE)) == VM_WRITE; | ||
1104 | } | ||
1105 | |||
1095 | unsigned long mmap_region(struct file *file, unsigned long addr, | 1106 | unsigned long mmap_region(struct file *file, unsigned long addr, |
1096 | unsigned long len, unsigned long flags, | 1107 | unsigned long len, unsigned long flags, |
1097 | unsigned int vm_flags, unsigned long pgoff, | 1108 | unsigned int vm_flags, unsigned long pgoff, |
@@ -1119,36 +1130,32 @@ munmap_back: | |||
1119 | if (!may_expand_vm(mm, len >> PAGE_SHIFT)) | 1130 | if (!may_expand_vm(mm, len >> PAGE_SHIFT)) |
1120 | return -ENOMEM; | 1131 | return -ENOMEM; |
1121 | 1132 | ||
1122 | if (flags & MAP_NORESERVE) | 1133 | /* |
1134 | * Set 'VM_NORESERVE' if we should not account for the | ||
1135 | * memory use of this mapping. We only honor MAP_NORESERVE | ||
1136 | * if we're allowed to overcommit memory. | ||
1137 | */ | ||
1138 | if ((flags & MAP_NORESERVE) && sysctl_overcommit_memory != OVERCOMMIT_NEVER) | ||
1139 | vm_flags |= VM_NORESERVE; | ||
1140 | if (!accountable) | ||
1123 | vm_flags |= VM_NORESERVE; | 1141 | vm_flags |= VM_NORESERVE; |
1124 | 1142 | ||
1125 | if (accountable && (!(flags & MAP_NORESERVE) || | 1143 | /* |
1126 | sysctl_overcommit_memory == OVERCOMMIT_NEVER)) { | 1144 | * Private writable mapping: check memory availability |
1127 | if (vm_flags & VM_SHARED) { | 1145 | */ |
1128 | /* Check memory availability in shmem_file_setup? */ | 1146 | if (accountable_mapping(vm_flags)) { |
1129 | vm_flags |= VM_ACCOUNT; | 1147 | charged = len >> PAGE_SHIFT; |
1130 | } else if (vm_flags & VM_WRITE) { | 1148 | if (security_vm_enough_memory(charged)) |
1131 | /* | 1149 | return -ENOMEM; |
1132 | * Private writable mapping: check memory availability | 1150 | vm_flags |= VM_ACCOUNT; |
1133 | */ | ||
1134 | charged = len >> PAGE_SHIFT; | ||
1135 | if (security_vm_enough_memory(charged)) | ||
1136 | return -ENOMEM; | ||
1137 | vm_flags |= VM_ACCOUNT; | ||
1138 | } | ||
1139 | } | 1151 | } |
1140 | 1152 | ||
1141 | /* | 1153 | /* |
1142 | * Can we just expand an old private anonymous mapping? | 1154 | * Can we just expand an old mapping? |
1143 | * The VM_SHARED test is necessary because shmem_zero_setup | ||
1144 | * will create the file object for a shared anonymous map below. | ||
1145 | */ | 1155 | */ |
1146 | if (!file && !(vm_flags & VM_SHARED)) { | 1156 | vma = vma_merge(mm, prev, addr, addr + len, vm_flags, NULL, file, pgoff, NULL); |
1147 | vma = vma_merge(mm, prev, addr, addr + len, vm_flags, | 1157 | if (vma) |
1148 | NULL, NULL, pgoff, NULL); | 1158 | goto out; |
1149 | if (vma) | ||
1150 | goto out; | ||
1151 | } | ||
1152 | 1159 | ||
1153 | /* | 1160 | /* |
1154 | * Determine the object being mapped and call the appropriate | 1161 | * Determine the object being mapped and call the appropriate |
@@ -1191,14 +1198,6 @@ munmap_back: | |||
1191 | goto free_vma; | 1198 | goto free_vma; |
1192 | } | 1199 | } |
1193 | 1200 | ||
1194 | /* We set VM_ACCOUNT in a shared mapping's vm_flags, to inform | ||
1195 | * shmem_zero_setup (perhaps called through /dev/zero's ->mmap) | ||
1196 | * that memory reservation must be checked; but that reservation | ||
1197 | * belongs to shared memory object, not to vma: so now clear it. | ||
1198 | */ | ||
1199 | if ((vm_flags & (VM_SHARED|VM_ACCOUNT)) == (VM_SHARED|VM_ACCOUNT)) | ||
1200 | vma->vm_flags &= ~VM_ACCOUNT; | ||
1201 | |||
1202 | /* Can addr have changed?? | 1201 | /* Can addr have changed?? |
1203 | * | 1202 | * |
1204 | * Answer: Yes, several device drivers can do it in their | 1203 | * Answer: Yes, several device drivers can do it in their |
@@ -1211,17 +1210,8 @@ munmap_back: | |||
1211 | if (vma_wants_writenotify(vma)) | 1210 | if (vma_wants_writenotify(vma)) |
1212 | vma->vm_page_prot = vm_get_page_prot(vm_flags & ~VM_SHARED); | 1211 | vma->vm_page_prot = vm_get_page_prot(vm_flags & ~VM_SHARED); |
1213 | 1212 | ||
1214 | if (file && vma_merge(mm, prev, addr, vma->vm_end, | 1213 | vma_link(mm, vma, prev, rb_link, rb_parent); |
1215 | vma->vm_flags, NULL, file, pgoff, vma_policy(vma))) { | 1214 | file = vma->vm_file; |
1216 | mpol_put(vma_policy(vma)); | ||
1217 | kmem_cache_free(vm_area_cachep, vma); | ||
1218 | fput(file); | ||
1219 | if (vm_flags & VM_EXECUTABLE) | ||
1220 | removed_exe_file_vma(mm); | ||
1221 | } else { | ||
1222 | vma_link(mm, vma, prev, rb_link, rb_parent); | ||
1223 | file = vma->vm_file; | ||
1224 | } | ||
1225 | 1215 | ||
1226 | /* Once vma denies write, undo our temporary denial count */ | 1216 | /* Once vma denies write, undo our temporary denial count */ |
1227 | if (correct_wcount) | 1217 | if (correct_wcount) |
@@ -1468,7 +1458,7 @@ get_unmapped_area(struct file *file, unsigned long addr, unsigned long len, | |||
1468 | EXPORT_SYMBOL(get_unmapped_area); | 1458 | EXPORT_SYMBOL(get_unmapped_area); |
1469 | 1459 | ||
1470 | /* Look up the first VMA which satisfies addr < vm_end, NULL if none. */ | 1460 | /* Look up the first VMA which satisfies addr < vm_end, NULL if none. */ |
1471 | struct vm_area_struct * find_vma(struct mm_struct * mm, unsigned long addr) | 1461 | struct vm_area_struct *find_vma(struct mm_struct *mm, unsigned long addr) |
1472 | { | 1462 | { |
1473 | struct vm_area_struct *vma = NULL; | 1463 | struct vm_area_struct *vma = NULL; |
1474 | 1464 | ||
@@ -1511,7 +1501,7 @@ find_vma_prev(struct mm_struct *mm, unsigned long addr, | |||
1511 | struct vm_area_struct **pprev) | 1501 | struct vm_area_struct **pprev) |
1512 | { | 1502 | { |
1513 | struct vm_area_struct *vma = NULL, *prev = NULL; | 1503 | struct vm_area_struct *vma = NULL, *prev = NULL; |
1514 | struct rb_node * rb_node; | 1504 | struct rb_node *rb_node; |
1515 | if (!mm) | 1505 | if (!mm) |
1516 | goto out; | 1506 | goto out; |
1517 | 1507 | ||
@@ -1545,7 +1535,7 @@ out: | |||
1545 | * update accounting. This is shared with both the | 1535 | * update accounting. This is shared with both the |
1546 | * grow-up and grow-down cases. | 1536 | * grow-up and grow-down cases. |
1547 | */ | 1537 | */ |
1548 | static int acct_stack_growth(struct vm_area_struct * vma, unsigned long size, unsigned long grow) | 1538 | static int acct_stack_growth(struct vm_area_struct *vma, unsigned long size, unsigned long grow) |
1549 | { | 1539 | { |
1550 | struct mm_struct *mm = vma->vm_mm; | 1540 | struct mm_struct *mm = vma->vm_mm; |
1551 | struct rlimit *rlim = current->signal->rlim; | 1541 | struct rlimit *rlim = current->signal->rlim; |
@@ -1953,7 +1943,7 @@ int do_munmap(struct mm_struct *mm, unsigned long start, size_t len) | |||
1953 | 1943 | ||
1954 | EXPORT_SYMBOL(do_munmap); | 1944 | EXPORT_SYMBOL(do_munmap); |
1955 | 1945 | ||
1956 | asmlinkage long sys_munmap(unsigned long addr, size_t len) | 1946 | SYSCALL_DEFINE2(munmap, unsigned long, addr, size_t, len) |
1957 | { | 1947 | { |
1958 | int ret; | 1948 | int ret; |
1959 | struct mm_struct *mm = current->mm; | 1949 | struct mm_struct *mm = current->mm; |
@@ -2095,6 +2085,9 @@ void exit_mmap(struct mm_struct *mm) | |||
2095 | arch_exit_mmap(mm); | 2085 | arch_exit_mmap(mm); |
2096 | mmu_notifier_release(mm); | 2086 | mmu_notifier_release(mm); |
2097 | 2087 | ||
2088 | if (!mm->mmap) /* Can happen if dup_mmap() received an OOM */ | ||
2089 | return; | ||
2090 | |||
2098 | if (mm->locked_vm) { | 2091 | if (mm->locked_vm) { |
2099 | vma = mm->mmap; | 2092 | vma = mm->mmap; |
2100 | while (vma) { | 2093 | while (vma) { |
@@ -2107,7 +2100,7 @@ void exit_mmap(struct mm_struct *mm) | |||
2107 | lru_add_drain(); | 2100 | lru_add_drain(); |
2108 | flush_cache_mm(mm); | 2101 | flush_cache_mm(mm); |
2109 | tlb = tlb_gather_mmu(mm, 1); | 2102 | tlb = tlb_gather_mmu(mm, 1); |
2110 | /* Don't update_hiwater_rss(mm) here, do_exit already did */ | 2103 | /* update_hiwater_rss(mm) here? but nobody should be looking */ |
2111 | /* Use -1 here to ensure all VMAs in the mm are unmapped */ | 2104 | /* Use -1 here to ensure all VMAs in the mm are unmapped */ |
2112 | end = unmap_vmas(&tlb, vma, 0, -1, &nr_accounted, NULL); | 2105 | end = unmap_vmas(&tlb, vma, 0, -1, &nr_accounted, NULL); |
2113 | vm_unacct_memory(nr_accounted); | 2106 | vm_unacct_memory(nr_accounted); |
@@ -2474,3 +2467,13 @@ void mm_drop_all_locks(struct mm_struct *mm) | |||
2474 | 2467 | ||
2475 | mutex_unlock(&mm_all_locks_mutex); | 2468 | mutex_unlock(&mm_all_locks_mutex); |
2476 | } | 2469 | } |
2470 | |||
2471 | /* | ||
2472 | * initialise the VMA slab | ||
2473 | */ | ||
2474 | void __init mmap_init(void) | ||
2475 | { | ||
2476 | vm_area_cachep = kmem_cache_create("vm_area_struct", | ||
2477 | sizeof(struct vm_area_struct), 0, | ||
2478 | SLAB_PANIC, NULL); | ||
2479 | } | ||