diff options
author | Michel Lespinasse <walken@google.com> | 2013-02-22 19:32:46 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2013-02-23 20:50:11 -0500 |
commit | 1869305009857cdeaabe6283bcdc2359c5784543 (patch) | |
tree | a8a500c71e7aa3a645322635f3d591c16601af27 /mm | |
parent | cea10a19b7972a1954c4a2d05a7de8db48b444fb (diff) |
mm: introduce VM_POPULATE flag to better deal with racy userspace programs
The vm_populate() code populates user mappings without constantly
holding the mmap_sem. This makes it susceptible to racy userspace
programs: the user mappings may change while vm_populate() is running,
and in this case vm_populate() may end up populating the new mapping
instead of the old one.
In order to reduce the possibility of userspace getting surprised by
this behavior, this change introduces the VM_POPULATE vma flag which
gets set on vmas we want vm_populate() to work on. This way
vm_populate() may still end up populating the new mapping after such a
race, but only if the new mapping is also one that the user has
requested (using MAP_SHARED, MAP_LOCKED or mlock) to be populated.
Signed-off-by: Michel Lespinasse <walken@google.com>
Acked-by: Rik van Riel <riel@redhat.com>
Tested-by: Andy Lutomirski <luto@amacapital.net>
Cc: Greg Ungerer <gregungerer@westnet.com.au>
Cc: David Howells <dhowells@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm')
-rw-r--r-- | mm/fremap.c | 12 | ||||
-rw-r--r-- | mm/mlock.c | 19 | ||||
-rw-r--r-- | mm/mmap.c | 4 |
3 files changed, 21 insertions, 14 deletions
diff --git a/mm/fremap.c b/mm/fremap.c index 503a72387087..0cd4c11488ed 100644 --- a/mm/fremap.c +++ b/mm/fremap.c | |||
@@ -204,8 +204,10 @@ get_write_lock: | |||
204 | unsigned long addr; | 204 | unsigned long addr; |
205 | struct file *file = get_file(vma->vm_file); | 205 | struct file *file = get_file(vma->vm_file); |
206 | 206 | ||
207 | addr = mmap_region(file, start, size, | 207 | vm_flags = vma->vm_flags; |
208 | vma->vm_flags, pgoff); | 208 | if (!(flags & MAP_NONBLOCK)) |
209 | vm_flags |= VM_POPULATE; | ||
210 | addr = mmap_region(file, start, size, vm_flags, pgoff); | ||
209 | fput(file); | 211 | fput(file); |
210 | if (IS_ERR_VALUE(addr)) { | 212 | if (IS_ERR_VALUE(addr)) { |
211 | err = addr; | 213 | err = addr; |
@@ -224,6 +226,12 @@ get_write_lock: | |||
224 | mutex_unlock(&mapping->i_mmap_mutex); | 226 | mutex_unlock(&mapping->i_mmap_mutex); |
225 | } | 227 | } |
226 | 228 | ||
229 | if (!(flags & MAP_NONBLOCK) && !(vma->vm_flags & VM_POPULATE)) { | ||
230 | if (!has_write_lock) | ||
231 | goto get_write_lock; | ||
232 | vma->vm_flags |= VM_POPULATE; | ||
233 | } | ||
234 | |||
227 | if (vma->vm_flags & VM_LOCKED) { | 235 | if (vma->vm_flags & VM_LOCKED) { |
228 | /* | 236 | /* |
229 | * drop PG_Mlocked flag for over-mapped range | 237 | * drop PG_Mlocked flag for over-mapped range |
diff --git a/mm/mlock.c b/mm/mlock.c index 569400a5d079..d6378feb2950 100644 --- a/mm/mlock.c +++ b/mm/mlock.c | |||
@@ -340,9 +340,9 @@ static int do_mlock(unsigned long start, size_t len, int on) | |||
340 | 340 | ||
341 | /* Here we know that vma->vm_start <= nstart < vma->vm_end. */ | 341 | /* Here we know that vma->vm_start <= nstart < vma->vm_end. */ |
342 | 342 | ||
343 | newflags = vma->vm_flags | VM_LOCKED; | 343 | newflags = vma->vm_flags & ~VM_LOCKED; |
344 | if (!on) | 344 | if (on) |
345 | newflags &= ~VM_LOCKED; | 345 | newflags |= VM_LOCKED | VM_POPULATE; |
346 | 346 | ||
347 | tmp = vma->vm_end; | 347 | tmp = vma->vm_end; |
348 | if (tmp > end) | 348 | if (tmp > end) |
@@ -402,7 +402,8 @@ int __mm_populate(unsigned long start, unsigned long len, int ignore_errors) | |||
402 | * range with the first VMA. Also, skip undesirable VMA types. | 402 | * range with the first VMA. Also, skip undesirable VMA types. |
403 | */ | 403 | */ |
404 | nend = min(end, vma->vm_end); | 404 | nend = min(end, vma->vm_end); |
405 | if (vma->vm_flags & (VM_IO | VM_PFNMAP)) | 405 | if ((vma->vm_flags & (VM_IO | VM_PFNMAP | VM_POPULATE)) != |
406 | VM_POPULATE) | ||
406 | continue; | 407 | continue; |
407 | if (nstart < vma->vm_start) | 408 | if (nstart < vma->vm_start) |
408 | nstart = vma->vm_start; | 409 | nstart = vma->vm_start; |
@@ -475,18 +476,18 @@ static int do_mlockall(int flags) | |||
475 | struct vm_area_struct * vma, * prev = NULL; | 476 | struct vm_area_struct * vma, * prev = NULL; |
476 | 477 | ||
477 | if (flags & MCL_FUTURE) | 478 | if (flags & MCL_FUTURE) |
478 | current->mm->def_flags |= VM_LOCKED; | 479 | current->mm->def_flags |= VM_LOCKED | VM_POPULATE; |
479 | else | 480 | else |
480 | current->mm->def_flags &= ~VM_LOCKED; | 481 | current->mm->def_flags &= ~(VM_LOCKED | VM_POPULATE); |
481 | if (flags == MCL_FUTURE) | 482 | if (flags == MCL_FUTURE) |
482 | goto out; | 483 | goto out; |
483 | 484 | ||
484 | for (vma = current->mm->mmap; vma ; vma = prev->vm_next) { | 485 | for (vma = current->mm->mmap; vma ; vma = prev->vm_next) { |
485 | vm_flags_t newflags; | 486 | vm_flags_t newflags; |
486 | 487 | ||
487 | newflags = vma->vm_flags | VM_LOCKED; | 488 | newflags = vma->vm_flags & ~VM_LOCKED; |
488 | if (!(flags & MCL_CURRENT)) | 489 | if (flags & MCL_CURRENT) |
489 | newflags &= ~VM_LOCKED; | 490 | newflags |= VM_LOCKED | VM_POPULATE; |
490 | 491 | ||
491 | /* Ignore errors */ | 492 | /* Ignore errors */ |
492 | mlock_fixup(vma, &prev, vma->vm_start, vma->vm_end, newflags); | 493 | mlock_fixup(vma, &prev, vma->vm_start, vma->vm_end, newflags); |
@@ -1306,9 +1306,7 @@ unsigned long do_mmap_pgoff(struct file *file, unsigned long addr, | |||
1306 | } | 1306 | } |
1307 | 1307 | ||
1308 | addr = mmap_region(file, addr, len, vm_flags, pgoff); | 1308 | addr = mmap_region(file, addr, len, vm_flags, pgoff); |
1309 | if (!IS_ERR_VALUE(addr) && | 1309 | if (!IS_ERR_VALUE(addr) && (vm_flags & VM_POPULATE)) |
1310 | ((vm_flags & VM_LOCKED) || | ||
1311 | (flags & (MAP_POPULATE | MAP_NONBLOCK)) == MAP_POPULATE)) | ||
1312 | *populate = true; | 1310 | *populate = true; |
1313 | return addr; | 1311 | return addr; |
1314 | } | 1312 | } |