aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Konstantin Khlebnikov <khlebnikov@openvz.org> 2012-10-08 19:28:40 -0400
committer Linus Torvalds <torvalds@linux-foundation.org> 2012-10-09 03:22:17 -0400
commit 4b6e1e37026ec7dae9b23d78ffcebdd5ddb1bfa1 (patch)
tree 10200483a705005f41f543ed433581409cf2bf5f
parent cc2383ec06be093789469852e1fe96e1148e9a2c (diff)
mm: kill vma flag VM_INSERTPAGE
Merge VM_INSERTPAGE into VM_MIXEDMAP. A VM_MIXEDMAP VMA can mix pure-pfn ptes, special ptes and normal ptes. Now copy_page_range() always copies a VM_MIXEDMAP VMA on fork, like VM_PFNMAP. If a driver populates the whole VMA at mmap() time, it probably does not expect page faults. This patch removes the special check from vma_wants_writenotify() which disables page write tracking for VMAs populated via vm_insert_page(). The BDI below the mapped file should not use dirty accounting; moreover, do_wp_page() can handle this. vm_insert_page() still marks the vma on first use. Usually it is called from the f_op->mmap() handler under the mm->mmap_sem write-lock, so it is able to change vma->vm_flags. The caller must set VM_MIXEDMAP at mmap time if it wants to call this function from other places, for example from a page-fault handler. Signed-off-by: Konstantin Khlebnikov <khlebnikov@openvz.org> Cc: Alexander Viro <viro@zeniv.linux.org.uk> Cc: Carsten Otte <cotte@de.ibm.com> Cc: Chris Metcalf <cmetcalf@tilera.com> Cc: Cyrill Gorcunov <gorcunov@openvz.org> Cc: Eric Paris <eparis@redhat.com> Cc: H. Peter Anvin <hpa@zytor.com> Cc: Hugh Dickins <hughd@google.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: James Morris <james.l.morris@oracle.com> Cc: Jason Baron <jbaron@redhat.com> Cc: Kentaro Takeda <takedakn@nttdata.co.jp> Cc: Matt Helsley <matthltc@us.ibm.com> Cc: Nick Piggin <npiggin@kernel.dk> Cc: Oleg Nesterov <oleg@redhat.com> Cc: Peter Zijlstra <a.p.zijlstra@chello.nl> Cc: Robert Richter <robert.richter@amd.com> Cc: Suresh Siddha <suresh.b.siddha@intel.com> Cc: Tetsuo Handa <penguin-kernel@I-love.SAKURA.ne.jp> Cc: Venkatesh Pallipadi <venki@google.com> Acked-by: Linus Torvalds <torvalds@linux-foundation.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
-rw-r--r-- include/linux/mm.h 1
-rw-r--r-- mm/huge_memory.c 3
-rw-r--r-- mm/ksm.c 2
-rw-r--r-- mm/memory.c 14
-rw-r--r-- mm/mmap.c 2
5 files changed, 15 insertions, 7 deletions
diff --git a/include/linux/mm.h b/include/linux/mm.h
index 9c039f84b63c..fb0685b17914 100644
--- a/include/linux/mm.h
+++ b/include/linux/mm.h
@@ -103,7 +103,6 @@ extern unsigned int kobjsize(const void *objp);
103#define VM_HUGETLB 0x00400000 /* Huge TLB Page VM */ 103#define VM_HUGETLB 0x00400000 /* Huge TLB Page VM */
104#define VM_NONLINEAR 0x00800000 /* Is non-linear (remap_file_pages) */ 104#define VM_NONLINEAR 0x00800000 /* Is non-linear (remap_file_pages) */
105#define VM_ARCH_1 0x01000000 /* Architecture-specific flag */ 105#define VM_ARCH_1 0x01000000 /* Architecture-specific flag */
106#define VM_INSERTPAGE 0x02000000 /* The vma has had "vm_insert_page()" done on it */
107#define VM_NODUMP 0x04000000 /* Do not include in the core dump */ 106#define VM_NODUMP 0x04000000 /* Do not include in the core dump */
108 107
109#define VM_CAN_NONLINEAR 0x08000000 /* Has ->fault & does nonlinear pages */ 108#define VM_CAN_NONLINEAR 0x08000000 /* Has ->fault & does nonlinear pages */
diff --git a/mm/huge_memory.c b/mm/huge_memory.c
index 47206692cf88..9b72d1270519 100644
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -1491,8 +1491,7 @@ out:
1491 return ret; 1491 return ret;
1492} 1492}
1493 1493
1494#define VM_NO_THP (VM_SPECIAL|VM_INSERTPAGE|VM_MIXEDMAP| \ 1494#define VM_NO_THP (VM_SPECIAL|VM_MIXEDMAP|VM_HUGETLB|VM_SHARED|VM_MAYSHARE)
1495 VM_HUGETLB|VM_SHARED|VM_MAYSHARE)
1496 1495
1497int hugepage_madvise(struct vm_area_struct *vma, 1496int hugepage_madvise(struct vm_area_struct *vma,
1498 unsigned long *vm_flags, int advice) 1497 unsigned long *vm_flags, int advice)
diff --git a/mm/ksm.c b/mm/ksm.c
index d1cbe2aa6b3a..f9ccb16559ee 100644
--- a/mm/ksm.c
+++ b/mm/ksm.c
@@ -1469,7 +1469,7 @@ int ksm_madvise(struct vm_area_struct *vma, unsigned long start,
1469 */ 1469 */
1470 if (*vm_flags & (VM_MERGEABLE | VM_SHARED | VM_MAYSHARE | 1470 if (*vm_flags & (VM_MERGEABLE | VM_SHARED | VM_MAYSHARE |
1471 VM_PFNMAP | VM_IO | VM_DONTEXPAND | 1471 VM_PFNMAP | VM_IO | VM_DONTEXPAND |
1472 VM_RESERVED | VM_HUGETLB | VM_INSERTPAGE | 1472 VM_RESERVED | VM_HUGETLB |
1473 VM_NONLINEAR | VM_MIXEDMAP)) 1473 VM_NONLINEAR | VM_MIXEDMAP))
1474 return 0; /* just ignore the advice */ 1474 return 0; /* just ignore the advice */
1475 1475
diff --git a/mm/memory.c b/mm/memory.c
index 655e1429388a..7b1e4feaec06 100644
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -1047,7 +1047,8 @@ int copy_page_range(struct mm_struct *dst_mm, struct mm_struct *src_mm,
1047 * readonly mappings. The tradeoff is that copy_page_range is more 1047 * readonly mappings. The tradeoff is that copy_page_range is more
1048 * efficient than faulting. 1048 * efficient than faulting.
1049 */ 1049 */
1050 if (!(vma->vm_flags & (VM_HUGETLB|VM_NONLINEAR|VM_PFNMAP|VM_INSERTPAGE))) { 1050 if (!(vma->vm_flags & (VM_HUGETLB | VM_NONLINEAR |
1051 VM_PFNMAP | VM_MIXEDMAP))) {
1051 if (!vma->anon_vma) 1052 if (!vma->anon_vma)
1052 return 0; 1053 return 0;
1053 } 1054 }
@@ -2085,6 +2086,11 @@ out:
2085 * ask for a shared writable mapping! 2086 * ask for a shared writable mapping!
2086 * 2087 *
2087 * The page does not need to be reserved. 2088 * The page does not need to be reserved.
2089 *
2090 * Usually this function is called from f_op->mmap() handler
2091 * under mm->mmap_sem write-lock, so it can change vma->vm_flags.
2092 * Caller must set VM_MIXEDMAP on vma if it wants to call this
2093 * function from other places, for example from page-fault handler.
2088 */ 2094 */
2089int vm_insert_page(struct vm_area_struct *vma, unsigned long addr, 2095int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
2090 struct page *page) 2096 struct page *page)
@@ -2093,7 +2099,11 @@ int vm_insert_page(struct vm_area_struct *vma, unsigned long addr,
2093 return -EFAULT; 2099 return -EFAULT;
2094 if (!page_count(page)) 2100 if (!page_count(page))
2095 return -EINVAL; 2101 return -EINVAL;
2096 vma->vm_flags |= VM_INSERTPAGE; 2102 if (!(vma->vm_flags & VM_MIXEDMAP)) {
2103 BUG_ON(down_read_trylock(&vma->vm_mm->mmap_sem));
2104 BUG_ON(vma->vm_flags & VM_PFNMAP);
2105 vma->vm_flags |= VM_MIXEDMAP;
2106 }
2097 return insert_page(vma, addr, page, vma->vm_page_prot); 2107 return insert_page(vma, addr, page, vma->vm_page_prot);
2098} 2108}
2099EXPORT_SYMBOL(vm_insert_page); 2109EXPORT_SYMBOL(vm_insert_page);
diff --git a/mm/mmap.c b/mm/mmap.c
index 872441e81914..b0989f4d4f09 100644
--- a/mm/mmap.c
+++ b/mm/mmap.c
@@ -1190,7 +1190,7 @@ int vma_wants_writenotify(struct vm_area_struct *vma)
1190 return 0; 1190 return 0;
1191 1191
1192 /* Specialty mapping? */ 1192 /* Specialty mapping? */
1193 if (vm_flags & (VM_PFNMAP|VM_INSERTPAGE)) 1193 if (vm_flags & VM_PFNMAP)
1194 return 0; 1194 return 0;
1195 1195
1196 /* Can the mapping track the dirty pages? */ 1196 /* Can the mapping track the dirty pages? */