aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorKirill A. Shutemov <kirill.shutemov@linux.intel.com>2012-12-12 16:50:59 -0500
committerLinus Torvalds <torvalds@linux-foundation.org>2012-12-12 20:38:31 -0500
commite180377f1ae48b3cbc559c9875d9b038f7f000c6 (patch)
treec51e0db181acc0372479bce5cd68b99abca7d8bb
parentcad7f613c4d010e1d0f05c9a4fb33c7ae40ba115 (diff)
thp: change split_huge_page_pmd() interface
Pass vma instead of mm and add address parameter. In most cases we already have vma on the stack. We provides split_huge_page_pmd_mm() for few cases when we have mm, but not vma. This change is preparation to huge zero pmd splitting implementation. Signed-off-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Andi Kleen <ak@linux.intel.com> Cc: "H. Peter Anvin" <hpa@linux.intel.com> Cc: Mel Gorman <mel@csn.ul.ie> Cc: David Rientjes <rientjes@google.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
-rw-r--r--Documentation/vm/transhuge.txt4
-rw-r--r--arch/x86/kernel/vm86_32.c2
-rw-r--r--fs/proc/task_mmu.c2
-rw-r--r--include/linux/huge_mm.h14
-rw-r--r--mm/huge_memory.c19
-rw-r--r--mm/memory.c4
-rw-r--r--mm/mempolicy.c2
-rw-r--r--mm/mprotect.c2
-rw-r--r--mm/mremap.c2
-rw-r--r--mm/pagewalk.c2
10 files changed, 37 insertions, 16 deletions
diff --git a/Documentation/vm/transhuge.txt b/Documentation/vm/transhuge.txt
index f734bb2a78dc..8f5b41db314c 100644
--- a/Documentation/vm/transhuge.txt
+++ b/Documentation/vm/transhuge.txt
@@ -276,7 +276,7 @@ unaffected. libhugetlbfs will also work fine as usual.
276== Graceful fallback == 276== Graceful fallback ==
277 277
278Code walking pagetables but unware about huge pmds can simply call 278Code walking pagetables but unware about huge pmds can simply call
279split_huge_page_pmd(mm, pmd) where the pmd is the one returned by 279split_huge_page_pmd(vma, addr, pmd) where the pmd is the one returned by
280pmd_offset. It's trivial to make the code transparent hugepage aware 280pmd_offset. It's trivial to make the code transparent hugepage aware
281by just grepping for "pmd_offset" and adding split_huge_page_pmd where 281by just grepping for "pmd_offset" and adding split_huge_page_pmd where
282missing after pmd_offset returns the pmd. Thanks to the graceful 282missing after pmd_offset returns the pmd. Thanks to the graceful
@@ -299,7 +299,7 @@ diff --git a/mm/mremap.c b/mm/mremap.c
299 return NULL; 299 return NULL;
300 300
301 pmd = pmd_offset(pud, addr); 301 pmd = pmd_offset(pud, addr);
302+ split_huge_page_pmd(mm, pmd); 302+ split_huge_page_pmd(vma, addr, pmd);
303 if (pmd_none_or_clear_bad(pmd)) 303 if (pmd_none_or_clear_bad(pmd))
304 return NULL; 304 return NULL;
305 305
diff --git a/arch/x86/kernel/vm86_32.c b/arch/x86/kernel/vm86_32.c
index 5c9687b1bde6..1dfe69cc78a8 100644
--- a/arch/x86/kernel/vm86_32.c
+++ b/arch/x86/kernel/vm86_32.c
@@ -182,7 +182,7 @@ static void mark_screen_rdonly(struct mm_struct *mm)
182 if (pud_none_or_clear_bad(pud)) 182 if (pud_none_or_clear_bad(pud))
183 goto out; 183 goto out;
184 pmd = pmd_offset(pud, 0xA0000); 184 pmd = pmd_offset(pud, 0xA0000);
185 split_huge_page_pmd(mm, pmd); 185 split_huge_page_pmd_mm(mm, 0xA0000, pmd);
186 if (pmd_none_or_clear_bad(pmd)) 186 if (pmd_none_or_clear_bad(pmd))
187 goto out; 187 goto out;
188 pte = pte_offset_map_lock(mm, pmd, 0xA0000, &ptl); 188 pte = pte_offset_map_lock(mm, pmd, 0xA0000, &ptl);
diff --git a/fs/proc/task_mmu.c b/fs/proc/task_mmu.c
index 90c63f9392a5..291a0d15a0be 100644
--- a/fs/proc/task_mmu.c
+++ b/fs/proc/task_mmu.c
@@ -643,7 +643,7 @@ static int clear_refs_pte_range(pmd_t *pmd, unsigned long addr,
643 spinlock_t *ptl; 643 spinlock_t *ptl;
644 struct page *page; 644 struct page *page;
645 645
646 split_huge_page_pmd(walk->mm, pmd); 646 split_huge_page_pmd(vma, addr, pmd);
647 if (pmd_trans_unstable(pmd)) 647 if (pmd_trans_unstable(pmd))
648 return 0; 648 return 0;
649 649
diff --git a/include/linux/huge_mm.h b/include/linux/huge_mm.h
index 1af477552459..3132ea788581 100644
--- a/include/linux/huge_mm.h
+++ b/include/linux/huge_mm.h
@@ -95,12 +95,14 @@ extern int handle_pte_fault(struct mm_struct *mm,
95 struct vm_area_struct *vma, unsigned long address, 95 struct vm_area_struct *vma, unsigned long address,
96 pte_t *pte, pmd_t *pmd, unsigned int flags); 96 pte_t *pte, pmd_t *pmd, unsigned int flags);
97extern int split_huge_page(struct page *page); 97extern int split_huge_page(struct page *page);
98extern void __split_huge_page_pmd(struct mm_struct *mm, pmd_t *pmd); 98extern void __split_huge_page_pmd(struct vm_area_struct *vma,
99#define split_huge_page_pmd(__mm, __pmd) \ 99 unsigned long address, pmd_t *pmd);
100#define split_huge_page_pmd(__vma, __address, __pmd) \
100 do { \ 101 do { \
101 pmd_t *____pmd = (__pmd); \ 102 pmd_t *____pmd = (__pmd); \
102 if (unlikely(pmd_trans_huge(*____pmd))) \ 103 if (unlikely(pmd_trans_huge(*____pmd))) \
103 __split_huge_page_pmd(__mm, ____pmd); \ 104 __split_huge_page_pmd(__vma, __address, \
105 ____pmd); \
104 } while (0) 106 } while (0)
105#define wait_split_huge_page(__anon_vma, __pmd) \ 107#define wait_split_huge_page(__anon_vma, __pmd) \
106 do { \ 108 do { \
@@ -110,6 +112,8 @@ extern void __split_huge_page_pmd(struct mm_struct *mm, pmd_t *pmd);
110 BUG_ON(pmd_trans_splitting(*____pmd) || \ 112 BUG_ON(pmd_trans_splitting(*____pmd) || \
111 pmd_trans_huge(*____pmd)); \ 113 pmd_trans_huge(*____pmd)); \
112 } while (0) 114 } while (0)
115extern void split_huge_page_pmd_mm(struct mm_struct *mm, unsigned long address,
116 pmd_t *pmd);
113#if HPAGE_PMD_ORDER > MAX_ORDER 117#if HPAGE_PMD_ORDER > MAX_ORDER
114#error "hugepages can't be allocated by the buddy allocator" 118#error "hugepages can't be allocated by the buddy allocator"
115#endif 119#endif
@@ -177,10 +181,12 @@ static inline int split_huge_page(struct page *page)
177{ 181{
178 return 0; 182 return 0;
179} 183}
180#define split_huge_page_pmd(__mm, __pmd) \ 184#define split_huge_page_pmd(__vma, __address, __pmd) \
181 do { } while (0) 185 do { } while (0)
182#define wait_split_huge_page(__anon_vma, __pmd) \ 186#define wait_split_huge_page(__anon_vma, __pmd) \
183 do { } while (0) 187 do { } while (0)
188#define split_huge_page_pmd_mm(__mm, __address, __pmd) \
189 do { } while (0)
184#define compound_trans_head(page) compound_head(page) 190#define compound_trans_head(page) compound_head(page)
185static inline int hugepage_madvise(struct vm_area_struct *vma, 191static inline int hugepage_madvise(struct vm_area_struct *vma,
186 unsigned long *vm_flags, int advice) 192 unsigned long *vm_flags, int advice)
diff --git a/mm/huge_memory.c b/mm/huge_memory.c
index 7742fb36eb4d..de6aa5f3fdd2 100644
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -2475,9 +2475,14 @@ static int khugepaged(void *none)
2475 return 0; 2475 return 0;
2476} 2476}
2477 2477
2478void __split_huge_page_pmd(struct mm_struct *mm, pmd_t *pmd) 2478void __split_huge_page_pmd(struct vm_area_struct *vma, unsigned long address,
2479 pmd_t *pmd)
2479{ 2480{
2480 struct page *page; 2481 struct page *page;
2482 unsigned long haddr = address & HPAGE_PMD_MASK;
2483 struct mm_struct *mm = vma->vm_mm;
2484
2485 BUG_ON(vma->vm_start > haddr || vma->vm_end < haddr + HPAGE_PMD_SIZE);
2481 2486
2482 spin_lock(&mm->page_table_lock); 2487 spin_lock(&mm->page_table_lock);
2483 if (unlikely(!pmd_trans_huge(*pmd))) { 2488 if (unlikely(!pmd_trans_huge(*pmd))) {
@@ -2495,6 +2500,16 @@ void __split_huge_page_pmd(struct mm_struct *mm, pmd_t *pmd)
2495 BUG_ON(pmd_trans_huge(*pmd)); 2500 BUG_ON(pmd_trans_huge(*pmd));
2496} 2501}
2497 2502
2503void split_huge_page_pmd_mm(struct mm_struct *mm, unsigned long address,
2504 pmd_t *pmd)
2505{
2506 struct vm_area_struct *vma;
2507
2508 vma = find_vma(mm, address);
2509 BUG_ON(vma == NULL);
2510 split_huge_page_pmd(vma, address, pmd);
2511}
2512
2498static void split_huge_page_address(struct mm_struct *mm, 2513static void split_huge_page_address(struct mm_struct *mm,
2499 unsigned long address) 2514 unsigned long address)
2500{ 2515{
@@ -2509,7 +2524,7 @@ static void split_huge_page_address(struct mm_struct *mm,
2509 * Caller holds the mmap_sem write mode, so a huge pmd cannot 2524 * Caller holds the mmap_sem write mode, so a huge pmd cannot
2510 * materialize from under us. 2525 * materialize from under us.
2511 */ 2526 */
2512 split_huge_page_pmd(mm, pmd); 2527 split_huge_page_pmd_mm(mm, address, pmd);
2513} 2528}
2514 2529
2515void __vma_adjust_trans_huge(struct vm_area_struct *vma, 2530void __vma_adjust_trans_huge(struct vm_area_struct *vma,
diff --git a/mm/memory.c b/mm/memory.c
index 259b34fe1347..f9a4b0cb8623 100644
--- a/mm/memory.c
+++ b/mm/memory.c
@@ -1243,7 +1243,7 @@ static inline unsigned long zap_pmd_range(struct mmu_gather *tlb,
1243 BUG(); 1243 BUG();
1244 } 1244 }
1245#endif 1245#endif
1246 split_huge_page_pmd(vma->vm_mm, pmd); 1246 split_huge_page_pmd(vma, addr, pmd);
1247 } else if (zap_huge_pmd(tlb, vma, pmd, addr)) 1247 } else if (zap_huge_pmd(tlb, vma, pmd, addr))
1248 goto next; 1248 goto next;
1249 /* fall through */ 1249 /* fall through */
@@ -1512,7 +1512,7 @@ struct page *follow_page(struct vm_area_struct *vma, unsigned long address,
1512 } 1512 }
1513 if (pmd_trans_huge(*pmd)) { 1513 if (pmd_trans_huge(*pmd)) {
1514 if (flags & FOLL_SPLIT) { 1514 if (flags & FOLL_SPLIT) {
1515 split_huge_page_pmd(mm, pmd); 1515 split_huge_page_pmd(vma, address, pmd);
1516 goto split_fallthrough; 1516 goto split_fallthrough;
1517 } 1517 }
1518 spin_lock(&mm->page_table_lock); 1518 spin_lock(&mm->page_table_lock);
diff --git a/mm/mempolicy.c b/mm/mempolicy.c
index 05b28361a39b..0719e8dd4945 100644
--- a/mm/mempolicy.c
+++ b/mm/mempolicy.c
@@ -511,7 +511,7 @@ static inline int check_pmd_range(struct vm_area_struct *vma, pud_t *pud,
511 pmd = pmd_offset(pud, addr); 511 pmd = pmd_offset(pud, addr);
512 do { 512 do {
513 next = pmd_addr_end(addr, end); 513 next = pmd_addr_end(addr, end);
514 split_huge_page_pmd(vma->vm_mm, pmd); 514 split_huge_page_pmd(vma, addr, pmd);
515 if (pmd_none_or_trans_huge_or_clear_bad(pmd)) 515 if (pmd_none_or_trans_huge_or_clear_bad(pmd))
516 continue; 516 continue;
517 if (check_pte_range(vma, pmd, addr, next, nodes, 517 if (check_pte_range(vma, pmd, addr, next, nodes,
diff --git a/mm/mprotect.c b/mm/mprotect.c
index a40992610ab6..e8c3938db6fa 100644
--- a/mm/mprotect.c
+++ b/mm/mprotect.c
@@ -90,7 +90,7 @@ static inline void change_pmd_range(struct vm_area_struct *vma, pud_t *pud,
90 next = pmd_addr_end(addr, end); 90 next = pmd_addr_end(addr, end);
91 if (pmd_trans_huge(*pmd)) { 91 if (pmd_trans_huge(*pmd)) {
92 if (next - addr != HPAGE_PMD_SIZE) 92 if (next - addr != HPAGE_PMD_SIZE)
93 split_huge_page_pmd(vma->vm_mm, pmd); 93 split_huge_page_pmd(vma, addr, pmd);
94 else if (change_huge_pmd(vma, pmd, addr, newprot)) 94 else if (change_huge_pmd(vma, pmd, addr, newprot))
95 continue; 95 continue;
96 /* fall through */ 96 /* fall through */
diff --git a/mm/mremap.c b/mm/mremap.c
index 1b61c2d3307a..eabb24da6c9e 100644
--- a/mm/mremap.c
+++ b/mm/mremap.c
@@ -182,7 +182,7 @@ unsigned long move_page_tables(struct vm_area_struct *vma,
182 need_flush = true; 182 need_flush = true;
183 continue; 183 continue;
184 } else if (!err) { 184 } else if (!err) {
185 split_huge_page_pmd(vma->vm_mm, old_pmd); 185 split_huge_page_pmd(vma, old_addr, old_pmd);
186 } 186 }
187 VM_BUG_ON(pmd_trans_huge(*old_pmd)); 187 VM_BUG_ON(pmd_trans_huge(*old_pmd));
188 } 188 }
diff --git a/mm/pagewalk.c b/mm/pagewalk.c
index 6c118d012bb5..35aa294656cd 100644
--- a/mm/pagewalk.c
+++ b/mm/pagewalk.c
@@ -58,7 +58,7 @@ again:
58 if (!walk->pte_entry) 58 if (!walk->pte_entry)
59 continue; 59 continue;
60 60
61 split_huge_page_pmd(walk->mm, pmd); 61 split_huge_page_pmd_mm(walk->mm, addr, pmd);
62 if (pmd_none_or_trans_huge_or_clear_bad(pmd)) 62 if (pmd_none_or_trans_huge_or_clear_bad(pmd))
63 goto again; 63 goto again;
64 err = walk_pte_range(pmd, addr, next, walk); 64 err = walk_pte_range(pmd, addr, next, walk);