aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> 2014-01-13 01:04:24 -0500
committer Benjamin Herrenschmidt <benh@kernel.crashing.org> 2014-01-14 23:46:38 -0500
commit b3084f4db3aeb991c507ca774337c7e7893ed04f (patch)
tree c5cad3a6843272a173e95a87a6087d362e19073e
parent a6da83f98267bc8ee4e34aa899169991eb0ceb93 (diff)
powerpc/thp: Fix crash on mremap
This patch fixes the crash below:

NIP [c00000000004cee4] .__hash_page_thp+0x2a4/0x440
LR [c0000000000439ac] .hash_page+0x18c/0x5e0
...
Call Trace:
[c000000736103c40] [00001ffffb000000] 0x1ffffb000000(unreliable)
[437908.479693] [c000000736103d50] [c0000000000439ac] .hash_page+0x18c/0x5e0
[437908.479699] [c000000736103e30] [c00000000000924c] .do_hash_page+0x4c/0x58

On ppc64 we use the pgtable for storing the hpte slot information and store the address of the pgtable at a constant offset (PTRS_PER_PMD) from the pmd. On mremap, when we switch the pmd, we need to withdraw and deposit the pgtable again, so that we find the pgtable at the PTRS_PER_PMD offset from the new pmd.

We also want to move the withdraw and deposit before the set_pmd so that, when a page fault finds the pmd as trans huge, we can be sure that the pgtable can be located at that offset.

Signed-off-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
Acked-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
-rw-r--r-- arch/powerpc/include/asm/pgtable-ppc64.h 14
-rw-r--r-- include/asm-generic/pgtable.h 12
-rw-r--r-- mm/huge_memory.c 14
3 files changed, 31 insertions, 9 deletions
diff --git a/arch/powerpc/include/asm/pgtable-ppc64.h b/arch/powerpc/include/asm/pgtable-ppc64.h
index 4a191c472867..d27960c89a71 100644
--- a/arch/powerpc/include/asm/pgtable-ppc64.h
+++ b/arch/powerpc/include/asm/pgtable-ppc64.h
@@ -558,5 +558,19 @@ extern pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp);
558#define __HAVE_ARCH_PMDP_INVALIDATE 558#define __HAVE_ARCH_PMDP_INVALIDATE
559extern void pmdp_invalidate(struct vm_area_struct *vma, unsigned long address, 559extern void pmdp_invalidate(struct vm_area_struct *vma, unsigned long address,
560 pmd_t *pmdp); 560 pmd_t *pmdp);
561
562#define pmd_move_must_withdraw pmd_move_must_withdraw
563typedef struct spinlock spinlock_t;
564static inline int pmd_move_must_withdraw(spinlock_t *new_pmd_ptl,
565 spinlock_t *old_pmd_ptl)
566{
567 /*
568 * Archs like ppc64 use pgtable to store per pmd
569 * specific information. So when we switch the pmd,
570 * we should also withdraw and deposit the pgtable
571 */
572 return true;
573}
574
561#endif /* __ASSEMBLY__ */ 575#endif /* __ASSEMBLY__ */
562#endif /* _ASM_POWERPC_PGTABLE_PPC64_H_ */ 576#endif /* _ASM_POWERPC_PGTABLE_PPC64_H_ */
diff --git a/include/asm-generic/pgtable.h b/include/asm-generic/pgtable.h
index db0923458940..8e4f41d9af4d 100644
--- a/include/asm-generic/pgtable.h
+++ b/include/asm-generic/pgtable.h
@@ -558,6 +558,18 @@ static inline pmd_t pmd_read_atomic(pmd_t *pmdp)
558} 558}
559#endif 559#endif
560 560
561#ifndef pmd_move_must_withdraw
562static inline int pmd_move_must_withdraw(spinlock_t *new_pmd_ptl,
563 spinlock_t *old_pmd_ptl)
564{
565 /*
566 * With split pmd lock we also need to move preallocated
567 * PTE page table if new_pmd is on different PMD page table.
568 */
569 return new_pmd_ptl != old_pmd_ptl;
570}
571#endif
572
561/* 573/*
562 * This function is meant to be used by sites walking pagetables with 574 * This function is meant to be used by sites walking pagetables with
563 * the mmap_sem hold in read mode to protect against MADV_DONTNEED and 575 * the mmap_sem hold in read mode to protect against MADV_DONTNEED and
diff --git a/mm/huge_memory.c b/mm/huge_memory.c
index 95d1acb0f3d2..5d80c53b87cb 100644
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -1502,19 +1502,15 @@ int move_huge_pmd(struct vm_area_struct *vma, struct vm_area_struct *new_vma,
1502 spin_lock_nested(new_ptl, SINGLE_DEPTH_NESTING); 1502 spin_lock_nested(new_ptl, SINGLE_DEPTH_NESTING);
1503 pmd = pmdp_get_and_clear(mm, old_addr, old_pmd); 1503 pmd = pmdp_get_and_clear(mm, old_addr, old_pmd);
1504 VM_BUG_ON(!pmd_none(*new_pmd)); 1504 VM_BUG_ON(!pmd_none(*new_pmd));
1505 set_pmd_at(mm, new_addr, new_pmd, pmd_mksoft_dirty(pmd));
1506 if (new_ptl != old_ptl) {
1507 pgtable_t pgtable;
1508 1505
1509 /* 1506 if (pmd_move_must_withdraw(new_ptl, old_ptl)) {
1510 * Move preallocated PTE page table if new_pmd is on 1507 pgtable_t pgtable;
1511 * different PMD page table.
1512 */
1513 pgtable = pgtable_trans_huge_withdraw(mm, old_pmd); 1508 pgtable = pgtable_trans_huge_withdraw(mm, old_pmd);
1514 pgtable_trans_huge_deposit(mm, new_pmd, pgtable); 1509 pgtable_trans_huge_deposit(mm, new_pmd, pgtable);
1515
1516 spin_unlock(new_ptl);
1517 } 1510 }
1511 set_pmd_at(mm, new_addr, new_pmd, pmd_mksoft_dirty(pmd));
1512 if (new_ptl != old_ptl)
1513 spin_unlock(new_ptl);
1518 spin_unlock(old_ptl); 1514 spin_unlock(old_ptl);
1519 } 1515 }
1520out: 1516out: