diff options
author | Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com> | 2014-01-13 01:04:24 -0500 |
---|---|---|
committer | Benjamin Herrenschmidt <benh@kernel.crashing.org> | 2014-01-14 23:46:38 -0500 |
commit | b3084f4db3aeb991c507ca774337c7e7893ed04f (patch) | |
tree | c5cad3a6843272a173e95a87a6087d362e19073e | |
parent | a6da83f98267bc8ee4e34aa899169991eb0ceb93 (diff) |
powerpc/thp: Fix crash on mremap
This patch fixes the crash below:
NIP [c00000000004cee4] .__hash_page_thp+0x2a4/0x440
LR [c0000000000439ac] .hash_page+0x18c/0x5e0
...
Call Trace:
[c000000736103c40] [00001ffffb000000] 0x1ffffb000000(unreliable)
[437908.479693] [c000000736103d50] [c0000000000439ac] .hash_page+0x18c/0x5e0
[437908.479699] [c000000736103e30] [c00000000000924c] .do_hash_page+0x4c/0x58
On ppc64 we use the pgtable for storing the hpte slot information and
store the address of the pgtable at a constant offset (PTRS_PER_PMD) from
the pmd. On mremap, when we switch the pmd, we need to withdraw and deposit
the pgtable again, so that we find the pgtable at the PTRS_PER_PMD offset
from the new pmd.
We also want to move the withdraw and deposit before the set_pmd_at() so
that, when a page fault finds the pmd as trans huge, we can be sure that
the pgtable can be located at the offset.
Signed-off-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
Acked-by: Kirill A. Shutemov <kirill.shutemov@linux.intel.com>
Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
-rw-r--r-- | arch/powerpc/include/asm/pgtable-ppc64.h | 14 | ||||
-rw-r--r-- | include/asm-generic/pgtable.h | 12 | ||||
-rw-r--r-- | mm/huge_memory.c | 14 |
3 files changed, 31 insertions, 9 deletions
diff --git a/arch/powerpc/include/asm/pgtable-ppc64.h b/arch/powerpc/include/asm/pgtable-ppc64.h index 4a191c472867..d27960c89a71 100644 --- a/arch/powerpc/include/asm/pgtable-ppc64.h +++ b/arch/powerpc/include/asm/pgtable-ppc64.h | |||
@@ -558,5 +558,19 @@ extern pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp); | |||
558 | #define __HAVE_ARCH_PMDP_INVALIDATE | 558 | #define __HAVE_ARCH_PMDP_INVALIDATE |
559 | extern void pmdp_invalidate(struct vm_area_struct *vma, unsigned long address, | 559 | extern void pmdp_invalidate(struct vm_area_struct *vma, unsigned long address, |
560 | pmd_t *pmdp); | 560 | pmd_t *pmdp); |
561 | |||
562 | #define pmd_move_must_withdraw pmd_move_must_withdraw | ||
563 | typedef struct spinlock spinlock_t; | ||
564 | static inline int pmd_move_must_withdraw(spinlock_t *new_pmd_ptl, | ||
565 | spinlock_t *old_pmd_ptl) | ||
566 | { | ||
567 | /* | ||
568 | * Archs like ppc64 use pgtable to store per pmd | ||
569 | * specific information. So when we switch the pmd, | ||
570 | * we should also withdraw and deposit the pgtable | ||
571 | */ | ||
572 | return true; | ||
573 | } | ||
574 | |||
561 | #endif /* __ASSEMBLY__ */ | 575 | #endif /* __ASSEMBLY__ */ |
562 | #endif /* _ASM_POWERPC_PGTABLE_PPC64_H_ */ | 576 | #endif /* _ASM_POWERPC_PGTABLE_PPC64_H_ */ |
diff --git a/include/asm-generic/pgtable.h b/include/asm-generic/pgtable.h index db0923458940..8e4f41d9af4d 100644 --- a/include/asm-generic/pgtable.h +++ b/include/asm-generic/pgtable.h | |||
@@ -558,6 +558,18 @@ static inline pmd_t pmd_read_atomic(pmd_t *pmdp) | |||
558 | } | 558 | } |
559 | #endif | 559 | #endif |
560 | 560 | ||
561 | #ifndef pmd_move_must_withdraw | ||
562 | static inline int pmd_move_must_withdraw(spinlock_t *new_pmd_ptl, | ||
563 | spinlock_t *old_pmd_ptl) | ||
564 | { | ||
565 | /* | ||
566 | * With split pmd lock we also need to move preallocated | ||
567 | * PTE page table if new_pmd is on different PMD page table. | ||
568 | */ | ||
569 | return new_pmd_ptl != old_pmd_ptl; | ||
570 | } | ||
571 | #endif | ||
572 | |||
561 | /* | 573 | /* |
562 | * This function is meant to be used by sites walking pagetables with | 574 | * This function is meant to be used by sites walking pagetables with |
563 | * the mmap_sem hold in read mode to protect against MADV_DONTNEED and | 575 | * the mmap_sem hold in read mode to protect against MADV_DONTNEED and |
diff --git a/mm/huge_memory.c b/mm/huge_memory.c index 95d1acb0f3d2..5d80c53b87cb 100644 --- a/mm/huge_memory.c +++ b/mm/huge_memory.c | |||
@@ -1502,19 +1502,15 @@ int move_huge_pmd(struct vm_area_struct *vma, struct vm_area_struct *new_vma, | |||
1502 | spin_lock_nested(new_ptl, SINGLE_DEPTH_NESTING); | 1502 | spin_lock_nested(new_ptl, SINGLE_DEPTH_NESTING); |
1503 | pmd = pmdp_get_and_clear(mm, old_addr, old_pmd); | 1503 | pmd = pmdp_get_and_clear(mm, old_addr, old_pmd); |
1504 | VM_BUG_ON(!pmd_none(*new_pmd)); | 1504 | VM_BUG_ON(!pmd_none(*new_pmd)); |
1505 | set_pmd_at(mm, new_addr, new_pmd, pmd_mksoft_dirty(pmd)); | ||
1506 | if (new_ptl != old_ptl) { | ||
1507 | pgtable_t pgtable; | ||
1508 | 1505 | ||
1509 | /* | 1506 | if (pmd_move_must_withdraw(new_ptl, old_ptl)) { |
1510 | * Move preallocated PTE page table if new_pmd is on | 1507 | pgtable_t pgtable; |
1511 | * different PMD page table. | ||
1512 | */ | ||
1513 | pgtable = pgtable_trans_huge_withdraw(mm, old_pmd); | 1508 | pgtable = pgtable_trans_huge_withdraw(mm, old_pmd); |
1514 | pgtable_trans_huge_deposit(mm, new_pmd, pgtable); | 1509 | pgtable_trans_huge_deposit(mm, new_pmd, pgtable); |
1515 | |||
1516 | spin_unlock(new_ptl); | ||
1517 | } | 1510 | } |
1511 | set_pmd_at(mm, new_addr, new_pmd, pmd_mksoft_dirty(pmd)); | ||
1512 | if (new_ptl != old_ptl) | ||
1513 | spin_unlock(new_ptl); | ||
1518 | spin_unlock(old_ptl); | 1514 | spin_unlock(old_ptl); |
1519 | } | 1515 | } |
1520 | out: | 1516 | out: |