diff options
author | Christian Borntraeger <borntraeger@de.ibm.com> | 2014-12-07 15:41:33 -0500 |
---|---|---|
committer | Christian Borntraeger <borntraeger@de.ibm.com> | 2014-12-18 03:54:37 -0500 |
commit | e37c698270633327245beb0fbd8699db8a4b65b4 (patch) | |
tree | ed83173785e55c3f91467a19d8c4033e723a98e9 /mm | |
parent | 230fa253df6352af12ad0a16128760b5cb3f92df (diff) |
mm: replace ACCESS_ONCE with READ_ONCE or barriers
ACCESS_ONCE does not work reliably on non-scalar types. For
example, gcc 4.6 and 4.7 might remove the volatile tag for such
accesses during the SRA (scalar replacement of aggregates) step
(https://gcc.gnu.org/bugzilla/show_bug.cgi?id=58145).
Let's change the code to access the page table elements with
READ_ONCE that does implicit scalar accesses for the gup code.
mm_find_pmd is tricky, because m68k and sparc (32-bit) define pmd_t
as an array of longs. This code requires just that the pmd_present
and pmd_trans_huge checks are done on the same value, so a barrier
is sufficient.
A similar case is in handle_pte_fault. On ppc44x the word size is
32 bit, but a pte is 64 bit. A barrier is ok as well.
Signed-off-by: Christian Borntraeger <borntraeger@de.ibm.com>
Cc: linux-mm@kvack.org
Acked-by: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
Diffstat (limited to 'mm')
-rw-r--r-- | mm/gup.c | 2 | ||||
-rw-r--r-- | mm/memory.c | 11 | ||||
-rw-r--r-- | mm/rmap.c | 3 |
3 files changed, 13 insertions, 3 deletions
@@ -917,7 +917,7 @@ static int gup_pud_range(pgd_t *pgdp, unsigned long addr, unsigned long end, | |||
917 | 917 | ||
918 | pudp = pud_offset(pgdp, addr); | 918 | pudp = pud_offset(pgdp, addr); |
919 | do { | 919 | do { |
920 | pud_t pud = ACCESS_ONCE(*pudp); | 920 | pud_t pud = READ_ONCE(*pudp); |
921 | 921 | ||
922 | next = pud_addr_end(addr, end); | 922 | next = pud_addr_end(addr, end); |
923 | if (pud_none(pud)) | 923 | if (pud_none(pud)) |
diff --git a/mm/memory.c b/mm/memory.c index 3e503831e042..d86aa88902a0 100644 --- a/mm/memory.c +++ b/mm/memory.c | |||
@@ -3202,7 +3202,16 @@ static int handle_pte_fault(struct mm_struct *mm, | |||
3202 | pte_t entry; | 3202 | pte_t entry; |
3203 | spinlock_t *ptl; | 3203 | spinlock_t *ptl; |
3204 | 3204 | ||
3205 | entry = ACCESS_ONCE(*pte); | 3205 | /* |
3206 | * some architectures can have larger ptes than wordsize, | ||
3207 | * e.g.ppc44x-defconfig has CONFIG_PTE_64BIT=y and CONFIG_32BIT=y, | ||
3208 | * so READ_ONCE or ACCESS_ONCE cannot guarantee atomic accesses. | ||
3209 | * The code below just needs a consistent view for the ifs and | ||
3210 | * we later double check anyway with the ptl lock held. So here | ||
3211 | * a barrier will do. | ||
3212 | */ | ||
3213 | entry = *pte; | ||
3214 | barrier(); | ||
3206 | if (!pte_present(entry)) { | 3215 | if (!pte_present(entry)) { |
3207 | if (pte_none(entry)) { | 3216 | if (pte_none(entry)) { |
3208 | if (vma->vm_ops) { | 3217 | if (vma->vm_ops) { |
@@ -581,7 +581,8 @@ pmd_t *mm_find_pmd(struct mm_struct *mm, unsigned long address) | |||
581 | * without holding anon_vma lock for write. So when looking for a | 581 | * without holding anon_vma lock for write. So when looking for a |
582 | * genuine pmde (in which to find pte), test present and !THP together. | 582 | * genuine pmde (in which to find pte), test present and !THP together. |
583 | */ | 583 | */ |
584 | pmde = ACCESS_ONCE(*pmd); | 584 | pmde = *pmd; |
585 | barrier(); | ||
585 | if (!pmd_present(pmde) || pmd_trans_huge(pmde)) | 586 | if (!pmd_present(pmde) || pmd_trans_huge(pmde)) |
586 | pmd = NULL; | 587 | pmd = NULL; |
587 | out: | 588 | out: |