diff options
| author | Zachary Amsden <zach@vmware.com> | 2007-05-02 13:27:19 -0400 |
|---|---|---|
| committer | Andi Kleen <andi@basil.nowhere.org> | 2007-05-02 13:27:19 -0400 |
| commit | 142dd975911fdd82b1b6f6617cd20ac90a8ccf00 (patch) | |
| tree | 1e72e96bce64d9301d3305b4dd0b30675c8676b0 | |
| parent | c2c1accd4b2f9c82fb89d40611c7f581948db255 (diff) | |
[PATCH] i386: pte xchg optimization
In situations where page table updates need only be made locally, and there are
no cross-processor Accessed/Dirty (A/D) bit races involved, we need not use the
heavyweight xchg instruction to atomically fetch and clear page table entries.
Instead, we can just read and clear them directly.
This introduces a neat optimization for non-SMP kernels: the atomic xchg
operations are dropped from page table updates.
Thanks to Michel Lespinasse for noting this potential optimization.
Signed-off-by: Zachary Amsden <zach@vmware.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Andi Kleen <ak@suse.de>
| -rw-r--r-- | include/asm-i386/pgtable-2level.h | 14 | ||||
| -rw-r--r-- | include/asm-i386/pgtable-3level.h | 14 |
2 files changed, 28 insertions, 0 deletions
diff --git a/include/asm-i386/pgtable-2level.h b/include/asm-i386/pgtable-2level.h index 85d9005c0cdf..3daab67cd366 100644 --- a/include/asm-i386/pgtable-2level.h +++ b/include/asm-i386/pgtable-2level.h | |||
| @@ -41,10 +41,24 @@ static inline void native_pte_clear(struct mm_struct *mm, unsigned long addr, pt | |||
| 41 | *xp = __pte(0); | 41 | *xp = __pte(0); |
| 42 | } | 42 | } |
| 43 | 43 | ||
| 44 | /* local pte updates need not use xchg for locking */ | ||
| 45 | static inline pte_t native_local_ptep_get_and_clear(pte_t *ptep) | ||
| 46 | { | ||
| 47 | pte_t res; | ||
| 48 | |||
| 49 | res = *ptep; | ||
| 50 | native_pte_clear(NULL, 0, ptep); | ||
| 51 | return res; | ||
| 52 | } | ||
| 53 | |||
| 54 | #ifdef CONFIG_SMP | ||
| 44 | static inline pte_t native_ptep_get_and_clear(pte_t *xp) | 55 | static inline pte_t native_ptep_get_and_clear(pte_t *xp) |
| 45 | { | 56 | { |
| 46 | return __pte(xchg(&xp->pte_low, 0)); | 57 | return __pte(xchg(&xp->pte_low, 0)); |
| 47 | } | 58 | } |
| 59 | #else | ||
| 60 | #define native_ptep_get_and_clear(xp) native_local_ptep_get_and_clear(xp) | ||
| 61 | #endif | ||
| 48 | 62 | ||
| 49 | #define pte_page(x) pfn_to_page(pte_pfn(x)) | 63 | #define pte_page(x) pfn_to_page(pte_pfn(x)) |
| 50 | #define pte_none(x) (!(x).pte_low) | 64 | #define pte_none(x) (!(x).pte_low) |
diff --git a/include/asm-i386/pgtable-3level.h b/include/asm-i386/pgtable-3level.h index 664bfee5a2f2..45b024181507 100644 --- a/include/asm-i386/pgtable-3level.h +++ b/include/asm-i386/pgtable-3level.h | |||
| @@ -139,6 +139,17 @@ static inline void pud_clear (pud_t * pud) { } | |||
| 139 | #define pmd_offset(pud, address) ((pmd_t *) pud_page(*(pud)) + \ | 139 | #define pmd_offset(pud, address) ((pmd_t *) pud_page(*(pud)) + \ |
| 140 | pmd_index(address)) | 140 | pmd_index(address)) |
| 141 | 141 | ||
| 142 | /* local pte updates need not use xchg for locking */ | ||
| 143 | static inline pte_t native_local_ptep_get_and_clear(pte_t *ptep) | ||
| 144 | { | ||
| 145 | pte_t res; | ||
| 146 | |||
| 147 | res = *ptep; | ||
| 148 | native_pte_clear(NULL, 0, ptep); | ||
| 149 | return res; | ||
| 150 | } | ||
| 151 | |||
| 152 | #ifdef CONFIG_SMP | ||
| 142 | static inline pte_t native_ptep_get_and_clear(pte_t *ptep) | 153 | static inline pte_t native_ptep_get_and_clear(pte_t *ptep) |
| 143 | { | 154 | { |
| 144 | pte_t res; | 155 | pte_t res; |
| @@ -150,6 +161,9 @@ static inline pte_t native_ptep_get_and_clear(pte_t *ptep) | |||
| 150 | 161 | ||
| 151 | return res; | 162 | return res; |
| 152 | } | 163 | } |
| 164 | #else | ||
| 165 | #define native_ptep_get_and_clear(xp) native_local_ptep_get_and_clear(xp) | ||
| 166 | #endif | ||
| 153 | 167 | ||
| 154 | #define __HAVE_ARCH_PTE_SAME | 168 | #define __HAVE_ARCH_PTE_SAME |
| 155 | static inline int pte_same(pte_t a, pte_t b) | 169 | static inline int pte_same(pte_t a, pte_t b) |
