diff options
| -rw-r--r-- | arch/arm/mm/Kconfig | 8 | ||||
| -rw-r--r-- | arch/arm/mm/cache-xsc3l2.c | 182 | ||||
| -rw-r--r-- | arch/arm/mm/proc-xsc3.S | 22 |
3 files changed, 190 insertions, 22 deletions
diff --git a/arch/arm/mm/Kconfig b/arch/arm/mm/Kconfig index 399d1d66bf93..ed15f876c725 100644 --- a/arch/arm/mm/Kconfig +++ b/arch/arm/mm/Kconfig | |||
| @@ -742,3 +742,11 @@ config CACHE_L2X0 | |||
| 742 | select OUTER_CACHE | 742 | select OUTER_CACHE |
| 743 | help | 743 | help |
| 744 | This option enables the L2x0 PrimeCell. | 744 | This option enables the L2x0 PrimeCell. |
| 745 | |||
| 746 | config CACHE_XSC3L2 | ||
| 747 | bool "Enable the L2 cache on XScale3" | ||
| 748 | depends on CPU_XSC3 | ||
| 749 | default y | ||
| 750 | select OUTER_CACHE | ||
| 751 | help | ||
| 752 | This option enables the L2 cache on XScale3. | ||
diff --git a/arch/arm/mm/cache-xsc3l2.c b/arch/arm/mm/cache-xsc3l2.c new file mode 100644 index 000000000000..158bd96763d3 --- /dev/null +++ b/arch/arm/mm/cache-xsc3l2.c | |||
| @@ -0,0 +1,182 @@ | |||
| 1 | /* | ||
| 2 | * arch/arm/mm/cache-xsc3l2.c - XScale3 L2 cache controller support | ||
| 3 | * | ||
| 4 | * Copyright (C) 2007 ARM Limited | ||
| 5 | * | ||
| 6 | * This program is free software; you can redistribute it and/or modify | ||
| 7 | * it under the terms of the GNU General Public License version 2 as | ||
| 8 | * published by the Free Software Foundation. | ||
| 9 | * | ||
| 10 | * This program is distributed in the hope that it will be useful, | ||
| 11 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
| 12 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
| 13 | * GNU General Public License for more details. | ||
| 14 | * | ||
| 15 | * You should have received a copy of the GNU General Public License | ||
| 16 | * along with this program; if not, write to the Free Software | ||
| 17 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | ||
| 18 | */ | ||
| 19 | #include <linux/init.h> | ||
| 20 | #include <linux/spinlock.h> | ||
| 21 | |||
| 22 | #include <asm/system.h> | ||
| 23 | #include <asm/cacheflush.h> | ||
| 24 | #include <asm/io.h> | ||
| 25 | |||
| 26 | #define CR_L2 (1 << 26) | ||
| 27 | |||
| 28 | #define CACHE_LINE_SIZE 32 | ||
| 29 | #define CACHE_LINE_SHIFT 5 | ||
| 30 | #define CACHE_WAY_PER_SET 8 | ||
| 31 | |||
| 32 | #define CACHE_WAY_SIZE(l2ctype) (8192 << (((l2ctype) >> 8) & 0xf)) | ||
| 33 | #define CACHE_SET_SIZE(l2ctype) (CACHE_WAY_SIZE(l2ctype) >> CACHE_LINE_SHIFT) | ||
| 34 | |||
| 35 | static inline int xsc3_l2_present(void) | ||
| 36 | { | ||
| 37 | unsigned long l2ctype; | ||
| 38 | |||
| 39 | __asm__("mrc p15, 1, %0, c0, c0, 1" : "=r" (l2ctype)); | ||
| 40 | |||
| 41 | return !!(l2ctype & 0xf8); | ||
| 42 | } | ||
| 43 | |||
| 44 | static inline void xsc3_l2_clean_mva(unsigned long addr) | ||
| 45 | { | ||
| 46 | __asm__("mcr p15, 1, %0, c7, c11, 1" : : "r" (addr)); | ||
| 47 | } | ||
| 48 | |||
| 49 | static inline void xsc3_l2_clean_pa(unsigned long addr) | ||
| 50 | { | ||
| 51 | xsc3_l2_clean_mva(__phys_to_virt(addr)); | ||
| 52 | } | ||
| 53 | |||
| 54 | static inline void xsc3_l2_inv_mva(unsigned long addr) | ||
| 55 | { | ||
| 56 | __asm__("mcr p15, 1, %0, c7, c7, 1" : : "r" (addr)); | ||
| 57 | } | ||
| 58 | |||
| 59 | static inline void xsc3_l2_inv_pa(unsigned long addr) | ||
| 60 | { | ||
| 61 | xsc3_l2_inv_mva(__phys_to_virt(addr)); | ||
| 62 | } | ||
| 63 | |||
| 64 | static inline void xsc3_l2_inv_all(void) | ||
| 65 | { | ||
| 66 | unsigned long l2ctype, set_way; | ||
| 67 | int set, way; | ||
| 68 | |||
| 69 | __asm__("mrc p15, 1, %0, c0, c0, 1" : "=r" (l2ctype)); | ||
| 70 | |||
| 71 | for (set = 0; set < CACHE_SET_SIZE(l2ctype); set++) { | ||
| 72 | for (way = 0; way < CACHE_WAY_PER_SET; way++) { | ||
| 73 | set_way = (way << 29) | (set << 5); | ||
| 74 | __asm__("mcr p15, 1, %0, c7, c11, 2" : : "r"(set_way)); | ||
| 75 | } | ||
| 76 | } | ||
| 77 | |||
| 78 | dsb(); | ||
| 79 | } | ||
| 80 | |||
| 81 | static void xsc3_l2_inv_range(unsigned long start, unsigned long end) | ||
| 82 | { | ||
| 83 | if (start == 0 && end == -1ul) { | ||
| 84 | xsc3_l2_inv_all(); | ||
| 85 | return; | ||
| 86 | } | ||
| 87 | |||
| 88 | /* | ||
| 89 | * Clean and invalidate partial first cache line. | ||
| 90 | */ | ||
| 91 | if (start & (CACHE_LINE_SIZE - 1)) { | ||
| 92 | xsc3_l2_clean_pa(start & ~(CACHE_LINE_SIZE - 1)); | ||
| 93 | xsc3_l2_inv_pa(start & ~(CACHE_LINE_SIZE - 1)); | ||
| 94 | start = (start | (CACHE_LINE_SIZE - 1)) + 1; | ||
| 95 | } | ||
| 96 | |||
| 97 | /* | ||
| 98 | * Clean and invalidate partial last cache line. | ||
| 99 | */ | ||
| 100 | if (end & (CACHE_LINE_SIZE - 1)) { | ||
| 101 | xsc3_l2_clean_pa(end & ~(CACHE_LINE_SIZE - 1)); | ||
| 102 | xsc3_l2_inv_pa(end & ~(CACHE_LINE_SIZE - 1)); | ||
| 103 | end &= ~(CACHE_LINE_SIZE - 1); | ||
| 104 | } | ||
| 105 | |||
| 106 | /* | ||
| 107 | * Invalidate all full cache lines between 'start' and 'end'. | ||
| 108 | */ | ||
| 109 | while (start != end) { | ||
| 110 | xsc3_l2_inv_pa(start); | ||
| 111 | start += CACHE_LINE_SIZE; | ||
| 112 | } | ||
| 113 | |||
| 114 | dsb(); | ||
| 115 | } | ||
| 116 | |||
| 117 | static void xsc3_l2_clean_range(unsigned long start, unsigned long end) | ||
| 118 | { | ||
| 119 | start &= ~(CACHE_LINE_SIZE - 1); | ||
| 120 | while (start < end) { | ||
| 121 | xsc3_l2_clean_pa(start); | ||
| 122 | start += CACHE_LINE_SIZE; | ||
| 123 | } | ||
| 124 | |||
| 125 | dsb(); | ||
| 126 | } | ||
| 127 | |||
| 128 | /* | ||
| 129 | * optimize L2 flush all operation by set/way format | ||
| 130 | */ | ||
| 131 | static inline void xsc3_l2_flush_all(void) | ||
| 132 | { | ||
| 133 | unsigned long l2ctype, set_way; | ||
| 134 | int set, way; | ||
| 135 | |||
| 136 | __asm__("mrc p15, 1, %0, c0, c0, 1" : "=r" (l2ctype)); | ||
| 137 | |||
| 138 | for (set = 0; set < CACHE_SET_SIZE(l2ctype); set++) { | ||
| 139 | for (way = 0; way < CACHE_WAY_PER_SET; way++) { | ||
| 140 | set_way = (way << 29) | (set << 5); | ||
| 141 | __asm__("mcr p15, 1, %0, c7, c15, 2" : : "r"(set_way)); | ||
| 142 | } | ||
| 143 | } | ||
| 144 | |||
| 145 | dsb(); | ||
| 146 | } | ||
| 147 | |||
| 148 | static void xsc3_l2_flush_range(unsigned long start, unsigned long end) | ||
| 149 | { | ||
| 150 | if (start == 0 && end == -1ul) { | ||
| 151 | xsc3_l2_flush_all(); | ||
| 152 | return; | ||
| 153 | } | ||
| 154 | |||
| 155 | start &= ~(CACHE_LINE_SIZE - 1); | ||
| 156 | while (start < end) { | ||
| 157 | xsc3_l2_clean_pa(start); | ||
| 158 | xsc3_l2_inv_pa(start); | ||
| 159 | start += CACHE_LINE_SIZE; | ||
| 160 | } | ||
| 161 | |||
| 162 | dsb(); | ||
| 163 | } | ||
| 164 | |||
| 165 | static int __init xsc3_l2_init(void) | ||
| 166 | { | ||
| 167 | if (!cpu_is_xsc3() || !xsc3_l2_present()) | ||
| 168 | return 0; | ||
| 169 | |||
| 170 | if (!(get_cr() & CR_L2)) { | ||
| 171 | pr_info("XScale3 L2 cache enabled.\n"); | ||
| 172 | adjust_cr(CR_L2, CR_L2); | ||
| 173 | xsc3_l2_inv_all(); | ||
| 174 | } | ||
| 175 | |||
| 176 | outer_cache.inv_range = xsc3_l2_inv_range; | ||
| 177 | outer_cache.clean_range = xsc3_l2_clean_range; | ||
| 178 | outer_cache.flush_range = xsc3_l2_flush_range; | ||
| 179 | |||
| 180 | return 0; | ||
| 181 | } | ||
| 182 | core_initcall(xsc3_l2_init); | ||
diff --git a/arch/arm/mm/proc-xsc3.S b/arch/arm/mm/proc-xsc3.S index 3533741a76f6..6ff53c24510f 100644 --- a/arch/arm/mm/proc-xsc3.S +++ b/arch/arm/mm/proc-xsc3.S | |||
| @@ -52,11 +52,6 @@ | |||
| 52 | #define CACHESIZE 32768 | 52 | #define CACHESIZE 32768 |
| 53 | 53 | ||
| 54 | /* | 54 | /* |
| 55 | * Run with L2 enabled. | ||
| 56 | */ | ||
| 57 | #define L2_CACHE_ENABLE 1 | ||
| 58 | |||
| 59 | /* | ||
| 60 | * This macro is used to wait for a CP15 write and is needed when we | 55 | * This macro is used to wait for a CP15 write and is needed when we |
| 61 | * have to ensure that the last operation to the coprocessor was | 56 | * have to ensure that the last operation to the coprocessor was |
| 62 | * completed before continuing with operation. | 57 | * completed before continuing with operation. |
| @@ -265,12 +260,9 @@ ENTRY(xsc3_dma_inv_range) | |||
| 265 | tst r0, #CACHELINESIZE - 1 | 260 | tst r0, #CACHELINESIZE - 1 |
| 266 | bic r0, r0, #CACHELINESIZE - 1 | 261 | bic r0, r0, #CACHELINESIZE - 1 |
| 267 | mcrne p15, 0, r0, c7, c10, 1 @ clean L1 D line | 262 | mcrne p15, 0, r0, c7, c10, 1 @ clean L1 D line |
| 268 | mcrne p15, 1, r0, c7, c11, 1 @ clean L2 line | ||
| 269 | tst r1, #CACHELINESIZE - 1 | 263 | tst r1, #CACHELINESIZE - 1 |
| 270 | mcrne p15, 0, r1, c7, c10, 1 @ clean L1 D line | 264 | mcrne p15, 0, r1, c7, c10, 1 @ clean L1 D line |
| 271 | mcrne p15, 1, r1, c7, c11, 1 @ clean L2 line | ||
| 272 | 1: mcr p15, 0, r0, c7, c6, 1 @ invalidate L1 D line | 265 | 1: mcr p15, 0, r0, c7, c6, 1 @ invalidate L1 D line |
| 273 | mcr p15, 1, r0, c7, c7, 1 @ invalidate L2 line | ||
| 274 | add r0, r0, #CACHELINESIZE | 266 | add r0, r0, #CACHELINESIZE |
| 275 | cmp r0, r1 | 267 | cmp r0, r1 |
| 276 | blo 1b | 268 | blo 1b |
| @@ -288,7 +280,6 @@ ENTRY(xsc3_dma_inv_range) | |||
| 288 | ENTRY(xsc3_dma_clean_range) | 280 | ENTRY(xsc3_dma_clean_range) |
| 289 | bic r0, r0, #CACHELINESIZE - 1 | 281 | bic r0, r0, #CACHELINESIZE - 1 |
| 290 | 1: mcr p15, 0, r0, c7, c10, 1 @ clean L1 D line | 282 | 1: mcr p15, 0, r0, c7, c10, 1 @ clean L1 D line |
| 291 | mcr p15, 1, r0, c7, c11, 1 @ clean L2 line | ||
| 292 | add r0, r0, #CACHELINESIZE | 283 | add r0, r0, #CACHELINESIZE |
| 293 | cmp r0, r1 | 284 | cmp r0, r1 |
| 294 | blo 1b | 285 | blo 1b |
| @@ -306,8 +297,6 @@ ENTRY(xsc3_dma_clean_range) | |||
| 306 | ENTRY(xsc3_dma_flush_range) | 297 | ENTRY(xsc3_dma_flush_range) |
| 307 | bic r0, r0, #CACHELINESIZE - 1 | 298 | bic r0, r0, #CACHELINESIZE - 1 |
| 308 | 1: mcr p15, 0, r0, c7, c14, 1 @ clean/invalidate L1 D line | 299 | 1: mcr p15, 0, r0, c7, c14, 1 @ clean/invalidate L1 D line |
| 309 | mcr p15, 1, r0, c7, c11, 1 @ clean L2 line | ||
| 310 | mcr p15, 1, r0, c7, c7, 1 @ invalidate L2 line | ||
| 311 | add r0, r0, #CACHELINESIZE | 300 | add r0, r0, #CACHELINESIZE |
| 312 | cmp r0, r1 | 301 | cmp r0, r1 |
| 313 | blo 1b | 302 | blo 1b |
| @@ -347,9 +336,7 @@ ENTRY(cpu_xsc3_switch_mm) | |||
| 347 | mcr p15, 0, ip, c7, c5, 0 @ invalidate L1 I cache and BTB | 336 | mcr p15, 0, ip, c7, c5, 0 @ invalidate L1 I cache and BTB |
| 348 | mcr p15, 0, ip, c7, c10, 4 @ data write barrier | 337 | mcr p15, 0, ip, c7, c10, 4 @ data write barrier |
| 349 | mcr p15, 0, ip, c7, c5, 4 @ prefetch flush | 338 | mcr p15, 0, ip, c7, c5, 4 @ prefetch flush |
| 350 | #ifdef L2_CACHE_ENABLE | ||
| 351 | orr r0, r0, #0x18 @ cache the page table in L2 | 339 | orr r0, r0, #0x18 @ cache the page table in L2 |
| 352 | #endif | ||
| 353 | mcr p15, 0, r0, c2, c0, 0 @ load page table pointer | 340 | mcr p15, 0, r0, c2, c0, 0 @ load page table pointer |
| 354 | mcr p15, 0, ip, c8, c7, 0 @ invalidate I and D TLBs | 341 | mcr p15, 0, ip, c8, c7, 0 @ invalidate I and D TLBs |
| 355 | cpwait_ret lr, ip | 342 | cpwait_ret lr, ip |
| @@ -378,12 +365,10 @@ ENTRY(cpu_xsc3_set_pte_ext) | |||
| 378 | orreq r2, r2, #PTE_EXT_AP_UNO_SRW @ yes -> user n/a, system r/w | 365 | orreq r2, r2, #PTE_EXT_AP_UNO_SRW @ yes -> user n/a, system r/w |
| 379 | @ combined with user -> user r/w | 366 | @ combined with user -> user r/w |
| 380 | 367 | ||
| 381 | #if L2_CACHE_ENABLE | ||
| 382 | @ If it's cacheable, it needs to be in L2 also. | 368 | @ If it's cacheable, it needs to be in L2 also. |
| 383 | eor ip, r1, #L_PTE_CACHEABLE | 369 | eor ip, r1, #L_PTE_CACHEABLE |
| 384 | tst ip, #L_PTE_CACHEABLE | 370 | tst ip, #L_PTE_CACHEABLE |
| 385 | orreq r2, r2, #PTE_EXT_TEX(0x5) | 371 | orreq r2, r2, #PTE_EXT_TEX(0x5) |
| 386 | #endif | ||
| 387 | 372 | ||
| 388 | tst r3, #L_PTE_PRESENT | L_PTE_YOUNG @ present and young? | 373 | tst r3, #L_PTE_PRESENT | L_PTE_YOUNG @ present and young? |
| 389 | movne r2, #0 @ no -> fault | 374 | movne r2, #0 @ no -> fault |
| @@ -408,9 +393,7 @@ __xsc3_setup: | |||
| 408 | mcr p15, 0, ip, c7, c10, 4 @ data write barrier | 393 | mcr p15, 0, ip, c7, c10, 4 @ data write barrier |
| 409 | mcr p15, 0, ip, c7, c5, 4 @ prefetch flush | 394 | mcr p15, 0, ip, c7, c5, 4 @ prefetch flush |
| 410 | mcr p15, 0, ip, c8, c7, 0 @ invalidate I and D TLBs | 395 | mcr p15, 0, ip, c8, c7, 0 @ invalidate I and D TLBs |
| 411 | #if L2_CACHE_ENABLE | ||
| 412 | orr r4, r4, #0x18 @ cache the page table in L2 | 396 | orr r4, r4, #0x18 @ cache the page table in L2 |
| 413 | #endif | ||
| 414 | mcr p15, 0, r4, c2, c0, 0 @ load page table pointer | 397 | mcr p15, 0, r4, c2, c0, 0 @ load page table pointer |
| 415 | 398 | ||
| 416 | mov r0, #0 @ don't allow CP access | 399 | mov r0, #0 @ don't allow CP access |
| @@ -418,9 +401,7 @@ __xsc3_setup: | |||
| 418 | 401 | ||
| 419 | mrc p15, 0, r0, c1, c0, 1 @ get auxiliary control reg | 402 | mrc p15, 0, r0, c1, c0, 1 @ get auxiliary control reg |
| 420 | and r0, r0, #2 @ preserve bit P bit setting | 403 | and r0, r0, #2 @ preserve bit P bit setting |
| 421 | #if L2_CACHE_ENABLE | ||
| 422 | orr r0, r0, #(1 << 10) @ enable L2 for LLR cache | 404 | orr r0, r0, #(1 << 10) @ enable L2 for LLR cache |
| 423 | #endif | ||
| 424 | mcr p15, 0, r0, c1, c0, 1 @ set auxiliary control reg | 405 | mcr p15, 0, r0, c1, c0, 1 @ set auxiliary control reg |
| 425 | 406 | ||
| 426 | adr r5, xsc3_crval | 407 | adr r5, xsc3_crval |
| @@ -429,9 +410,6 @@ __xsc3_setup: | |||
| 429 | bic r0, r0, r5 @ ..V. ..R. .... ..A. | 410 | bic r0, r0, r5 @ ..V. ..R. .... ..A. |
| 430 | orr r0, r0, r6 @ ..VI Z..S .... .C.M (mmu) | 411 | orr r0, r0, r6 @ ..VI Z..S .... .C.M (mmu) |
| 431 | @ ...I Z..S .... .... (uc) | 412 | @ ...I Z..S .... .... (uc) |
| 432 | #if L2_CACHE_ENABLE | ||
| 433 | orr r0, r0, #0x04000000 @ L2 enable | ||
| 434 | #endif | ||
| 435 | mov pc, lr | 413 | mov pc, lr |
| 436 | 414 | ||
| 437 | .size __xsc3_setup, . - __xsc3_setup | 415 | .size __xsc3_setup, . - __xsc3_setup |
