diff options
| author | Tony Luck <tony.luck@intel.com> | 2008-04-17 13:13:57 -0400 |
|---|---|---|
| committer | Tony Luck <tony.luck@intel.com> | 2008-04-17 13:13:57 -0400 |
| commit | f4df39cbdd9e9ab615e80148cc271db22a8508ad (patch) | |
| tree | 312fcf9de1154c85782c121a46fa2952f9812292 | |
| parent | a49072bb367a94a9af6c6a6dcbaa1dc5617d7fa0 (diff) | |
| parent | a6c75b86ce9f01db4ea9912877b526c2dc4d2f0a (diff) | |
Pull nptcg into release branch
Conflicts:
arch/ia64/mm/tlb.c
| -rw-r--r-- | Documentation/kernel-parameters.txt | 4 | ||||
| -rw-r--r-- | arch/ia64/kernel/efi.c | 46 | ||||
| -rw-r--r-- | arch/ia64/kernel/setup.c | 6 | ||||
| -rw-r--r-- | arch/ia64/mm/tlb.c | 161 | ||||
| -rw-r--r-- | include/asm-ia64/sal.h | 21 | ||||
| -rw-r--r-- | include/asm-ia64/tlbflush.h | 1 |
6 files changed, 222 insertions, 17 deletions
diff --git a/Documentation/kernel-parameters.txt b/Documentation/kernel-parameters.txt index dafd001bf833..5389acf9e075 100644 --- a/Documentation/kernel-parameters.txt +++ b/Documentation/kernel-parameters.txt | |||
| @@ -1339,6 +1339,10 @@ and is between 256 and 4096 characters. It is defined in the file | |||
| 1339 | 1339 | ||
| 1340 | nowb [ARM] | 1340 | nowb [ARM] |
| 1341 | 1341 | ||
| 1342 | nptcg= [IA64] Override max number of concurrent global TLB | ||
| 1343 | purges which is reported from either PAL_VM_SUMMARY or | ||
| 1344 | SAL PALO. | ||
| 1345 | |||
| 1342 | numa_zonelist_order= [KNL, BOOT] Select zonelist order for NUMA. | 1346 | numa_zonelist_order= [KNL, BOOT] Select zonelist order for NUMA. |
| 1343 | one of ['zone', 'node', 'default'] can be specified | 1347 | one of ['zone', 'node', 'default'] can be specified |
| 1344 | This can be set from sysctl after boot. | 1348 | This can be set from sysctl after boot. |
diff --git a/arch/ia64/kernel/efi.c b/arch/ia64/kernel/efi.c index 728d7247a1a6..d45f215bc8fc 100644 --- a/arch/ia64/kernel/efi.c +++ b/arch/ia64/kernel/efi.c | |||
| @@ -37,6 +37,7 @@ | |||
| 37 | #include <asm/pgtable.h> | 37 | #include <asm/pgtable.h> |
| 38 | #include <asm/processor.h> | 38 | #include <asm/processor.h> |
| 39 | #include <asm/mca.h> | 39 | #include <asm/mca.h> |
| 40 | #include <asm/tlbflush.h> | ||
| 40 | 41 | ||
| 41 | #define EFI_DEBUG 0 | 42 | #define EFI_DEBUG 0 |
| 42 | 43 | ||
| @@ -403,6 +404,41 @@ efi_get_pal_addr (void) | |||
| 403 | return NULL; | 404 | return NULL; |
| 404 | } | 405 | } |
| 405 | 406 | ||
| 407 | |||
| 408 | static u8 __init palo_checksum(u8 *buffer, u32 length) | ||
| 409 | { | ||
| 410 | u8 sum = 0; | ||
| 411 | u8 *end = buffer + length; | ||
| 412 | |||
| 413 | while (buffer < end) | ||
| 414 | sum = (u8) (sum + *(buffer++)); | ||
| 415 | |||
| 416 | return sum; | ||
| 417 | } | ||
| 418 | |||
| 419 | /* | ||
| 420 | * Parse and handle PALO table which is published at: | ||
| 421 | * http://www.dig64.org/home/DIG64_PALO_R1_0.pdf | ||
| 422 | */ | ||
| 423 | static void __init handle_palo(unsigned long palo_phys) | ||
| 424 | { | ||
| 425 | struct palo_table *palo = __va(palo_phys); | ||
| 426 | u8 checksum; | ||
| 427 | |||
| 428 | if (strncmp(palo->signature, PALO_SIG, sizeof(PALO_SIG) - 1)) { | ||
| 429 | printk(KERN_INFO "PALO signature incorrect.\n"); | ||
| 430 | return; | ||
| 431 | } | ||
| 432 | |||
| 433 | checksum = palo_checksum((u8 *)palo, palo->length); | ||
| 434 | if (checksum) { | ||
| 435 | printk(KERN_INFO "PALO checksum incorrect.\n"); | ||
| 436 | return; | ||
| 437 | } | ||
| 438 | |||
| 439 | setup_ptcg_sem(palo->max_tlb_purges, NPTCG_FROM_PALO); | ||
| 440 | } | ||
| 441 | |||
| 406 | void | 442 | void |
| 407 | efi_map_pal_code (void) | 443 | efi_map_pal_code (void) |
| 408 | { | 444 | { |
| @@ -432,6 +468,7 @@ efi_init (void) | |||
| 432 | u64 efi_desc_size; | 468 | u64 efi_desc_size; |
| 433 | char *cp, vendor[100] = "unknown"; | 469 | char *cp, vendor[100] = "unknown"; |
| 434 | int i; | 470 | int i; |
| 471 | unsigned long palo_phys; | ||
| 435 | 472 | ||
| 436 | /* | 473 | /* |
| 437 | * It's too early to be able to use the standard kernel command line | 474 | * It's too early to be able to use the standard kernel command line |
| @@ -496,6 +533,8 @@ efi_init (void) | |||
| 496 | efi.hcdp = EFI_INVALID_TABLE_ADDR; | 533 | efi.hcdp = EFI_INVALID_TABLE_ADDR; |
| 497 | efi.uga = EFI_INVALID_TABLE_ADDR; | 534 | efi.uga = EFI_INVALID_TABLE_ADDR; |
| 498 | 535 | ||
| 536 | palo_phys = EFI_INVALID_TABLE_ADDR; | ||
| 537 | |||
| 499 | for (i = 0; i < (int) efi.systab->nr_tables; i++) { | 538 | for (i = 0; i < (int) efi.systab->nr_tables; i++) { |
| 500 | if (efi_guidcmp(config_tables[i].guid, MPS_TABLE_GUID) == 0) { | 539 | if (efi_guidcmp(config_tables[i].guid, MPS_TABLE_GUID) == 0) { |
| 501 | efi.mps = config_tables[i].table; | 540 | efi.mps = config_tables[i].table; |
| @@ -515,10 +554,17 @@ efi_init (void) | |||
| 515 | } else if (efi_guidcmp(config_tables[i].guid, HCDP_TABLE_GUID) == 0) { | 554 | } else if (efi_guidcmp(config_tables[i].guid, HCDP_TABLE_GUID) == 0) { |
| 516 | efi.hcdp = config_tables[i].table; | 555 | efi.hcdp = config_tables[i].table; |
| 517 | printk(" HCDP=0x%lx", config_tables[i].table); | 556 | printk(" HCDP=0x%lx", config_tables[i].table); |
| 557 | } else if (efi_guidcmp(config_tables[i].guid, | ||
| 558 | PROCESSOR_ABSTRACTION_LAYER_OVERWRITE_GUID) == 0) { | ||
| 559 | palo_phys = config_tables[i].table; | ||
| 560 | printk(" PALO=0x%lx", config_tables[i].table); | ||
| 518 | } | 561 | } |
| 519 | } | 562 | } |
| 520 | printk("\n"); | 563 | printk("\n"); |
| 521 | 564 | ||
| 565 | if (palo_phys != EFI_INVALID_TABLE_ADDR) | ||
| 566 | handle_palo(palo_phys); | ||
| 567 | |||
| 522 | runtime = __va(efi.systab->runtime); | 568 | runtime = __va(efi.systab->runtime); |
| 523 | efi.get_time = phys_get_time; | 569 | efi.get_time = phys_get_time; |
| 524 | efi.set_time = phys_set_time; | 570 | efi.set_time = phys_set_time; |
diff --git a/arch/ia64/kernel/setup.c b/arch/ia64/kernel/setup.c index 6206541f9e87..b86a072418a2 100644 --- a/arch/ia64/kernel/setup.c +++ b/arch/ia64/kernel/setup.c | |||
| @@ -59,6 +59,7 @@ | |||
| 59 | #include <asm/setup.h> | 59 | #include <asm/setup.h> |
| 60 | #include <asm/smp.h> | 60 | #include <asm/smp.h> |
| 61 | #include <asm/system.h> | 61 | #include <asm/system.h> |
| 62 | #include <asm/tlbflush.h> | ||
| 62 | #include <asm/unistd.h> | 63 | #include <asm/unistd.h> |
| 63 | #include <asm/hpsim.h> | 64 | #include <asm/hpsim.h> |
| 64 | 65 | ||
| @@ -948,9 +949,10 @@ cpu_init (void) | |||
| 948 | #endif | 949 | #endif |
| 949 | 950 | ||
| 950 | /* set ia64_ctx.max_rid to the maximum RID that is supported by all CPUs: */ | 951 | /* set ia64_ctx.max_rid to the maximum RID that is supported by all CPUs: */ |
| 951 | if (ia64_pal_vm_summary(NULL, &vmi) == 0) | 952 | if (ia64_pal_vm_summary(NULL, &vmi) == 0) { |
| 952 | max_ctx = (1U << (vmi.pal_vm_info_2_s.rid_size - 3)) - 1; | 953 | max_ctx = (1U << (vmi.pal_vm_info_2_s.rid_size - 3)) - 1; |
| 953 | else { | 954 | setup_ptcg_sem(vmi.pal_vm_info_2_s.max_purges, NPTCG_FROM_PAL); |
| 955 | } else { | ||
| 954 | printk(KERN_WARNING "cpu_init: PAL VM summary failed, assuming 18 RID bits\n"); | 956 | printk(KERN_WARNING "cpu_init: PAL VM summary failed, assuming 18 RID bits\n"); |
| 955 | max_ctx = (1U << 15) - 1; /* use architected minimum */ | 957 | max_ctx = (1U << 15) - 1; /* use architected minimum */ |
| 956 | } | 958 | } |
diff --git a/arch/ia64/mm/tlb.c b/arch/ia64/mm/tlb.c index 3d8903f936a5..d52ec4e83409 100644 --- a/arch/ia64/mm/tlb.c +++ b/arch/ia64/mm/tlb.c | |||
| @@ -11,6 +11,9 @@ | |||
| 11 | * Rohit Seth <rohit.seth@intel.com> | 11 | * Rohit Seth <rohit.seth@intel.com> |
| 12 | * Ken Chen <kenneth.w.chen@intel.com> | 12 | * Ken Chen <kenneth.w.chen@intel.com> |
| 13 | * Christophe de Dinechin <ddd@hp.com>: Avoid ptc.e on memory allocation | 13 | * Christophe de Dinechin <ddd@hp.com>: Avoid ptc.e on memory allocation |
| 14 | * Copyright (C) 2007 Intel Corp | ||
| 15 | * Fenghua Yu <fenghua.yu@intel.com> | ||
| 16 | * Add multiple ptc.g/ptc.ga instruction support in global tlb purge. | ||
| 14 | */ | 17 | */ |
| 15 | #include <linux/module.h> | 18 | #include <linux/module.h> |
| 16 | #include <linux/init.h> | 19 | #include <linux/init.h> |
| @@ -27,6 +30,7 @@ | |||
| 27 | #include <asm/tlbflush.h> | 30 | #include <asm/tlbflush.h> |
| 28 | #include <asm/dma.h> | 31 | #include <asm/dma.h> |
| 29 | #include <asm/processor.h> | 32 | #include <asm/processor.h> |
| 33 | #include <asm/sal.h> | ||
| 30 | #include <asm/tlb.h> | 34 | #include <asm/tlb.h> |
| 31 | 35 | ||
| 32 | static struct { | 36 | static struct { |
| @@ -90,14 +94,140 @@ wrap_mmu_context (struct mm_struct *mm) | |||
| 90 | local_flush_tlb_all(); | 94 | local_flush_tlb_all(); |
| 91 | } | 95 | } |
| 92 | 96 | ||
| 97 | /* | ||
| 98 | * Implement "spinaphores" ... like counting semaphores, but they | ||
| 99 | * spin instead of sleeping. If there are ever any other users for | ||
| 100 | * this primitive it can be moved up to a spinaphore.h header. | ||
| 101 | */ | ||
| 102 | struct spinaphore { | ||
| 103 | atomic_t cur; | ||
| 104 | }; | ||
| 105 | |||
| 106 | static inline void spinaphore_init(struct spinaphore *ss, int val) | ||
| 107 | { | ||
| 108 | atomic_set(&ss->cur, val); | ||
| 109 | } | ||
| 110 | |||
| 111 | static inline void down_spin(struct spinaphore *ss) | ||
| 112 | { | ||
| 113 | while (unlikely(!atomic_add_unless(&ss->cur, -1, 0))) | ||
| 114 | while (atomic_read(&ss->cur) == 0) | ||
| 115 | cpu_relax(); | ||
| 116 | } | ||
| 117 | |||
| 118 | static inline void up_spin(struct spinaphore *ss) | ||
| 119 | { | ||
| 120 | atomic_add(1, &ss->cur); | ||
| 121 | } | ||
| 122 | |||
| 123 | static struct spinaphore ptcg_sem; | ||
| 124 | static u16 nptcg = 1; | ||
| 125 | static int need_ptcg_sem = 1; | ||
| 126 | static int toolatetochangeptcgsem = 0; | ||
| 127 | |||
| 128 | /* | ||
| 129 | * Kernel parameter "nptcg=" overrides max number of concurrent global TLB | ||
| 130 | * purges which is reported from either PAL or SAL PALO. | ||
| 131 | * | ||
| 132 | * We don't have sanity checking for nptcg value. It's the user's responsibility | ||
| 133 | * for valid nptcg value on the platform. Otherwise, kernel may hang in some | ||
| 134 | * cases. | ||
| 135 | */ | ||
| 136 | static int __init | ||
| 137 | set_nptcg(char *str) | ||
| 138 | { | ||
| 139 | int value = 0; | ||
| 140 | |||
| 141 | get_option(&str, &value); | ||
| 142 | setup_ptcg_sem(value, NPTCG_FROM_KERNEL_PARAMETER); | ||
| 143 | |||
| 144 | return 1; | ||
| 145 | } | ||
| 146 | |||
| 147 | __setup("nptcg=", set_nptcg); | ||
| 148 | |||
| 149 | /* | ||
| 150 | * Maximum number of simultaneous ptc.g purges in the system can | ||
| 151 | * be defined by PAL_VM_SUMMARY (in which case we should take | ||
| 152 | * the smallest value for any cpu in the system) or by the PAL | ||
| 153 | * override table (in which case we should ignore the value from | ||
| 154 | * PAL_VM_SUMMARY). | ||
| 155 | * | ||
| 156 | * Kernel parameter "nptcg=" overrides maximum number of simultanesous ptc.g | ||
| 157 | * purges defined in either PAL_VM_SUMMARY or PAL override table. In this case, | ||
| 158 | * we should ignore the value from either PAL_VM_SUMMARY or PAL override table. | ||
| 159 | * | ||
| 160 | * Complicating the logic here is the fact that num_possible_cpus() | ||
| 161 | * isn't fully setup until we start bringing cpus online. | ||
| 162 | */ | ||
| 163 | void | ||
| 164 | setup_ptcg_sem(int max_purges, int nptcg_from) | ||
| 165 | { | ||
| 166 | static int kp_override; | ||
| 167 | static int palo_override; | ||
| 168 | static int firstcpu = 1; | ||
| 169 | |||
| 170 | if (toolatetochangeptcgsem) { | ||
| 171 | BUG_ON(max_purges < nptcg); | ||
| 172 | return; | ||
| 173 | } | ||
| 174 | |||
| 175 | if (nptcg_from == NPTCG_FROM_KERNEL_PARAMETER) { | ||
| 176 | kp_override = 1; | ||
| 177 | nptcg = max_purges; | ||
| 178 | goto resetsema; | ||
| 179 | } | ||
| 180 | if (kp_override) { | ||
| 181 | need_ptcg_sem = num_possible_cpus() > nptcg; | ||
| 182 | return; | ||
| 183 | } | ||
| 184 | |||
| 185 | if (nptcg_from == NPTCG_FROM_PALO) { | ||
| 186 | palo_override = 1; | ||
| 187 | |||
| 188 | /* In PALO max_purges == 0 really means it! */ | ||
| 189 | if (max_purges == 0) | ||
| 190 | panic("Whoa! Platform does not support global TLB purges.\n"); | ||
| 191 | nptcg = max_purges; | ||
| 192 | if (nptcg == PALO_MAX_TLB_PURGES) { | ||
| 193 | need_ptcg_sem = 0; | ||
| 194 | return; | ||
| 195 | } | ||
| 196 | goto resetsema; | ||
| 197 | } | ||
| 198 | if (palo_override) { | ||
| 199 | if (nptcg != PALO_MAX_TLB_PURGES) | ||
| 200 | need_ptcg_sem = (num_possible_cpus() > nptcg); | ||
| 201 | return; | ||
| 202 | } | ||
| 203 | |||
| 204 | /* In PAL_VM_SUMMARY max_purges == 0 actually means 1 */ | ||
| 205 | if (max_purges == 0) max_purges = 1; | ||
| 206 | |||
| 207 | if (firstcpu) { | ||
| 208 | nptcg = max_purges; | ||
| 209 | firstcpu = 0; | ||
| 210 | } | ||
| 211 | if (max_purges < nptcg) | ||
| 212 | nptcg = max_purges; | ||
| 213 | if (nptcg == PAL_MAX_PURGES) { | ||
| 214 | need_ptcg_sem = 0; | ||
| 215 | return; | ||
| 216 | } else | ||
| 217 | need_ptcg_sem = (num_possible_cpus() > nptcg); | ||
| 218 | |||
| 219 | resetsema: | ||
| 220 | spinaphore_init(&ptcg_sem, max_purges); | ||
| 221 | } | ||
| 222 | |||
| 93 | void | 223 | void |
| 94 | ia64_global_tlb_purge (struct mm_struct *mm, unsigned long start, | 224 | ia64_global_tlb_purge (struct mm_struct *mm, unsigned long start, |
| 95 | unsigned long end, unsigned long nbits) | 225 | unsigned long end, unsigned long nbits) |
| 96 | { | 226 | { |
| 97 | static DEFINE_SPINLOCK(ptcg_lock); | ||
| 98 | |||
| 99 | struct mm_struct *active_mm = current->active_mm; | 227 | struct mm_struct *active_mm = current->active_mm; |
| 100 | 228 | ||
| 229 | toolatetochangeptcgsem = 1; | ||
| 230 | |||
| 101 | if (mm != active_mm) { | 231 | if (mm != active_mm) { |
| 102 | /* Restore region IDs for mm */ | 232 | /* Restore region IDs for mm */ |
| 103 | if (mm && active_mm) { | 233 | if (mm && active_mm) { |
| @@ -108,19 +238,20 @@ ia64_global_tlb_purge (struct mm_struct *mm, unsigned long start, | |||
| 108 | } | 238 | } |
| 109 | } | 239 | } |
| 110 | 240 | ||
| 111 | /* HW requires global serialization of ptc.ga. */ | 241 | if (need_ptcg_sem) |
| 112 | spin_lock(&ptcg_lock); | 242 | down_spin(&ptcg_sem); |
| 113 | { | 243 | |
| 114 | do { | 244 | do { |
| 115 | /* | 245 | /* |
| 116 | * Flush ALAT entries also. | 246 | * Flush ALAT entries also. |
| 117 | */ | 247 | */ |
| 118 | ia64_ptcga(start, (nbits<<2)); | 248 | ia64_ptcga(start, (nbits << 2)); |
| 119 | ia64_srlz_i(); | 249 | ia64_srlz_i(); |
| 120 | start += (1UL << nbits); | 250 | start += (1UL << nbits); |
| 121 | } while (start < end); | 251 | } while (start < end); |
| 122 | } | 252 | |
| 123 | spin_unlock(&ptcg_lock); | 253 | if (need_ptcg_sem) |
| 254 | up_spin(&ptcg_sem); | ||
| 124 | 255 | ||
| 125 | if (mm != active_mm) { | 256 | if (mm != active_mm) { |
| 126 | activate_context(active_mm); | 257 | activate_context(active_mm); |
diff --git a/include/asm-ia64/sal.h b/include/asm-ia64/sal.h index f4904db3b057..89594b442f83 100644 --- a/include/asm-ia64/sal.h +++ b/include/asm-ia64/sal.h | |||
| @@ -296,6 +296,9 @@ enum { | |||
| 296 | EFI_GUID(0xe429faf8, 0x3cb7, 0x11d4, 0xbc, 0xa7, 0x0, 0x80, 0xc7, 0x3c, 0x88, 0x81) | 296 | EFI_GUID(0xe429faf8, 0x3cb7, 0x11d4, 0xbc, 0xa7, 0x0, 0x80, 0xc7, 0x3c, 0x88, 0x81) |
| 297 | #define SAL_PLAT_BUS_ERR_SECT_GUID \ | 297 | #define SAL_PLAT_BUS_ERR_SECT_GUID \ |
| 298 | EFI_GUID(0xe429faf9, 0x3cb7, 0x11d4, 0xbc, 0xa7, 0x0, 0x80, 0xc7, 0x3c, 0x88, 0x81) | 298 | EFI_GUID(0xe429faf9, 0x3cb7, 0x11d4, 0xbc, 0xa7, 0x0, 0x80, 0xc7, 0x3c, 0x88, 0x81) |
| 299 | #define PROCESSOR_ABSTRACTION_LAYER_OVERWRITE_GUID \ | ||
| 300 | EFI_GUID(0x6cb0a200, 0x893a, 0x11da, 0x96, 0xd2, 0x0, 0x10, 0x83, 0xff, \ | ||
| 301 | 0xca, 0x4d) | ||
| 299 | 302 | ||
| 300 | #define MAX_CACHE_ERRORS 6 | 303 | #define MAX_CACHE_ERRORS 6 |
| 301 | #define MAX_TLB_ERRORS 6 | 304 | #define MAX_TLB_ERRORS 6 |
| @@ -879,6 +882,24 @@ extern void ia64_jump_to_sal(struct sal_to_os_boot *); | |||
| 879 | 882 | ||
| 880 | extern void ia64_sal_handler_init(void *entry_point, void *gpval); | 883 | extern void ia64_sal_handler_init(void *entry_point, void *gpval); |
| 881 | 884 | ||
| 885 | #define PALO_MAX_TLB_PURGES 0xFFFF | ||
| 886 | #define PALO_SIG "PALO" | ||
| 887 | |||
| 888 | struct palo_table { | ||
| 889 | u8 signature[4]; /* Should be "PALO" */ | ||
| 890 | u32 length; | ||
| 891 | u8 minor_revision; | ||
| 892 | u8 major_revision; | ||
| 893 | u8 checksum; | ||
| 894 | u8 reserved1[5]; | ||
| 895 | u16 max_tlb_purges; | ||
| 896 | u8 reserved2[6]; | ||
| 897 | }; | ||
| 898 | |||
| 899 | #define NPTCG_FROM_PAL 0 | ||
| 900 | #define NPTCG_FROM_PALO 1 | ||
| 901 | #define NPTCG_FROM_KERNEL_PARAMETER 2 | ||
| 902 | |||
| 882 | #endif /* __ASSEMBLY__ */ | 903 | #endif /* __ASSEMBLY__ */ |
| 883 | 904 | ||
| 884 | #endif /* _ASM_IA64_SAL_H */ | 905 | #endif /* _ASM_IA64_SAL_H */ |
diff --git a/include/asm-ia64/tlbflush.h b/include/asm-ia64/tlbflush.h index 7774a1cac0cc..3be25dfed164 100644 --- a/include/asm-ia64/tlbflush.h +++ b/include/asm-ia64/tlbflush.h | |||
| @@ -17,6 +17,7 @@ | |||
| 17 | * Now for some TLB flushing routines. This is the kind of stuff that | 17 | * Now for some TLB flushing routines. This is the kind of stuff that |
| 18 | * can be very expensive, so try to avoid them whenever possible. | 18 | * can be very expensive, so try to avoid them whenever possible. |
| 19 | */ | 19 | */ |
| 20 | extern void setup_ptcg_sem(int max_purges, int from_palo); | ||
| 20 | 21 | ||
| 21 | /* | 22 | /* |
| 22 | * Flush everything (kernel mapping may also have changed due to | 23 | * Flush everything (kernel mapping may also have changed due to |
