diff options
author | Yinghai Lu <yinghai@kernel.org> | 2013-06-13 18:33:35 -0400 |
---|---|---|
committer | Greg Kroah-Hartman <gregkh@linuxfoundation.org> | 2013-08-04 04:51:18 -0400 |
commit | b185162885bc2346101a7b79c7737d2683b44782 (patch) | |
tree | 3513925b9a5799f8f91ee865b83097fc477baff5 /arch/x86 | |
parent | 0915f45b1275f392665df955e2e93ec459dac538 (diff) |
x86: Fix /proc/mtrr with base/size more than 44bits
commit d5c78673b1b28467354c2c30c3d4f003666ff385 upstream.
On one sytem that mtrr range is more then 44bits, in dmesg we have
[ 0.000000] MTRR default type: write-back
[ 0.000000] MTRR fixed ranges enabled:
[ 0.000000] 00000-9FFFF write-back
[ 0.000000] A0000-BFFFF uncachable
[ 0.000000] C0000-DFFFF write-through
[ 0.000000] E0000-FFFFF write-protect
[ 0.000000] MTRR variable ranges enabled:
[ 0.000000] 0 [000080000000-0000FFFFFFFF] mask 3FFF80000000 uncachable
[ 0.000000] 1 [380000000000-38FFFFFFFFFF] mask 3F0000000000 uncachable
[ 0.000000] 2 [000099000000-000099FFFFFF] mask 3FFFFF000000 write-through
[ 0.000000] 3 [00009A000000-00009AFFFFFF] mask 3FFFFF000000 write-through
[ 0.000000] 4 [381FFA000000-381FFBFFFFFF] mask 3FFFFE000000 write-through
[ 0.000000] 5 [381FFC000000-381FFC0FFFFF] mask 3FFFFFF00000 write-through
[ 0.000000] 6 [0000AD000000-0000ADFFFFFF] mask 3FFFFF000000 write-through
[ 0.000000] 7 [0000BD000000-0000BDFFFFFF] mask 3FFFFF000000 write-through
[ 0.000000] 8 disabled
[ 0.000000] 9 disabled
but /proc/mtrr report wrong:
reg00: base=0x080000000 ( 2048MB), size= 2048MB, count=1: uncachable
reg01: base=0x80000000000 (8388608MB), size=1048576MB, count=1: uncachable
reg02: base=0x099000000 ( 2448MB), size= 16MB, count=1: write-through
reg03: base=0x09a000000 ( 2464MB), size= 16MB, count=1: write-through
reg04: base=0x81ffa000000 (8519584MB), size= 32MB, count=1: write-through
reg05: base=0x81ffc000000 (8519616MB), size= 1MB, count=1: write-through
reg06: base=0x0ad000000 ( 2768MB), size= 16MB, count=1: write-through
reg07: base=0x0bd000000 ( 3024MB), size= 16MB, count=1: write-through
reg08: base=0x09b000000 ( 2480MB), size= 16MB, count=1: write-combining
so bit 44 and bit 45 get cut off.
We have problems in arch/x86/kernel/cpu/mtrr/generic.c::generic_get_mtrr().
1. for base, we miss cast base_lo to 64bit before shifting.
Fix that by adding u64 casting.
2. for size, it only can handle 44 bits aka 32bits + page_shift
Fix that with 64bit mask instead of 32bit mask_lo, then range could be
more than 44bits.
At the same time, we need to update size_or_mask for old cpus that does
support cpuid 0x80000008 to get phys_addr. Need to set high 32bits
to all 1s, otherwise will not get correct size for them.
Also fix mtrr_add_page: it should check base and (base + size - 1)
instead of base and size, as base and size could be small but
base + size could bigger enough to be out of boundary. We can
use boot_cpu_data.x86_phys_bits directly to avoid size_or_mask.
So When are we going to have size more than 44bits? that is 16TiB.
after patch we have right ouput:
reg00: base=0x080000000 ( 2048MB), size= 2048MB, count=1: uncachable
reg01: base=0x380000000000 (58720256MB), size=1048576MB, count=1: uncachable
reg02: base=0x099000000 ( 2448MB), size= 16MB, count=1: write-through
reg03: base=0x09a000000 ( 2464MB), size= 16MB, count=1: write-through
reg04: base=0x381ffa000000 (58851232MB), size= 32MB, count=1: write-through
reg05: base=0x381ffc000000 (58851264MB), size= 1MB, count=1: write-through
reg06: base=0x0ad000000 ( 2768MB), size= 16MB, count=1: write-through
reg07: base=0x0bd000000 ( 3024MB), size= 16MB, count=1: write-through
reg08: base=0x09b000000 ( 2480MB), size= 16MB, count=1: write-combining
-v2: simply checking in mtrr_add_page according to hpa.
[ hpa: This probably wants to go into -stable only after having sat in
mainline for a bit. It is not a regression. ]
Signed-off-by: Yinghai Lu <yinghai@kernel.org>
Link: http://lkml.kernel.org/r/1371162815-29931-1-git-send-email-yinghai@kernel.org
Signed-off-by: H. Peter Anvin <hpa@linux.intel.com>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Diffstat (limited to 'arch/x86')
-rw-r--r-- | arch/x86/kernel/cpu/mtrr/generic.c | 21 | ||||
-rw-r--r-- | arch/x86/kernel/cpu/mtrr/main.c | 16 |
2 files changed, 20 insertions, 17 deletions
diff --git a/arch/x86/kernel/cpu/mtrr/generic.c b/arch/x86/kernel/cpu/mtrr/generic.c index fa72a39e5d46..3982357de5b0 100644 --- a/arch/x86/kernel/cpu/mtrr/generic.c +++ b/arch/x86/kernel/cpu/mtrr/generic.c | |||
@@ -510,8 +510,9 @@ generic_get_free_region(unsigned long base, unsigned long size, int replace_reg) | |||
510 | static void generic_get_mtrr(unsigned int reg, unsigned long *base, | 510 | static void generic_get_mtrr(unsigned int reg, unsigned long *base, |
511 | unsigned long *size, mtrr_type *type) | 511 | unsigned long *size, mtrr_type *type) |
512 | { | 512 | { |
513 | unsigned int mask_lo, mask_hi, base_lo, base_hi; | 513 | u32 mask_lo, mask_hi, base_lo, base_hi; |
514 | unsigned int tmp, hi; | 514 | unsigned int hi; |
515 | u64 tmp, mask; | ||
515 | 516 | ||
516 | /* | 517 | /* |
517 | * get_mtrr doesn't need to update mtrr_state, also it could be called | 518 | * get_mtrr doesn't need to update mtrr_state, also it could be called |
@@ -532,18 +533,18 @@ static void generic_get_mtrr(unsigned int reg, unsigned long *base, | |||
532 | rdmsr(MTRRphysBase_MSR(reg), base_lo, base_hi); | 533 | rdmsr(MTRRphysBase_MSR(reg), base_lo, base_hi); |
533 | 534 | ||
534 | /* Work out the shifted address mask: */ | 535 | /* Work out the shifted address mask: */ |
535 | tmp = mask_hi << (32 - PAGE_SHIFT) | mask_lo >> PAGE_SHIFT; | 536 | tmp = (u64)mask_hi << (32 - PAGE_SHIFT) | mask_lo >> PAGE_SHIFT; |
536 | mask_lo = size_or_mask | tmp; | 537 | mask = size_or_mask | tmp; |
537 | 538 | ||
538 | /* Expand tmp with high bits to all 1s: */ | 539 | /* Expand tmp with high bits to all 1s: */ |
539 | hi = fls(tmp); | 540 | hi = fls64(tmp); |
540 | if (hi > 0) { | 541 | if (hi > 0) { |
541 | tmp |= ~((1<<(hi - 1)) - 1); | 542 | tmp |= ~((1ULL<<(hi - 1)) - 1); |
542 | 543 | ||
543 | if (tmp != mask_lo) { | 544 | if (tmp != mask) { |
544 | printk(KERN_WARNING "mtrr: your BIOS has configured an incorrect mask, fixing it.\n"); | 545 | printk(KERN_WARNING "mtrr: your BIOS has configured an incorrect mask, fixing it.\n"); |
545 | add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK); | 546 | add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK); |
546 | mask_lo = tmp; | 547 | mask = tmp; |
547 | } | 548 | } |
548 | } | 549 | } |
549 | 550 | ||
@@ -551,8 +552,8 @@ static void generic_get_mtrr(unsigned int reg, unsigned long *base, | |||
551 | * This works correctly if size is a power of two, i.e. a | 552 | * This works correctly if size is a power of two, i.e. a |
552 | * contiguous range: | 553 | * contiguous range: |
553 | */ | 554 | */ |
554 | *size = -mask_lo; | 555 | *size = -mask; |
555 | *base = base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT; | 556 | *base = (u64)base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT; |
556 | *type = base_lo & 0xff; | 557 | *type = base_lo & 0xff; |
557 | 558 | ||
558 | out_put_cpu: | 559 | out_put_cpu: |
diff --git a/arch/x86/kernel/cpu/mtrr/main.c b/arch/x86/kernel/cpu/mtrr/main.c index 726bf963c227..ca22b73aaa25 100644 --- a/arch/x86/kernel/cpu/mtrr/main.c +++ b/arch/x86/kernel/cpu/mtrr/main.c | |||
@@ -305,7 +305,8 @@ int mtrr_add_page(unsigned long base, unsigned long size, | |||
305 | return -EINVAL; | 305 | return -EINVAL; |
306 | } | 306 | } |
307 | 307 | ||
308 | if (base & size_or_mask || size & size_or_mask) { | 308 | if ((base | (base + size - 1)) >> |
309 | (boot_cpu_data.x86_phys_bits - PAGE_SHIFT)) { | ||
309 | pr_warning("mtrr: base or size exceeds the MTRR width\n"); | 310 | pr_warning("mtrr: base or size exceeds the MTRR width\n"); |
310 | return -EINVAL; | 311 | return -EINVAL; |
311 | } | 312 | } |
@@ -583,6 +584,7 @@ static struct syscore_ops mtrr_syscore_ops = { | |||
583 | 584 | ||
584 | int __initdata changed_by_mtrr_cleanup; | 585 | int __initdata changed_by_mtrr_cleanup; |
585 | 586 | ||
587 | #define SIZE_OR_MASK_BITS(n) (~((1ULL << ((n) - PAGE_SHIFT)) - 1)) | ||
586 | /** | 588 | /** |
587 | * mtrr_bp_init - initialize mtrrs on the boot CPU | 589 | * mtrr_bp_init - initialize mtrrs on the boot CPU |
588 | * | 590 | * |
@@ -600,7 +602,7 @@ void __init mtrr_bp_init(void) | |||
600 | 602 | ||
601 | if (cpu_has_mtrr) { | 603 | if (cpu_has_mtrr) { |
602 | mtrr_if = &generic_mtrr_ops; | 604 | mtrr_if = &generic_mtrr_ops; |
603 | size_or_mask = 0xff000000; /* 36 bits */ | 605 | size_or_mask = SIZE_OR_MASK_BITS(36); |
604 | size_and_mask = 0x00f00000; | 606 | size_and_mask = 0x00f00000; |
605 | phys_addr = 36; | 607 | phys_addr = 36; |
606 | 608 | ||
@@ -619,7 +621,7 @@ void __init mtrr_bp_init(void) | |||
619 | boot_cpu_data.x86_mask == 0x4)) | 621 | boot_cpu_data.x86_mask == 0x4)) |
620 | phys_addr = 36; | 622 | phys_addr = 36; |
621 | 623 | ||
622 | size_or_mask = ~((1ULL << (phys_addr - PAGE_SHIFT)) - 1); | 624 | size_or_mask = SIZE_OR_MASK_BITS(phys_addr); |
623 | size_and_mask = ~size_or_mask & 0xfffff00000ULL; | 625 | size_and_mask = ~size_or_mask & 0xfffff00000ULL; |
624 | } else if (boot_cpu_data.x86_vendor == X86_VENDOR_CENTAUR && | 626 | } else if (boot_cpu_data.x86_vendor == X86_VENDOR_CENTAUR && |
625 | boot_cpu_data.x86 == 6) { | 627 | boot_cpu_data.x86 == 6) { |
@@ -627,7 +629,7 @@ void __init mtrr_bp_init(void) | |||
627 | * VIA C* family have Intel style MTRRs, | 629 | * VIA C* family have Intel style MTRRs, |
628 | * but don't support PAE | 630 | * but don't support PAE |
629 | */ | 631 | */ |
630 | size_or_mask = 0xfff00000; /* 32 bits */ | 632 | size_or_mask = SIZE_OR_MASK_BITS(32); |
631 | size_and_mask = 0; | 633 | size_and_mask = 0; |
632 | phys_addr = 32; | 634 | phys_addr = 32; |
633 | } | 635 | } |
@@ -637,21 +639,21 @@ void __init mtrr_bp_init(void) | |||
637 | if (cpu_has_k6_mtrr) { | 639 | if (cpu_has_k6_mtrr) { |
638 | /* Pre-Athlon (K6) AMD CPU MTRRs */ | 640 | /* Pre-Athlon (K6) AMD CPU MTRRs */ |
639 | mtrr_if = mtrr_ops[X86_VENDOR_AMD]; | 641 | mtrr_if = mtrr_ops[X86_VENDOR_AMD]; |
640 | size_or_mask = 0xfff00000; /* 32 bits */ | 642 | size_or_mask = SIZE_OR_MASK_BITS(32); |
641 | size_and_mask = 0; | 643 | size_and_mask = 0; |
642 | } | 644 | } |
643 | break; | 645 | break; |
644 | case X86_VENDOR_CENTAUR: | 646 | case X86_VENDOR_CENTAUR: |
645 | if (cpu_has_centaur_mcr) { | 647 | if (cpu_has_centaur_mcr) { |
646 | mtrr_if = mtrr_ops[X86_VENDOR_CENTAUR]; | 648 | mtrr_if = mtrr_ops[X86_VENDOR_CENTAUR]; |
647 | size_or_mask = 0xfff00000; /* 32 bits */ | 649 | size_or_mask = SIZE_OR_MASK_BITS(32); |
648 | size_and_mask = 0; | 650 | size_and_mask = 0; |
649 | } | 651 | } |
650 | break; | 652 | break; |
651 | case X86_VENDOR_CYRIX: | 653 | case X86_VENDOR_CYRIX: |
652 | if (cpu_has_cyrix_arr) { | 654 | if (cpu_has_cyrix_arr) { |
653 | mtrr_if = mtrr_ops[X86_VENDOR_CYRIX]; | 655 | mtrr_if = mtrr_ops[X86_VENDOR_CYRIX]; |
654 | size_or_mask = 0xfff00000; /* 32 bits */ | 656 | size_or_mask = SIZE_OR_MASK_BITS(32); |
655 | size_and_mask = 0; | 657 | size_and_mask = 0; |
656 | } | 658 | } |
657 | break; | 659 | break; |