aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorDavid Gibson <david@gibson.dropbear.id.au>2009-10-26 15:24:31 -0400
committerBenjamin Herrenschmidt <benh@kernel.crashing.org>2009-10-30 02:20:58 -0400
commitd1837cba5d5d5458c09f0a2849db2d3c203cb8e9 (patch)
tree144a4eb43ed6b9909133dc1ac0619d813e4cb131
parenta4fe3ce7699bfe1bd88f816b55d42d8fe1dac655 (diff)
powerpc/mm: Cleanup initialization of hugepages on powerpc
This patch simplifies the logic used to initialize hugepages on powerpc. The somewhat oddly named set_huge_psize() is renamed to add_huge_page_size() and now does all necessary verification of whether it's given a valid hugepage sizes (instead of just some) and instantiates the generic hstate structure (but no more). hugetlbpage_init() now steps through the available pagesizes, checks if they're valid for hugepages by calling add_huge_page_size() and initializes the kmem_caches for the hugepage pagetables. This means we can now eliminate the mmu_huge_psizes array, since we no longer need to pass the sizing information for the pagetable caches from set_huge_psize() into hugetlbpage_init() Determination of the default huge page size is also moved from the hash code into the general hugepage code. Signed-off-by: David Gibson <dwg@au1.ibm.com> Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
-rw-r--r--arch/powerpc/include/asm/page_64.h2
-rw-r--r--arch/powerpc/mm/hash_utils_64.c10
-rw-r--r--arch/powerpc/mm/hugetlbpage.c128
3 files changed, 63 insertions, 77 deletions
diff --git a/arch/powerpc/include/asm/page_64.h b/arch/powerpc/include/asm/page_64.h
index 3f17b83f55a1..bfc4e027e2ad 100644
--- a/arch/powerpc/include/asm/page_64.h
+++ b/arch/powerpc/include/asm/page_64.h
@@ -90,7 +90,7 @@ extern unsigned int HPAGE_SHIFT;
90#define HPAGE_SIZE ((1UL) << HPAGE_SHIFT) 90#define HPAGE_SIZE ((1UL) << HPAGE_SHIFT)
91#define HPAGE_MASK (~(HPAGE_SIZE - 1)) 91#define HPAGE_MASK (~(HPAGE_SIZE - 1))
92#define HUGETLB_PAGE_ORDER (HPAGE_SHIFT - PAGE_SHIFT) 92#define HUGETLB_PAGE_ORDER (HPAGE_SHIFT - PAGE_SHIFT)
93#define HUGE_MAX_HSTATE 3 93#define HUGE_MAX_HSTATE (MMU_PAGE_COUNT-1)
94 94
95#endif /* __ASSEMBLY__ */ 95#endif /* __ASSEMBLY__ */
96 96
diff --git a/arch/powerpc/mm/hash_utils_64.c b/arch/powerpc/mm/hash_utils_64.c
index 485dcd197a61..ef1f047f5431 100644
--- a/arch/powerpc/mm/hash_utils_64.c
+++ b/arch/powerpc/mm/hash_utils_64.c
@@ -481,16 +481,6 @@ static void __init htab_init_page_sizes(void)
481#ifdef CONFIG_HUGETLB_PAGE 481#ifdef CONFIG_HUGETLB_PAGE
482 /* Reserve 16G huge page memory sections for huge pages */ 482 /* Reserve 16G huge page memory sections for huge pages */
483 of_scan_flat_dt(htab_dt_scan_hugepage_blocks, NULL); 483 of_scan_flat_dt(htab_dt_scan_hugepage_blocks, NULL);
484
485/* Set default large page size. Currently, we pick 16M or 1M depending
486 * on what is available
487 */
488 if (mmu_psize_defs[MMU_PAGE_16M].shift)
489 HPAGE_SHIFT = mmu_psize_defs[MMU_PAGE_16M].shift;
490 /* With 4k/4level pagetables, we can't (for now) cope with a
491 * huge page size < PMD_SIZE */
492 else if (mmu_psize_defs[MMU_PAGE_1M].shift)
493 HPAGE_SHIFT = mmu_psize_defs[MMU_PAGE_1M].shift;
494#endif /* CONFIG_HUGETLB_PAGE */ 484#endif /* CONFIG_HUGETLB_PAGE */
495} 485}
496 486
diff --git a/arch/powerpc/mm/hugetlbpage.c b/arch/powerpc/mm/hugetlbpage.c
index 95220a5dee58..a7161c07886d 100644
--- a/arch/powerpc/mm/hugetlbpage.c
+++ b/arch/powerpc/mm/hugetlbpage.c
@@ -37,27 +37,17 @@
37static unsigned long gpage_freearray[MAX_NUMBER_GPAGES]; 37static unsigned long gpage_freearray[MAX_NUMBER_GPAGES];
38static unsigned nr_gpages; 38static unsigned nr_gpages;
39 39
40/* Array of valid huge page sizes - non-zero value(hugepte_shift) is
41 * stored for the huge page sizes that are valid.
42 */
43static unsigned int mmu_huge_psizes[MMU_PAGE_COUNT] = { }; /* initialize all to 0 */
44
45/* Flag to mark huge PD pointers. This means pmd_bad() and pud_bad() 40/* Flag to mark huge PD pointers. This means pmd_bad() and pud_bad()
46 * will choke on pointers to hugepte tables, which is handy for 41 * will choke on pointers to hugepte tables, which is handy for
47 * catching screwups early. */ 42 * catching screwups early. */
48 43
49static inline int shift_to_mmu_psize(unsigned int shift) 44static inline int shift_to_mmu_psize(unsigned int shift)
50{ 45{
51 switch (shift) { 46 int psize;
52#ifndef CONFIG_PPC_64K_PAGES 47
53 case PAGE_SHIFT_64K: 48 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize)
54 return MMU_PAGE_64K; 49 if (mmu_psize_defs[psize].shift == shift)
55#endif 50 return psize;
56 case PAGE_SHIFT_16M:
57 return MMU_PAGE_16M;
58 case PAGE_SHIFT_16G:
59 return MMU_PAGE_16G;
60 }
61 return -1; 51 return -1;
62} 52}
63 53
@@ -502,8 +492,6 @@ unsigned long hugetlb_get_unmapped_area(struct file *file, unsigned long addr,
502 struct hstate *hstate = hstate_file(file); 492 struct hstate *hstate = hstate_file(file);
503 int mmu_psize = shift_to_mmu_psize(huge_page_shift(hstate)); 493 int mmu_psize = shift_to_mmu_psize(huge_page_shift(hstate));
504 494
505 if (!mmu_huge_psizes[mmu_psize])
506 return -EINVAL;
507 return slice_get_unmapped_area(addr, len, flags, mmu_psize, 1, 0); 495 return slice_get_unmapped_area(addr, len, flags, mmu_psize, 1, 0);
508} 496}
509 497
@@ -666,47 +654,46 @@ repeat:
666 return err; 654 return err;
667} 655}
668 656
669static void __init set_huge_psize(int psize) 657static int __init add_huge_page_size(unsigned long long size)
670{ 658{
671 unsigned pdshift; 659 int shift = __ffs(size);
660 int mmu_psize;
672 661
673 /* Check that it is a page size supported by the hardware and 662 /* Check that it is a page size supported by the hardware and
674 * that it fits within pagetable limits. */ 663 * that it fits within pagetable and slice limits. */
675 if (mmu_psize_defs[psize].shift && 664 if (!is_power_of_2(size)
676 mmu_psize_defs[psize].shift < SID_SHIFT_1T && 665 || (shift > SLICE_HIGH_SHIFT) || (shift <= PAGE_SHIFT))
677 (mmu_psize_defs[psize].shift > MIN_HUGEPTE_SHIFT || 666 return -EINVAL;
678 mmu_psize_defs[psize].shift == PAGE_SHIFT_64K ||
679 mmu_psize_defs[psize].shift == PAGE_SHIFT_16G)) {
680 /* Return if huge page size has already been setup or is the
681 * same as the base page size. */
682 if (mmu_huge_psizes[psize] ||
683 mmu_psize_defs[psize].shift == PAGE_SHIFT)
684 return;
685 hugetlb_add_hstate(mmu_psize_defs[psize].shift - PAGE_SHIFT);
686 667
687 if (mmu_psize_defs[psize].shift < PMD_SHIFT) 668 if ((mmu_psize = shift_to_mmu_psize(shift)) < 0)
688 pdshift = PMD_SHIFT; 669 return -EINVAL;
689 else if (mmu_psize_defs[psize].shift < PUD_SHIFT) 670
690 pdshift = PUD_SHIFT; 671#ifdef CONFIG_SPU_FS_64K_LS
691 else 672 /* Disable support for 64K huge pages when 64K SPU local store
692 pdshift = PGDIR_SHIFT; 673 * support is enabled as the current implementation conflicts.
693 mmu_huge_psizes[psize] = pdshift - mmu_psize_defs[psize].shift; 674 */
694 } 675 if (shift == PAGE_SHIFT_64K)
676 return -EINVAL;
677#endif /* CONFIG_SPU_FS_64K_LS */
678
679 BUG_ON(mmu_psize_defs[mmu_psize].shift != shift);
680
681 /* Return if huge page size has already been setup */
682 if (size_to_hstate(size))
683 return 0;
684
685 hugetlb_add_hstate(shift - PAGE_SHIFT);
686
687 return 0;
695} 688}
696 689
697static int __init hugepage_setup_sz(char *str) 690static int __init hugepage_setup_sz(char *str)
698{ 691{
699 unsigned long long size; 692 unsigned long long size;
700 int mmu_psize;
701 int shift;
702 693
703 size = memparse(str, &str); 694 size = memparse(str, &str);
704 695
705 shift = __ffs(size); 696 if (add_huge_page_size(size) != 0)
706 mmu_psize = shift_to_mmu_psize(shift);
707 if (mmu_psize >= 0 && mmu_psize_defs[mmu_psize].shift)
708 set_huge_psize(mmu_psize);
709 else
710 printk(KERN_WARNING "Invalid huge page size specified(%llu)\n", size); 697 printk(KERN_WARNING "Invalid huge page size specified(%llu)\n", size);
711 698
712 return 1; 699 return 1;
@@ -720,30 +707,39 @@ static int __init hugetlbpage_init(void)
720 if (!cpu_has_feature(CPU_FTR_16M_PAGE)) 707 if (!cpu_has_feature(CPU_FTR_16M_PAGE))
721 return -ENODEV; 708 return -ENODEV;
722 709
723 /* Add supported huge page sizes. Need to change 710 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) {
724 * HUGE_MAX_HSTATE if the number of supported huge page sizes 711 unsigned shift;
725 * changes. 712 unsigned pdshift;
726 */
727 set_huge_psize(MMU_PAGE_16M);
728 set_huge_psize(MMU_PAGE_16G);
729 713
730 /* Temporarily disable support for 64K huge pages when 64K SPU local 714 if (!mmu_psize_defs[psize].shift)
731 * store support is enabled as the current implementation conflicts. 715 continue;
732 */
733#ifndef CONFIG_SPU_FS_64K_LS
734 set_huge_psize(MMU_PAGE_64K);
735#endif
736 716
737 for (psize = 0; psize < MMU_PAGE_COUNT; ++psize) { 717 shift = mmu_psize_to_shift(psize);
738 if (mmu_huge_psizes[psize]) { 718
739 pgtable_cache_add(mmu_huge_psizes[psize], NULL); 719 if (add_huge_page_size(1ULL << shift) < 0)
740 if (!PGT_CACHE(mmu_huge_psizes[psize])) 720 continue;
741 panic("hugetlbpage_init(): could not create " 721
742 "pgtable cache for %d bit pagesize\n", 722 if (shift < PMD_SHIFT)
743 mmu_psize_to_shift(psize)); 723 pdshift = PMD_SHIFT;
744 } 724 else if (shift < PUD_SHIFT)
725 pdshift = PUD_SHIFT;
726 else
727 pdshift = PGDIR_SHIFT;
728
729 pgtable_cache_add(pdshift - shift, NULL);
730 if (!PGT_CACHE(pdshift - shift))
731 panic("hugetlbpage_init(): could not create "
732 "pgtable cache for %d bit pagesize\n", shift);
745 } 733 }
746 734
735 /* Set default large page size. Currently, we pick 16M or 1M
736 * depending on what is available
737 */
738 if (mmu_psize_defs[MMU_PAGE_16M].shift)
739 HPAGE_SHIFT = mmu_psize_defs[MMU_PAGE_16M].shift;
740 else if (mmu_psize_defs[MMU_PAGE_1M].shift)
741 HPAGE_SHIFT = mmu_psize_defs[MMU_PAGE_1M].shift;
742
747 return 0; 743 return 0;
748} 744}
749 745