diff options
author | Naoya Horiguchi <n-horiguchi@ah.jp.nec.com> | 2010-04-06 17:35:04 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2010-04-07 11:38:04 -0400 |
commit | 116354d177ba2da37e91cf884e3d11e67f825efd (patch) | |
tree | 150227e8a5c9ce8b6dd9333593ed513c8c012686 /fs | |
parent | 57119c34e53bbb8d244c3ff1335ef5145768538f (diff) |
pagemap: fix pfn calculation for hugepage
When we look into pagemap using page-types with option -p, the value of
pfn for hugepages looks wrong (see below). This is because the pte was
evaluated only once per vma, although it should be re-evaluated for each
hugepage. This patch fixes it.
$ page-types -p 3277 -Nl -b huge
voffset offset len flags
7f21e8a00 11e400 1 ___U___________H_G________________
7f21e8a01 11e401 1ff ________________TG________________
^^^
7f21e8c00 11e400 1 ___U___________H_G________________
7f21e8c01 11e401 1ff ________________TG________________
^^^
On x86_64, one hugepage consists of 1 head page and 511 tail pages, and
each pair of lines above represents one hugepage. Voffset and offset are
the virtual address and the physical address in units of pages,
respectively. Different hugepages should not have the same offset value.
With this patch applied:
$ page-types -p 3386 -Nl -b huge
voffset offset len flags
7fec7a600 112c00 1 ___UD__________H_G________________
7fec7a601 112c01 1ff ________________TG________________
^^^
7fec7a800 113200 1 ___UD__________H_G________________
7fec7a801 113201 1ff ________________TG________________
^^^
OK
More info:
- This patch modifies walk_page_range()'s hugepage walker. However, the
change only affects pagemap_read(), which is the only caller of the
hugepage callback.
- Without this patch, the hugetlb_entry() callback is called once per vma,
which doesn't match the natural expectation from its name.
- With this patch, hugetlb_entry() is called per hugepte entry and the
callback can become much simpler.
Signed-off-by: Naoya Horiguchi <n-horiguchi@ah.jp.nec.com>
Signed-off-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Acked-by: Matt Mackall <mpm@selenic.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'fs')
-rw-r--r-- | fs/proc/task_mmu.c | 27 |
1 files changed, 7 insertions, 20 deletions
diff --git a/fs/proc/task_mmu.c b/fs/proc/task_mmu.c index a05a669510a4..070553427dd5 100644 --- a/fs/proc/task_mmu.c +++ b/fs/proc/task_mmu.c | |||
@@ -662,31 +662,18 @@ static u64 huge_pte_to_pagemap_entry(pte_t pte, int offset) | |||
662 | return pme; | 662 | return pme; |
663 | } | 663 | } |
664 | 664 | ||
665 | static int pagemap_hugetlb_range(pte_t *pte, unsigned long addr, | 665 | /* This function walks within one hugetlb entry in the single call */ |
666 | unsigned long end, struct mm_walk *walk) | 666 | static int pagemap_hugetlb_range(pte_t *pte, unsigned long hmask, |
667 | unsigned long addr, unsigned long end, | ||
668 | struct mm_walk *walk) | ||
667 | { | 669 | { |
668 | struct vm_area_struct *vma; | ||
669 | struct pagemapread *pm = walk->private; | 670 | struct pagemapread *pm = walk->private; |
670 | struct hstate *hs = NULL; | ||
671 | int err = 0; | 671 | int err = 0; |
672 | u64 pfn; | ||
672 | 673 | ||
673 | vma = find_vma(walk->mm, addr); | ||
674 | if (vma) | ||
675 | hs = hstate_vma(vma); | ||
676 | for (; addr != end; addr += PAGE_SIZE) { | 674 | for (; addr != end; addr += PAGE_SIZE) { |
677 | u64 pfn = PM_NOT_PRESENT; | 675 | int offset = (addr & ~hmask) >> PAGE_SHIFT; |
678 | 676 | pfn = huge_pte_to_pagemap_entry(*pte, offset); | |
679 | if (vma && (addr >= vma->vm_end)) { | ||
680 | vma = find_vma(walk->mm, addr); | ||
681 | if (vma) | ||
682 | hs = hstate_vma(vma); | ||
683 | } | ||
684 | |||
685 | if (vma && (vma->vm_start <= addr) && is_vm_hugetlb_page(vma)) { | ||
686 | /* calculate pfn of the "raw" page in the hugepage. */ | ||
687 | int offset = (addr & ~huge_page_mask(hs)) >> PAGE_SHIFT; | ||
688 | pfn = huge_pte_to_pagemap_entry(*pte, offset); | ||
689 | } | ||
690 | err = add_to_pagemap(addr, pfn, pm); | 677 | err = add_to_pagemap(addr, pfn, pm); |
691 | if (err) | 678 | if (err) |
692 | return err; | 679 | return err; |