aboutsummaryrefslogtreecommitdiffstats
path: root/mm/huge_memory.c
diff options
context:
space:
mode:
authorMichel Lespinasse <walken@google.com>2012-10-08 19:31:39 -0400
committerLinus Torvalds <torvalds@linux-foundation.org>2012-10-09 03:22:41 -0400
commitbf181b9f9d8dfbba58b23441ad60d0bc33806d64 (patch)
tree7ad0caaf8998f31c5d910dcbb768f5a1d381b5f4 /mm/huge_memory.c
parent108d6642ad81bb1d62b401490a334d2c12397517 (diff)
mm anon rmap: replace same_anon_vma linked list with an interval tree.
When a large VMA (anon or private file mapping) is first touched, which will populate its anon_vma field, and then split into many regions through the use of mprotect(), the original anon_vma ends up linking all of the vmas on a linked list. This can cause rmap to become inefficient, as we have to walk potentially thousands of irrelevent vmas before finding the one a given anon page might fall into. By replacing the same_anon_vma linked list with an interval tree (where each avc's interval is determined by its vma's start and last pgoffs), we can make rmap efficient for this use case again. While the change is large, all of its pieces are fairly simple. Most places that were walking the same_anon_vma list were looking for a known pgoff, so they can just use the anon_vma_interval_tree_foreach() interval tree iterator instead. The exception here is ksm, where the page's index is not known. It would probably be possible to rework ksm so that the index would be known, but for now I have decided to keep things simple and just walk the entirety of the interval tree there. When updating vma's that already have an anon_vma assigned, we must take care to re-index the corresponding avc's on their interval tree. This is done through the use of anon_vma_interval_tree_pre_update_vma() and anon_vma_interval_tree_post_update_vma(), which remove the avc's from their interval tree before the update and re-insert them after the update. The anon_vma stays locked during the update, so there is no chance that rmap would miss the vmas that are being updated. Signed-off-by: Michel Lespinasse <walken@google.com> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Rik van Riel <riel@redhat.com> Cc: Peter Zijlstra <a.p.zijlstra@chello.nl> Cc: Daniel Santos <daniel.santos@pobox.com> Cc: Hugh Dickins <hughd@google.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/huge_memory.c')
-rw-r--r--mm/huge_memory.c5
1 files changed, 3 insertions, 2 deletions
diff --git a/mm/huge_memory.c b/mm/huge_memory.c
index 010d32944d14..ce59ada09462 100644
--- a/mm/huge_memory.c
+++ b/mm/huge_memory.c
@@ -1375,13 +1375,14 @@ static void __split_huge_page(struct page *page,
1375 struct anon_vma *anon_vma) 1375 struct anon_vma *anon_vma)
1376{ 1376{
1377 int mapcount, mapcount2; 1377 int mapcount, mapcount2;
1378 pgoff_t pgoff = page->index << (PAGE_CACHE_SHIFT - PAGE_SHIFT);
1378 struct anon_vma_chain *avc; 1379 struct anon_vma_chain *avc;
1379 1380
1380 BUG_ON(!PageHead(page)); 1381 BUG_ON(!PageHead(page));
1381 BUG_ON(PageTail(page)); 1382 BUG_ON(PageTail(page));
1382 1383
1383 mapcount = 0; 1384 mapcount = 0;
1384 list_for_each_entry(avc, &anon_vma->head, same_anon_vma) { 1385 anon_vma_interval_tree_foreach(avc, &anon_vma->rb_root, pgoff, pgoff) {
1385 struct vm_area_struct *vma = avc->vma; 1386 struct vm_area_struct *vma = avc->vma;
1386 unsigned long addr = vma_address(page, vma); 1387 unsigned long addr = vma_address(page, vma);
1387 BUG_ON(is_vma_temporary_stack(vma)); 1388 BUG_ON(is_vma_temporary_stack(vma));
@@ -1407,7 +1408,7 @@ static void __split_huge_page(struct page *page,
1407 __split_huge_page_refcount(page); 1408 __split_huge_page_refcount(page);
1408 1409
1409 mapcount2 = 0; 1410 mapcount2 = 0;
1410 list_for_each_entry(avc, &anon_vma->head, same_anon_vma) { 1411 anon_vma_interval_tree_foreach(avc, &anon_vma->rb_root, pgoff, pgoff) {
1411 struct vm_area_struct *vma = avc->vma; 1412 struct vm_area_struct *vma = avc->vma;
1412 unsigned long addr = vma_address(page, vma); 1413 unsigned long addr = vma_address(page, vma);
1413 BUG_ON(is_vma_temporary_stack(vma)); 1414 BUG_ON(is_vma_temporary_stack(vma));