aboutsummaryrefslogtreecommitdiffstats
path: root/mm/memcontrol.c
diff options
context:
space:
mode:
authorHirokazu Takahashi <taka@valinux.co.jp>2008-03-04 17:29:15 -0500
committerLinus Torvalds <torvalds@woody.linux-foundation.org>2008-03-04 19:35:15 -0500
commit9b3c0a07e0fca35e36751680de3e4c76dbff5df3 (patch)
tree3dd6355a88282ea5577a05b7f2d2d3ae216ab9a8 /mm/memcontrol.c
parent2680eed723b664d83e6181ae275fac0ec8fa05ff (diff)
memcg: simplify force_empty and move_lists
As for force_empty, though this may not be the main topic here, mem_cgroup_force_empty_list() can be implemented simpler. It is possible to make the function just call mem_cgroup_uncharge_page() instead of releasing page_cgroups by itself. The tip is to call get_page() before invoking mem_cgroup_uncharge_page(), so the page won't be released during this function. Kamezawa-san points out that by the time mem_cgroup_uncharge_page() uncharges, the page might have been reassigned to an lru of a different mem_cgroup, and now be emptied from that; but Hugh claims that's okay, the end state is the same as when it hasn't gone to another list. And once force_empty stops taking lock_page_cgroup within mz->lru_lock, mem_cgroup_move_lists() can be simplified to take mz->lru_lock directly while holding page_cgroup lock (but still has to use try_lock_page_cgroup). Signed-off-by: Hirokazu Takahashi <taka@valinux.co.jp> Signed-off-by: Hugh Dickins <hugh@veritas.com> Cc: David Rientjes <rientjes@google.com> Cc: Balbir Singh <balbir@linux.vnet.ibm.com> Cc: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com> Cc: YAMAMOTO Takashi <yamamoto@valinux.co.jp> Cc: Paul Menage <menage@google.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/memcontrol.c')
-rw-r--r--mm/memcontrol.c62
1 files changed, 13 insertions, 49 deletions
diff --git a/mm/memcontrol.c b/mm/memcontrol.c
index dcbe30aad1da..f72067094e05 100644
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -353,7 +353,6 @@ int task_in_mem_cgroup(struct task_struct *task, const struct mem_cgroup *mem)
353void mem_cgroup_move_lists(struct page *page, bool active) 353void mem_cgroup_move_lists(struct page *page, bool active)
354{ 354{
355 struct page_cgroup *pc; 355 struct page_cgroup *pc;
356 struct mem_cgroup *mem;
357 struct mem_cgroup_per_zone *mz; 356 struct mem_cgroup_per_zone *mz;
358 unsigned long flags; 357 unsigned long flags;
359 358
@@ -367,35 +366,14 @@ void mem_cgroup_move_lists(struct page *page, bool active)
367 if (!try_lock_page_cgroup(page)) 366 if (!try_lock_page_cgroup(page))
368 return; 367 return;
369 368
370 /*
371 * Now page_cgroup is stable, but we cannot acquire mz->lru_lock
372 * while holding it, because mem_cgroup_force_empty_list does the
373 * reverse. Get a hold on the mem_cgroup before unlocking, so that
374 * the zoneinfo remains stable, then take mz->lru_lock; then check
375 * that page still points to pc and pc (even if freed and reassigned
376 * to that same page meanwhile) still points to the same mem_cgroup.
377 * Then we know mz still points to the right spinlock, so it's safe
378 * to move_lists (page->page_cgroup might be reset while we do so, but
379 * that doesn't matter: pc->page is stable till we drop mz->lru_lock).
380 * We're being a little naughty not to try_lock_page_cgroup again
381 * inside there, but we are safe, aren't we? Aren't we? Whistle...
382 */
383 pc = page_get_page_cgroup(page); 369 pc = page_get_page_cgroup(page);
384 if (pc) { 370 if (pc) {
385 mem = pc->mem_cgroup;
386 mz = page_cgroup_zoneinfo(pc); 371 mz = page_cgroup_zoneinfo(pc);
387 css_get(&mem->css);
388
389 unlock_page_cgroup(page);
390
391 spin_lock_irqsave(&mz->lru_lock, flags); 372 spin_lock_irqsave(&mz->lru_lock, flags);
392 if (page_get_page_cgroup(page) == pc && pc->mem_cgroup == mem) 373 __mem_cgroup_move_lists(pc, active);
393 __mem_cgroup_move_lists(pc, active);
394 spin_unlock_irqrestore(&mz->lru_lock, flags); 374 spin_unlock_irqrestore(&mz->lru_lock, flags);
395 375 }
396 css_put(&mem->css); 376 unlock_page_cgroup(page);
397 } else
398 unlock_page_cgroup(page);
399} 377}
400 378
401/* 379/*
@@ -789,7 +767,7 @@ static void mem_cgroup_force_empty_list(struct mem_cgroup *mem,
789{ 767{
790 struct page_cgroup *pc; 768 struct page_cgroup *pc;
791 struct page *page; 769 struct page *page;
792 int count; 770 int count = FORCE_UNCHARGE_BATCH;
793 unsigned long flags; 771 unsigned long flags;
794 struct list_head *list; 772 struct list_head *list;
795 773
@@ -798,35 +776,21 @@ static void mem_cgroup_force_empty_list(struct mem_cgroup *mem,
798 else 776 else
799 list = &mz->inactive_list; 777 list = &mz->inactive_list;
800 778
801 if (list_empty(list))
802 return;
803retry:
804 count = FORCE_UNCHARGE_BATCH;
805 spin_lock_irqsave(&mz->lru_lock, flags); 779 spin_lock_irqsave(&mz->lru_lock, flags);
806 780 while (!list_empty(list)) {
807 while (--count && !list_empty(list)) {
808 pc = list_entry(list->prev, struct page_cgroup, lru); 781 pc = list_entry(list->prev, struct page_cgroup, lru);
809 page = pc->page; 782 page = pc->page;
810 lock_page_cgroup(page); 783 get_page(page);
811 if (page_get_page_cgroup(page) == pc) { 784 spin_unlock_irqrestore(&mz->lru_lock, flags);
812 page_assign_page_cgroup(page, NULL); 785 mem_cgroup_uncharge_page(page);
813 unlock_page_cgroup(page); 786 put_page(page);
814 __mem_cgroup_remove_list(pc); 787 if (--count <= 0) {
815 res_counter_uncharge(&mem->res, PAGE_SIZE); 788 count = FORCE_UNCHARGE_BATCH;
816 css_put(&mem->css); 789 cond_resched();
817 kfree(pc);
818 } else {
819 /* racing uncharge: let page go then retry */
820 unlock_page_cgroup(page);
821 break;
822 } 790 }
791 spin_lock_irqsave(&mz->lru_lock, flags);
823 } 792 }
824
825 spin_unlock_irqrestore(&mz->lru_lock, flags); 793 spin_unlock_irqrestore(&mz->lru_lock, flags);
826 if (!list_empty(list)) {
827 cond_resched();
828 goto retry;
829 }
830} 794}
831 795
832/* 796/*