diff options
author | KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com> | 2011-01-13 18:47:38 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-01-13 20:32:50 -0500 |
commit | dbd4ea78f002df283c95d9774837041735fa1bf9 (patch) | |
tree | e709c6c5c026b1c230bb87ddcfe8415aaf255820 /mm | |
parent | 2a7106f2cb0768d00fe8c1eb42a754a7d8518f08 (diff) |
memcg: add lock to synchronize page accounting and migration
Introduce a new bit spin lock, PCG_MOVE_LOCK, to synchronize the page
accounting and migration code. This reworks the locking scheme of
_update_stat() and _move_account() by adding a new lock bit, PCG_MOVE_LOCK,
which is always taken with IRQs disabled.
1. If pages are being migrated from a memcg, then updates to that
memcg's page statistics are protected by grabbing PCG_MOVE_LOCK using
move_lock_page_cgroup(). In an upcoming commit, memcg dirty page
accounting will be updating memcg page accounting (specifically: num
writeback pages) from IRQ context (softirq). Avoid a deadlocking
nested spin lock attempt by disabling IRQs on the local processor when
grabbing the PCG_MOVE_LOCK.
2. The lock for update_page_stat is used only to avoid a race with
move_account(). So, the IRQ awareness of lock_page_cgroup() itself is not
a problem. The problem is between mem_cgroup_update_page_stat() and
mem_cgroup_move_account().
Trade-off:
* Changing lock_page_cgroup() to always disable IRQ (or
local_bh) has some impact on performance, and I think
it's bad to disable IRQ when it's not necessary.
* Adding a new lock makes move_account() slower. The measured
cost is shown below.
Performance Impact: moving an 8G anon process.
Before:
real 0m0.792s
user 0m0.000s
sys 0m0.780s
After:
real 0m0.854s
user 0m0.000s
sys 0m0.842s
This result is a regression, but planned optimization patches can
reduce the impact.
Signed-off-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Signed-off-by: Greg Thelen <gthelen@google.com>
Reviewed-by: Minchan Kim <minchan.kim@gmail.com>
Acked-by: Daisuke Nishimura <nishimura@mxp.nes.nec.co.jp>
Cc: Andrea Righi <arighi@develer.com>
Cc: Balbir Singh <balbir@linux.vnet.ibm.com>
Cc: Wu Fengguang <fengguang.wu@intel.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm')
-rw-r--r-- | mm/memcontrol.c | 9 |
1 files changed, 7 insertions, 2 deletions
diff --git a/mm/memcontrol.c b/mm/memcontrol.c index 3d8a0c79dece..d888956a2cfc 100644 --- a/mm/memcontrol.c +++ b/mm/memcontrol.c | |||
@@ -1606,6 +1606,7 @@ void mem_cgroup_update_page_stat(struct page *page, | |||
1606 | struct mem_cgroup *mem; | 1606 | struct mem_cgroup *mem; |
1607 | struct page_cgroup *pc = lookup_page_cgroup(page); | 1607 | struct page_cgroup *pc = lookup_page_cgroup(page); |
1608 | bool need_unlock = false; | 1608 | bool need_unlock = false; |
1609 | unsigned long uninitialized_var(flags); | ||
1609 | 1610 | ||
1610 | if (unlikely(!pc)) | 1611 | if (unlikely(!pc)) |
1611 | return; | 1612 | return; |
@@ -1617,7 +1618,7 @@ void mem_cgroup_update_page_stat(struct page *page, | |||
1617 | /* pc->mem_cgroup is unstable ? */ | 1618 | /* pc->mem_cgroup is unstable ? */ |
1618 | if (unlikely(mem_cgroup_stealed(mem))) { | 1619 | if (unlikely(mem_cgroup_stealed(mem))) { |
1619 | /* take a lock against to access pc->mem_cgroup */ | 1620 | /* take a lock against to access pc->mem_cgroup */ |
1620 | lock_page_cgroup(pc); | 1621 | move_lock_page_cgroup(pc, &flags); |
1621 | need_unlock = true; | 1622 | need_unlock = true; |
1622 | mem = pc->mem_cgroup; | 1623 | mem = pc->mem_cgroup; |
1623 | if (!mem || !PageCgroupUsed(pc)) | 1624 | if (!mem || !PageCgroupUsed(pc)) |
@@ -1640,7 +1641,7 @@ void mem_cgroup_update_page_stat(struct page *page, | |||
1640 | 1641 | ||
1641 | out: | 1642 | out: |
1642 | if (unlikely(need_unlock)) | 1643 | if (unlikely(need_unlock)) |
1643 | unlock_page_cgroup(pc); | 1644 | move_unlock_page_cgroup(pc, &flags); |
1644 | rcu_read_unlock(); | 1645 | rcu_read_unlock(); |
1645 | return; | 1646 | return; |
1646 | } | 1647 | } |
@@ -2211,9 +2212,13 @@ static int mem_cgroup_move_account(struct page_cgroup *pc, | |||
2211 | struct mem_cgroup *from, struct mem_cgroup *to, bool uncharge) | 2212 | struct mem_cgroup *from, struct mem_cgroup *to, bool uncharge) |
2212 | { | 2213 | { |
2213 | int ret = -EINVAL; | 2214 | int ret = -EINVAL; |
2215 | unsigned long flags; | ||
2216 | |||
2214 | lock_page_cgroup(pc); | 2217 | lock_page_cgroup(pc); |
2215 | if (PageCgroupUsed(pc) && pc->mem_cgroup == from) { | 2218 | if (PageCgroupUsed(pc) && pc->mem_cgroup == from) { |
2219 | move_lock_page_cgroup(pc, &flags); | ||
2216 | __mem_cgroup_move_account(pc, from, to, uncharge); | 2220 | __mem_cgroup_move_account(pc, from, to, uncharge); |
2221 | move_unlock_page_cgroup(pc, &flags); | ||
2217 | ret = 0; | 2222 | ret = 0; |
2218 | } | 2223 | } |
2219 | unlock_page_cgroup(pc); | 2224 | unlock_page_cgroup(pc); |