diff options
author | KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com> | 2009-01-07 21:08:18 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2009-01-08 11:31:08 -0500 |
commit | 14797e2363c2b2f1ce139fd1c5a215e4e05aa1d9 (patch) | |
tree | a56edaa680c7c338a5a3043aa24897d7f668b6c9 /mm/memcontrol.c | |
parent | 549927620b04a8f8073ce2ee2a8977f209af2ee5 (diff) |
memcg: add inactive_anon_is_low()
inactive_anon_is_low() is a key component of active/inactive anon
balancing during reclaim. However, the current inactive_anon_is_low()
function only considers global reclaim.
Therefore, we need the following ugly scan_global_lru() condition:
    if (lru == LRU_ACTIVE_ANON &&
        (!scan_global_lru(sc) || inactive_anon_is_low(zone))) {
            shrink_active_list(nr_to_scan, zone, sc, priority, file);
            return 0;
    }
This causes memcg reclaim to always deactivate pages whenever shrink_list()
is called. Introducing mem_cgroup_inactive_anon_is_low() improves the
active/inactive anon balancing of memory cgroups.
Acked-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Acked-by: Rik van Riel <riel@redhat.com>
Signed-off-by: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com>
Cc: Cyrill Gorcunov <gorcunov@gmail.com>
Cc: "Pekka Enberg" <penberg@cs.helsinki.fi>
Cc: Balbir Singh <balbir@in.ibm.com>
Cc: Daisuke Nishimura <nishimura@mxp.nes.nec.co.jp>
Cc: Hugh Dickins <hugh@veritas.com>
Cc: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/memcontrol.c')
-rw-r--r-- | mm/memcontrol.c | 46 |
1 files changed, 45 insertions, 1 deletions
diff --git a/mm/memcontrol.c b/mm/memcontrol.c index 457d671029b8..6611328460e9 100644 --- a/mm/memcontrol.c +++ b/mm/memcontrol.c | |||
@@ -156,6 +156,9 @@ struct mem_cgroup { | |||
156 | unsigned long last_oom_jiffies; | 156 | unsigned long last_oom_jiffies; |
157 | int obsolete; | 157 | int obsolete; |
158 | atomic_t refcnt; | 158 | atomic_t refcnt; |
159 | |||
160 | unsigned int inactive_ratio; | ||
161 | |||
159 | /* | 162 | /* |
160 | * statistics. This must be placed at the end of memcg. | 163 | * statistics. This must be placed at the end of memcg. |
161 | */ | 164 | */ |
@@ -431,6 +434,20 @@ long mem_cgroup_calc_reclaim(struct mem_cgroup *mem, struct zone *zone, | |||
431 | return (nr_pages >> priority); | 434 | return (nr_pages >> priority); |
432 | } | 435 | } |
433 | 436 | ||
437 | int mem_cgroup_inactive_anon_is_low(struct mem_cgroup *memcg, struct zone *zone) | ||
438 | { | ||
439 | unsigned long active; | ||
440 | unsigned long inactive; | ||
441 | |||
442 | inactive = mem_cgroup_get_all_zonestat(memcg, LRU_INACTIVE_ANON); | ||
443 | active = mem_cgroup_get_all_zonestat(memcg, LRU_ACTIVE_ANON); | ||
444 | |||
445 | if (inactive * memcg->inactive_ratio < active) | ||
446 | return 1; | ||
447 | |||
448 | return 0; | ||
449 | } | ||
450 | |||
434 | unsigned long mem_cgroup_isolate_pages(unsigned long nr_to_scan, | 451 | unsigned long mem_cgroup_isolate_pages(unsigned long nr_to_scan, |
435 | struct list_head *dst, | 452 | struct list_head *dst, |
436 | unsigned long *scanned, int order, | 453 | unsigned long *scanned, int order, |
@@ -1360,6 +1377,29 @@ int mem_cgroup_shrink_usage(struct mm_struct *mm, gfp_t gfp_mask) | |||
1360 | return 0; | 1377 | return 0; |
1361 | } | 1378 | } |
1362 | 1379 | ||
1380 | /* | ||
1381 | * The inactive anon list should be small enough that the VM never has to | ||
1382 | * do too much work, but large enough that each inactive page has a chance | ||
1383 | * to be referenced again before it is swapped out. | ||
1384 | * | ||
1385 | * this calculation is straightforward porting from | ||
1386 | * page_alloc.c::setup_per_zone_inactive_ratio(). | ||
1387 | * it describe more detail. | ||
1388 | */ | ||
1389 | static void mem_cgroup_set_inactive_ratio(struct mem_cgroup *memcg) | ||
1390 | { | ||
1391 | unsigned int gb, ratio; | ||
1392 | |||
1393 | gb = res_counter_read_u64(&memcg->res, RES_LIMIT) >> 30; | ||
1394 | if (gb) | ||
1395 | ratio = int_sqrt(10 * gb); | ||
1396 | else | ||
1397 | ratio = 1; | ||
1398 | |||
1399 | memcg->inactive_ratio = ratio; | ||
1400 | |||
1401 | } | ||
1402 | |||
1363 | static DEFINE_MUTEX(set_limit_mutex); | 1403 | static DEFINE_MUTEX(set_limit_mutex); |
1364 | 1404 | ||
1365 | static int mem_cgroup_resize_limit(struct mem_cgroup *memcg, | 1405 | static int mem_cgroup_resize_limit(struct mem_cgroup *memcg, |
@@ -1398,6 +1438,10 @@ static int mem_cgroup_resize_limit(struct mem_cgroup *memcg, | |||
1398 | GFP_KERNEL, false); | 1438 | GFP_KERNEL, false); |
1399 | if (!progress) retry_count--; | 1439 | if (!progress) retry_count--; |
1400 | } | 1440 | } |
1441 | |||
1442 | if (!ret) | ||
1443 | mem_cgroup_set_inactive_ratio(memcg); | ||
1444 | |||
1401 | return ret; | 1445 | return ret; |
1402 | } | 1446 | } |
1403 | 1447 | ||
@@ -1982,7 +2026,7 @@ mem_cgroup_create(struct cgroup_subsys *ss, struct cgroup *cont) | |||
1982 | res_counter_init(&mem->res, NULL); | 2026 | res_counter_init(&mem->res, NULL); |
1983 | res_counter_init(&mem->memsw, NULL); | 2027 | res_counter_init(&mem->memsw, NULL); |
1984 | } | 2028 | } |
1985 | 2029 | mem_cgroup_set_inactive_ratio(mem); | |
1986 | mem->last_scanned_child = NULL; | 2030 | mem->last_scanned_child = NULL; |
1987 | 2031 | ||
1988 | return &mem->css; | 2032 | return &mem->css; |