diff options
author | Mel Gorman <mel@csn.ul.ie> | 2011-01-13 18:46:22 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-01-13 20:32:37 -0500 |
commit | 0abdee2bd4118366c62349a304f81537be69af33 (patch) | |
tree | c013abd2dd49b3837d033eb4d32dfb57984d273e /mm/vmscan.c | |
parent | 1741c87757448cedd03224f01586504f9256415d (diff) |
mm: kswapd: use the order that kswapd was reclaiming at for sleeping_prematurely()
Before kswapd goes to sleep, it uses sleeping_prematurely() to check if
there was a race pushing a zone below its watermark. If the race
happened, it stays awake. However, balance_pgdat() can decide to reclaim
at order-0 if it decides that high-order reclaim is not working as
expected. This information is not passed back to sleeping_prematurely().
The impact is that kswapd remains awake reclaiming pages long after it
should have gone to sleep. This patch passes the adjusted order to
sleeping_prematurely() and uses the same logic as balance_pgdat() to decide
if it's OK to go to sleep.
Signed-off-by: Mel Gorman <mel@csn.ul.ie>
Reviewed-by: Minchan Kim <minchan.kim@gmail.com>
Reviewed-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Reviewed-by: Eric B Munson <emunson@mgebm.net>
Cc: Simon Kirby <sim@hostway.ca>
Cc: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com>
Cc: Shaohua Li <shaohua.li@intel.com>
Cc: Dave Hansen <dave@linux.vnet.ibm.com>
Cc: Johannes Weiner <hannes@cmpxchg.org>
Cc: Rik van Riel <riel@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/vmscan.c')
-rw-r--r-- | mm/vmscan.c | 16 |
1 file changed, 11 insertions, 5 deletions
diff --git a/mm/vmscan.c b/mm/vmscan.c index d3488828331a..46711f080f38 100644 --- a/mm/vmscan.c +++ b/mm/vmscan.c | |||
@@ -2227,7 +2227,7 @@ static bool pgdat_balanced(pg_data_t *pgdat, unsigned long balanced_pages, | |||
2227 | } | 2227 | } |
2228 | 2228 | ||
2229 | /* is kswapd sleeping prematurely? */ | 2229 | /* is kswapd sleeping prematurely? */ |
2230 | static int sleeping_prematurely(pg_data_t *pgdat, int order, long remaining) | 2230 | static bool sleeping_prematurely(pg_data_t *pgdat, int order, long remaining) |
2231 | { | 2231 | { |
2232 | int i; | 2232 | int i; |
2233 | unsigned long balanced = 0; | 2233 | unsigned long balanced = 0; |
@@ -2237,7 +2237,7 @@ static int sleeping_prematurely(pg_data_t *pgdat, int order, long remaining) | |||
2237 | if (remaining) | 2237 | if (remaining) |
2238 | return 1; | 2238 | return 1; |
2239 | 2239 | ||
2240 | /* If after HZ/10, a zone is below the high mark, it's premature */ | 2240 | /* Check the watermark levels */ |
2241 | for (i = 0; i < pgdat->nr_zones; i++) { | 2241 | for (i = 0; i < pgdat->nr_zones; i++) { |
2242 | struct zone *zone = pgdat->node_zones + i; | 2242 | struct zone *zone = pgdat->node_zones + i; |
2243 | 2243 | ||
@@ -2269,7 +2269,7 @@ static int sleeping_prematurely(pg_data_t *pgdat, int order, long remaining) | |||
2269 | * For kswapd, balance_pgdat() will work across all this node's zones until | 2269 | * For kswapd, balance_pgdat() will work across all this node's zones until |
2270 | * they are all at high_wmark_pages(zone). | 2270 | * they are all at high_wmark_pages(zone). |
2271 | * | 2271 | * |
2272 | * Returns the number of pages which were actually freed. | 2272 | * Returns the final order kswapd was reclaiming at |
2273 | * | 2273 | * |
2274 | * There is special handling here for zones which are full of pinned pages. | 2274 | * There is special handling here for zones which are full of pinned pages. |
2275 | * This can happen if the pages are all mlocked, or if they are all used by | 2275 | * This can happen if the pages are all mlocked, or if they are all used by |
@@ -2532,7 +2532,13 @@ out: | |||
2532 | } | 2532 | } |
2533 | } | 2533 | } |
2534 | 2534 | ||
2535 | return sc.nr_reclaimed; | 2535 | /* |
2536 | * Return the order we were reclaiming at so sleeping_prematurely() | ||
2537 | * makes a decision on the order we were last reclaiming at. However, | ||
2538 | * if another caller entered the allocator slow path while kswapd | ||
2539 | * was awake, order will remain at the higher level | ||
2540 | */ | ||
2541 | return order; | ||
2536 | } | 2542 | } |
2537 | 2543 | ||
2538 | static void kswapd_try_to_sleep(pg_data_t *pgdat, int order) | 2544 | static void kswapd_try_to_sleep(pg_data_t *pgdat, int order) |
@@ -2659,7 +2665,7 @@ static int kswapd(void *p) | |||
2659 | */ | 2665 | */ |
2660 | if (!ret) { | 2666 | if (!ret) { |
2661 | trace_mm_vmscan_kswapd_wake(pgdat->node_id, order); | 2667 | trace_mm_vmscan_kswapd_wake(pgdat->node_id, order); |
2662 | balance_pgdat(pgdat, order, classzone_idx); | 2668 | order = balance_pgdat(pgdat, order, classzone_idx); |
2663 | } | 2669 | } |
2664 | } | 2670 | } |
2665 | return 0; | 2671 | return 0; |