aboutsummaryrefslogtreecommitdiffstats
path: root/mm/vmscan.c
diff options
context:
space:
mode:
Diffstat (limited to 'mm/vmscan.c')
-rw-r--r--mm/vmscan.c92
1 files changed, 46 insertions, 46 deletions
diff --git a/mm/vmscan.c b/mm/vmscan.c
index 86f8c3418795..cacdf6684971 100644
--- a/mm/vmscan.c
+++ b/mm/vmscan.c
@@ -2371,6 +2371,50 @@ out:
2371 return sc.nr_reclaimed; 2371 return sc.nr_reclaimed;
2372} 2372}
2373 2373
2374static void kswapd_try_to_sleep(pg_data_t *pgdat, int order)
2375{
2376 long remaining = 0;
2377 DEFINE_WAIT(wait);
2378
2379 if (freezing(current) || kthread_should_stop())
2380 return;
2381
2382 prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
2383
2384 /* Try to sleep for a short interval */
2385 if (!sleeping_prematurely(pgdat, order, remaining)) {
2386 remaining = schedule_timeout(HZ/10);
2387 finish_wait(&pgdat->kswapd_wait, &wait);
2388 prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
2389 }
2390
2391 /*
2392 * After a short sleep, check if it was a premature sleep. If not, then
2393 * go fully to sleep until explicitly woken up.
2394 */
2395 if (!sleeping_prematurely(pgdat, order, remaining)) {
2396 trace_mm_vmscan_kswapd_sleep(pgdat->node_id);
2397
2398 /*
2399 * vmstat counters are not perfectly accurate and the estimated
2400 * value for counters such as NR_FREE_PAGES can deviate from the
2401 * true value by nr_online_cpus * threshold. To avoid the zone
2402 * watermarks being breached while under pressure, we reduce the
2403 * per-cpu vmstat threshold while kswapd is awake and restore
2404 * them before going back to sleep.
2405 */
2406 set_pgdat_percpu_threshold(pgdat, calculate_normal_threshold);
2407 schedule();
2408 set_pgdat_percpu_threshold(pgdat, calculate_pressure_threshold);
2409 } else {
2410 if (remaining)
2411 count_vm_event(KSWAPD_LOW_WMARK_HIT_QUICKLY);
2412 else
2413 count_vm_event(KSWAPD_HIGH_WMARK_HIT_QUICKLY);
2414 }
2415 finish_wait(&pgdat->kswapd_wait, &wait);
2416}
2417
2374/* 2418/*
2375 * The background pageout daemon, started as a kernel thread 2419 * The background pageout daemon, started as a kernel thread
2376 * from the init process. 2420 * from the init process.
@@ -2389,7 +2433,7 @@ static int kswapd(void *p)
2389 unsigned long order; 2433 unsigned long order;
2390 pg_data_t *pgdat = (pg_data_t*)p; 2434 pg_data_t *pgdat = (pg_data_t*)p;
2391 struct task_struct *tsk = current; 2435 struct task_struct *tsk = current;
2392 DEFINE_WAIT(wait); 2436
2393 struct reclaim_state reclaim_state = { 2437 struct reclaim_state reclaim_state = {
2394 .reclaimed_slab = 0, 2438 .reclaimed_slab = 0,
2395 }; 2439 };
@@ -2421,7 +2465,6 @@ static int kswapd(void *p)
2421 unsigned long new_order; 2465 unsigned long new_order;
2422 int ret; 2466 int ret;
2423 2467
2424 prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
2425 new_order = pgdat->kswapd_max_order; 2468 new_order = pgdat->kswapd_max_order;
2426 pgdat->kswapd_max_order = 0; 2469 pgdat->kswapd_max_order = 0;
2427 if (order < new_order) { 2470 if (order < new_order) {
@@ -2431,52 +2474,9 @@ static int kswapd(void *p)
2431 */ 2474 */
2432 order = new_order; 2475 order = new_order;
2433 } else { 2476 } else {
2434 if (!freezing(current) && !kthread_should_stop()) { 2477 kswapd_try_to_sleep(pgdat, order);
2435 long remaining = 0;
2436
2437 /* Try to sleep for a short interval */
2438 if (!sleeping_prematurely(pgdat, order, remaining)) {
2439 remaining = schedule_timeout(HZ/10);
2440 finish_wait(&pgdat->kswapd_wait, &wait);
2441 prepare_to_wait(&pgdat->kswapd_wait, &wait, TASK_INTERRUPTIBLE);
2442 }
2443
2444 /*
2445 * After a short sleep, check if it was a
2446 * premature sleep. If not, then go fully
2447 * to sleep until explicitly woken up
2448 */
2449 if (!sleeping_prematurely(pgdat, order, remaining)) {
2450 trace_mm_vmscan_kswapd_sleep(pgdat->node_id);
2451
2452 /*
2453 * vmstat counters are not perfectly
2454 * accurate and the estimated value
2455 * for counters such as NR_FREE_PAGES
2456 * can deviate from the true value by
2457 * nr_online_cpus * threshold. To
2458 * avoid the zone watermarks being
2459 * breached while under pressure, we
2460 * reduce the per-cpu vmstat threshold
2461 * while kswapd is awake and restore
2462 * them before going back to sleep.
2463 */
2464 set_pgdat_percpu_threshold(pgdat,
2465 calculate_normal_threshold);
2466 schedule();
2467 set_pgdat_percpu_threshold(pgdat,
2468 calculate_pressure_threshold);
2469 } else {
2470 if (remaining)
2471 count_vm_event(KSWAPD_LOW_WMARK_HIT_QUICKLY);
2472 else
2473 count_vm_event(KSWAPD_HIGH_WMARK_HIT_QUICKLY);
2474 }
2475 }
2476
2477 order = pgdat->kswapd_max_order; 2478 order = pgdat->kswapd_max_order;
2478 } 2479 }
2479 finish_wait(&pgdat->kswapd_wait, &wait);
2480 2480
2481 ret = try_to_freeze(); 2481 ret = try_to_freeze();
2482 if (kthread_should_stop()) 2482 if (kthread_should_stop())