summaryrefslogtreecommitdiffstats
path: root/mm/compaction.c
diff options
context:
space:
mode:
authorMel Gorman <mgorman@techsingularity.net>2019-03-05 18:45:07 -0500
committerLinus Torvalds <torvalds@linux-foundation.org>2019-03-06 00:07:16 -0500
commit804d3121ba5f03af0ab225e2f688ee3ee669c0d2 (patch)
tree2b545cb4329435fb175cbb59607a426d1c2597fa /mm/compaction.c
parent5a811889de10f1ebb8e03a2744be006e909c405c (diff)
mm, compaction: avoid rescanning the same pageblock multiple times
Pageblocks are marked for skip when no pages are isolated after a scan. However, it's possible to hit corner cases where the migration scanner gets stuck near the boundary between the source and target scanner. Due to pages being migrated in blocks of COMPACT_CLUSTER_MAX, pages that are migrated can be reallocated before the pageblock is complete. The pageblock is not necessarily skipped so it can be rescanned multiple times. Similarly, a pageblock with some dirty/writeback pages may fail to migrate and be rescanned until writeback completes which is wasteful. This patch tracks if a pageblock is being rescanned. If so, then the entire pageblock will be migrated as one operation. This narrows the race window during which pages can be reallocated during migration. Secondly, if there are pages that cannot be isolated then the pageblock will still be fully scanned and marked for skipping. On the second rescan, the pageblock skip is set and the migration scanner makes progress. 5.0.0-rc1 5.0.0-rc1 findfree-v3r16 norescan-v3r16 Amean fault-both-1 0.00 ( 0.00%) 0.00 * 0.00%* Amean fault-both-3 3200.68 ( 0.00%) 3002.07 ( 6.21%) Amean fault-both-5 4847.75 ( 0.00%) 4684.47 ( 3.37%) Amean fault-both-7 6658.92 ( 0.00%) 6815.54 ( -2.35%) Amean fault-both-12 11077.62 ( 0.00%) 10864.02 ( 1.93%) Amean fault-both-18 12403.97 ( 0.00%) 12247.52 ( 1.26%) Amean fault-both-24 15607.10 ( 0.00%) 15683.99 ( -0.49%) Amean fault-both-30 18752.27 ( 0.00%) 18620.02 ( 0.71%) Amean fault-both-32 21207.54 ( 0.00%) 19250.28 * 9.23%* 5.0.0-rc1 5.0.0-rc1 findfree-v3r16 norescan-v3r16 Percentage huge-3 96.86 ( 0.00%) 95.00 ( -1.91%) Percentage huge-5 93.72 ( 0.00%) 94.22 ( 0.53%) Percentage huge-7 94.31 ( 0.00%) 92.35 ( -2.08%) Percentage huge-12 92.66 ( 0.00%) 91.90 ( -0.82%) Percentage huge-18 91.51 ( 0.00%) 89.58 ( -2.11%) Percentage huge-24 90.50 ( 0.00%) 90.03 ( -0.52%) Percentage huge-30 91.57 ( 0.00%) 89.14 ( -2.65%) Percentage huge-32 91.00 ( 0.00%) 90.58 ( -0.46%) Negligible difference but this was likely a case when the specific corner case was not hit. A previous run of the same patch based on an earlier iteration of the series showed large differences where migration rates could be halved when the corner case was hit. The specific corner case where migration scan rates go through the roof was due to a dirty/writeback pageblock located at the boundary of the migration/free scanner did not happen in this case. When it does happen, the scan rates multipled by massive margins. Link: http://lkml.kernel.org/r/20190118175136.31341-13-mgorman@techsingularity.net Signed-off-by: Mel Gorman <mgorman@techsingularity.net> Acked-by: Vlastimil Babka <vbabka@suse.cz> Cc: Andrea Arcangeli <aarcange@redhat.com> Cc: Dan Carpenter <dan.carpenter@oracle.com> Cc: David Rientjes <rientjes@google.com> Cc: YueHaibing <yuehaibing@huawei.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/compaction.c')
-rw-r--r--mm/compaction.c32
1 files changed, 26 insertions, 6 deletions
diff --git a/mm/compaction.c b/mm/compaction.c
index 6d42ea126242..00a5126b6548 100644
--- a/mm/compaction.c
+++ b/mm/compaction.c
@@ -949,8 +949,11 @@ isolate_success:
949 cc->nr_migratepages++; 949 cc->nr_migratepages++;
950 nr_isolated++; 950 nr_isolated++;
951 951
952 /* Avoid isolating too much */ 952 /*
953 if (cc->nr_migratepages == COMPACT_CLUSTER_MAX) { 953 * Avoid isolating too much unless this block is being
954 * rescanned (e.g. dirty/writeback pages, parallel allocation).
955 */
956 if (cc->nr_migratepages == COMPACT_CLUSTER_MAX && !cc->rescan) {
954 ++low_pfn; 957 ++low_pfn;
955 break; 958 break;
956 } 959 }
@@ -997,11 +1000,14 @@ isolate_abort:
997 spin_unlock_irqrestore(zone_lru_lock(zone), flags); 1000 spin_unlock_irqrestore(zone_lru_lock(zone), flags);
998 1001
999 /* 1002 /*
1000 * Updated the cached scanner pfn if the pageblock was scanned 1003 * Updated the cached scanner pfn once the pageblock has been scanned
1001 * without isolating a page. The pageblock may not be marked 1004 * Pages will either be migrated in which case there is no point
1002 * skipped already if there were no LRU pages in the block. 1005 * scanning in the near future or migration failed in which case the
1006 * failure reason may persist. The block is marked for skipping if
1007 * there were no pages isolated in the block or if the block is
1008 * rescanned twice in a row.
1003 */ 1009 */
1004 if (low_pfn == end_pfn && !nr_isolated) { 1010 if (low_pfn == end_pfn && (!nr_isolated || cc->rescan)) {
1005 if (valid_page && !skip_updated) 1011 if (valid_page && !skip_updated)
1006 set_pageblock_skip(valid_page); 1012 set_pageblock_skip(valid_page);
1007 update_cached_migrate(cc, low_pfn); 1013 update_cached_migrate(cc, low_pfn);
@@ -2035,6 +2041,20 @@ static enum compact_result compact_zone(struct compact_control *cc)
2035 int err; 2041 int err;
2036 unsigned long start_pfn = cc->migrate_pfn; 2042 unsigned long start_pfn = cc->migrate_pfn;
2037 2043
2044 /*
2045 * Avoid multiple rescans which can happen if a page cannot be
2046 * isolated (dirty/writeback in async mode) or if the migrated
2047 * pages are being allocated before the pageblock is cleared.
2048 * The first rescan will capture the entire pageblock for
2049 * migration. If it fails, it'll be marked skip and scanning
2050 * will proceed as normal.
2051 */
2052 cc->rescan = false;
2053 if (pageblock_start_pfn(last_migrated_pfn) ==
2054 pageblock_start_pfn(start_pfn)) {
2055 cc->rescan = true;
2056 }
2057
2038 switch (isolate_migratepages(cc->zone, cc)) { 2058 switch (isolate_migratepages(cc->zone, cc)) {
2039 case ISOLATE_ABORT: 2059 case ISOLATE_ABORT:
2040 ret = COMPACT_CONTENDED; 2060 ret = COMPACT_CONTENDED;