diff options
author | Andi Kleen <ak@linux.intel.com> | 2011-03-22 19:33:12 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-03-22 20:44:05 -0400 |
commit | 78afd5612deb8268bafc8b6507d72341d5ed9aac (patch) | |
tree | b96131d6f237b9ce6848d95c8eccdd1f7855365c /mm | |
parent | 11bc82d67d1150767901bca54a24466621d763d7 (diff) |
mm: add __GFP_OTHER_NODE flag
Add a new __GFP_OTHER_NODE flag to tell the low level numa statistics in
zone_statistics() that an allocation is on behalf of another thread. This
way the local and remote counters can still be correct, even when
background daemons like khugepaged are changing memory mappings.
This only affects the accounting, but I think it's worth doing that right
to avoid confusing users.
I first tried to just pass down the right node, but this required a lot of
changes to pass down this parameter and at least one addition of a 10th
argument to a 9 argument function. Using the flag is a lot less
intrusive.
Open question: should this flag also be used for migration?
[akpm@linux-foundation.org: coding-style fixes]
Signed-off-by: Andi Kleen <ak@linux.intel.com>
Cc: Andrea Arcangeli <aarcange@redhat.com>
Reviewed-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Cc: Johannes Weiner <hannes@cmpxchg.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm')
-rw-r--r-- | mm/page_alloc.c | 2 | ||||
-rw-r--r-- | mm/vmstat.c | 9 |
2 files changed, 8 insertions, 3 deletions
diff --git a/mm/page_alloc.c b/mm/page_alloc.c index 6d0032bdb5d..136a547262a 100644 --- a/mm/page_alloc.c +++ b/mm/page_alloc.c | |||
@@ -1337,7 +1337,7 @@ again: | |||
1337 | } | 1337 | } |
1338 | 1338 | ||
1339 | __count_zone_vm_events(PGALLOC, zone, 1 << order); | 1339 | __count_zone_vm_events(PGALLOC, zone, 1 << order); |
1340 | zone_statistics(preferred_zone, zone); | 1340 | zone_statistics(preferred_zone, zone, gfp_flags); |
1341 | local_irq_restore(flags); | 1341 | local_irq_restore(flags); |
1342 | 1342 | ||
1343 | VM_BUG_ON(bad_range(zone, page)); | 1343 | VM_BUG_ON(bad_range(zone, page)); |
diff --git a/mm/vmstat.c b/mm/vmstat.c index 0c3b5048773..772b39b87d9 100644 --- a/mm/vmstat.c +++ b/mm/vmstat.c | |||
@@ -500,8 +500,12 @@ void refresh_cpu_vm_stats(int cpu) | |||
500 | * z = the zone from which the allocation occurred. | 500 | * z = the zone from which the allocation occurred. |
501 | * | 501 | * |
502 | * Must be called with interrupts disabled. | 502 | * Must be called with interrupts disabled. |
503 | * | ||
504 | * When __GFP_OTHER_NODE is set assume the node of the preferred | ||
505 | * zone is the local node. This is useful for daemons who allocate | ||
506 | * memory on behalf of other processes. | ||
503 | */ | 507 | */ |
504 | void zone_statistics(struct zone *preferred_zone, struct zone *z) | 508 | void zone_statistics(struct zone *preferred_zone, struct zone *z, gfp_t flags) |
505 | { | 509 | { |
506 | if (z->zone_pgdat == preferred_zone->zone_pgdat) { | 510 | if (z->zone_pgdat == preferred_zone->zone_pgdat) { |
507 | __inc_zone_state(z, NUMA_HIT); | 511 | __inc_zone_state(z, NUMA_HIT); |
@@ -509,7 +513,8 @@ void zone_statistics(struct zone *preferred_zone, struct zone *z) | |||
509 | __inc_zone_state(z, NUMA_MISS); | 513 | __inc_zone_state(z, NUMA_MISS); |
510 | __inc_zone_state(preferred_zone, NUMA_FOREIGN); | 514 | __inc_zone_state(preferred_zone, NUMA_FOREIGN); |
511 | } | 515 | } |
512 | if (z->node == numa_node_id()) | 516 | if (z->node == ((flags & __GFP_OTHER_NODE) ? |
517 | preferred_zone->node : numa_node_id())) | ||
513 | __inc_zone_state(z, NUMA_LOCAL); | 518 | __inc_zone_state(z, NUMA_LOCAL); |
514 | else | 519 | else |
515 | __inc_zone_state(z, NUMA_OTHER); | 520 | __inc_zone_state(z, NUMA_OTHER); |