about | summary | refs | log | tree | commit | diff | stats
path: root/mm
diff options
context:
space:
mode:
author: Johannes Weiner <hannes@cmpxchg.org> 2016-01-20 18:03:16 -0500
committer: Linus Torvalds <torvalds@linux-foundation.org> 2016-01-20 20:09:18 -0500
commit: 44b7a8d33d666268062e0f725d5f14813a63a6ea (patch)
tree: 976a8ef6d69e8d34be1b07ec5f5d75e26b291ceb /mm
parent: 3e24b19dd5ff0587674ac7578cc11ef079708327 (diff)
mm: memcontrol: do not uncharge old page in page cache replacement
Changing page->mem_cgroup of a live page is tricky and fragile. In particular, the memcg writeback code relies on that mapping being stable and users of mem_cgroup_replace_page() not overlapping with dirtyable inodes.

Page cache replacement doesn't have to do that, though. Instead of being clever and transferring the charge from the old page to the new, force-charge the new page and leave the old page alone. A temporary overcharge won't matter in practice, and the old page is going to be freed shortly after this anyway. And this is not performance critical.

Signed-off-by: Johannes Weiner <hannes@cmpxchg.org>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vladimir Davydov <vdavydov@virtuozzo.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm')
-rw-r--r-- mm/memcontrol.c 26
1 files changed, 15 insertions, 11 deletions
diff --git a/mm/memcontrol.c b/mm/memcontrol.c
index 6a0007965e31..bf35bff282fc 100644
--- a/mm/memcontrol.c
+++ b/mm/memcontrol.c
@@ -366,13 +366,6 @@ mem_cgroup_zone_zoneinfo(struct mem_cgroup *memcg, struct zone *zone)
366 * 366 *
367 * If memcg is bound to a traditional hierarchy, the css of root_mem_cgroup 367 * If memcg is bound to a traditional hierarchy, the css of root_mem_cgroup
368 * is returned. 368 * is returned.
369 *
370 * XXX: The above description of behavior on the default hierarchy isn't
371 * strictly true yet as replace_page_cache_page() can modify the
372 * association before @page is released even on the default hierarchy;
373 * however, the current and planned usages don't mix the the two functions
374 * and replace_page_cache_page() will soon be updated to make the invariant
375 * actually true.
376 */ 369 */
377struct cgroup_subsys_state *mem_cgroup_css_from_page(struct page *page) 370struct cgroup_subsys_state *mem_cgroup_css_from_page(struct page *page)
378{ 371{
@@ -5464,7 +5457,8 @@ void mem_cgroup_uncharge_list(struct list_head *page_list)
5464void mem_cgroup_replace_page(struct page *oldpage, struct page *newpage) 5457void mem_cgroup_replace_page(struct page *oldpage, struct page *newpage)
5465{ 5458{
5466 struct mem_cgroup *memcg; 5459 struct mem_cgroup *memcg;
5467 int isolated; 5460 unsigned int nr_pages;
5461 bool compound;
5468 5462
5469 VM_BUG_ON_PAGE(!PageLocked(oldpage), oldpage); 5463 VM_BUG_ON_PAGE(!PageLocked(oldpage), oldpage);
5470 VM_BUG_ON_PAGE(!PageLocked(newpage), newpage); 5464 VM_BUG_ON_PAGE(!PageLocked(newpage), newpage);
@@ -5484,11 +5478,21 @@ void mem_cgroup_replace_page(struct page *oldpage, struct page *newpage)
5484 if (!memcg) 5478 if (!memcg)
5485 return; 5479 return;
5486 5480
5487 lock_page_lru(oldpage, &isolated); 5481 /* Force-charge the new page. The old one will be freed soon */
5488 oldpage->mem_cgroup = NULL; 5482 compound = PageTransHuge(newpage);
5489 unlock_page_lru(oldpage, isolated); 5483 nr_pages = compound ? hpage_nr_pages(newpage) : 1;
5484
5485 page_counter_charge(&memcg->memory, nr_pages);
5486 if (do_memsw_account())
5487 page_counter_charge(&memcg->memsw, nr_pages);
5488 css_get_many(&memcg->css, nr_pages);
5490 5489
5491 commit_charge(newpage, memcg, true); 5490 commit_charge(newpage, memcg, true);
5491
5492 local_irq_disable();
5493 mem_cgroup_charge_statistics(memcg, newpage, compound, nr_pages);
5494 memcg_check_events(memcg, newpage);
5495 local_irq_enable();
5492} 5496}
5493 5497
5494DEFINE_STATIC_KEY_FALSE(memcg_sockets_enabled_key); 5498DEFINE_STATIC_KEY_FALSE(memcg_sockets_enabled_key);