diff options
author | Konstantin Khlebnikov <khlebnikov@yandex-team.ru> | 2015-04-14 18:45:27 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2015-04-14 19:49:01 -0400 |
commit | b9ea25152e56365ce149b9a39637cd7a16eec556 (patch) | |
tree | e8ab83d71a0bea5330d38e77e948170c0054d2a3 /mm/truncate.c | |
parent | ca0984caa8235762dc4e22c1c47ae6719dcc4064 (diff) |
page_writeback: clean up mess around cancel_dirty_page()
This patch replaces cancel_dirty_page() with a helper function
account_page_cleaned() which only updates counters. It's called from
truncate_complete_page() and from try_to_free_buffers() (hack for ext3).
Page is locked in both cases, page-lock protects against concurrent
dirtiers: see commit 2d6d7f982846 ("mm: protect set_page_dirty() from
ongoing truncation").
Delete_from_page_cache() shouldn't be called for dirty pages, they must
be handled by caller (either written or truncated). This patch treats
final dirty accounting fixup at the end of __delete_from_page_cache() as
a debug check and adds WARN_ON_ONCE() around it. If something removes
dirty pages without proper handling that might be a bug and unwritten
data might be lost.
Hugetlbfs has no dirty pages accounting, ClearPageDirty() is enough
here.
cancel_dirty_page() in nfs_wb_page_cancel() is redundant. This is
helper for nfs_invalidate_page() and it's called only in case complete
invalidation.
The mess was started in v2.6.20 after commits 46d2277c796f ("Clean up
and make try_to_free_buffers() not race with dirty pages") and
3e67c0987d75 ("truncate: clear page dirtiness before running
try_to_free_buffers()") first was reverted right in v2.6.20 in commit
ecdfc9787fe5 ("Resurrect 'try_to_free_buffers()' VM hackery"), second in
v2.6.25 commit a2b345642f53 ("Fix dirty page accounting leak with ext3
data=journal").
Custom fixes were introduced between these points. NFS in v2.6.23, commit
1b3b4a1a2deb ("NFS: Fix a write request leak in nfs_invalidate_page()").
Kludge in __delete_from_page_cache() in v2.6.24, commit 3a6927906f1b ("Do
dirty page accounting when removing a page from the page cache"). Since
v2.6.25 all of them are redundant.
[akpm@linux-foundation.org: coding-style fixes]
Signed-off-by: Konstantin Khlebnikov <khlebnikov@yandex-team.ru>
Cc: Tejun Heo <tj@kernel.org>
Cc: Jan Kara <jack@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/truncate.c')
-rw-r--r-- | mm/truncate.c | 37 |
1 files changed, 7 insertions, 30 deletions
diff --git a/mm/truncate.c b/mm/truncate.c index ddec5a5966d7..7a9d8a3cb143 100644 --- a/mm/truncate.c +++ b/mm/truncate.c | |||
@@ -93,35 +93,6 @@ void do_invalidatepage(struct page *page, unsigned int offset, | |||
93 | } | 93 | } |
94 | 94 | ||
95 | /* | 95 | /* |
96 | * This cancels just the dirty bit on the kernel page itself, it | ||
97 | * does NOT actually remove dirty bits on any mmap's that may be | ||
98 | * around. It also leaves the page tagged dirty, so any sync | ||
99 | * activity will still find it on the dirty lists, and in particular, | ||
100 | * clear_page_dirty_for_io() will still look at the dirty bits in | ||
101 | * the VM. | ||
102 | * | ||
103 | * Doing this should *normally* only ever be done when a page | ||
104 | * is truncated, and is not actually mapped anywhere at all. However, | ||
105 | * fs/buffer.c does this when it notices that somebody has cleaned | ||
106 | * out all the buffers on a page without actually doing it through | ||
107 | * the VM. Can you say "ext3 is horribly ugly"? Tought you could. | ||
108 | */ | ||
109 | void cancel_dirty_page(struct page *page, unsigned int account_size) | ||
110 | { | ||
111 | if (TestClearPageDirty(page)) { | ||
112 | struct address_space *mapping = page->mapping; | ||
113 | if (mapping && mapping_cap_account_dirty(mapping)) { | ||
114 | dec_zone_page_state(page, NR_FILE_DIRTY); | ||
115 | dec_bdi_stat(inode_to_bdi(mapping->host), | ||
116 | BDI_RECLAIMABLE); | ||
117 | if (account_size) | ||
118 | task_io_account_cancelled_write(account_size); | ||
119 | } | ||
120 | } | ||
121 | } | ||
122 | EXPORT_SYMBOL(cancel_dirty_page); | ||
123 | |||
124 | /* | ||
125 | * If truncate cannot remove the fs-private metadata from the page, the page | 96 | * If truncate cannot remove the fs-private metadata from the page, the page |
126 | * becomes orphaned. It will be left on the LRU and may even be mapped into | 97 | * becomes orphaned. It will be left on the LRU and may even be mapped into |
127 | * user pagetables if we're racing with filemap_fault(). | 98 | * user pagetables if we're racing with filemap_fault(). |
@@ -140,7 +111,13 @@ truncate_complete_page(struct address_space *mapping, struct page *page) | |||
140 | if (page_has_private(page)) | 111 | if (page_has_private(page)) |
141 | do_invalidatepage(page, 0, PAGE_CACHE_SIZE); | 112 | do_invalidatepage(page, 0, PAGE_CACHE_SIZE); |
142 | 113 | ||
143 | cancel_dirty_page(page, PAGE_CACHE_SIZE); | 114 | /* |
115 | * Some filesystems seem to re-dirty the page even after | ||
116 | * the VM has canceled the dirty bit (eg ext3 journaling). | ||
117 | * Hence dirty accounting check is placed after invalidation. | ||
118 | */ | ||
119 | if (TestClearPageDirty(page)) | ||
120 | account_page_cleaned(page, mapping); | ||
144 | 121 | ||
145 | ClearPageMappedToDisk(page); | 122 | ClearPageMappedToDisk(page); |
146 | delete_from_page_cache(page); | 123 | delete_from_page_cache(page); |