diff options
author | Hugh Dickins <hughd@google.com> | 2011-08-03 19:21:19 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@linux-foundation.org> | 2011-08-03 20:25:22 -0400 |
commit | a2c16d6cb0e478812829ca84aeabd02e36af35eb (patch) | |
tree | 7803a522da5deee7ce753dc5404dca01f42aa176 /mm/filemap.c | |
parent | 6328650bb4d854a7dc1498d1c0048b838b0d340c (diff) |
mm: let swap use exceptional entries
If swap entries are to be stored along with struct page pointers in a
radix tree, they need to be distinguished as exceptional entries.
Most of the handling of swap entries in radix tree will be contained in
shmem.c, but a few functions in filemap.c's common code need to check
for their appearance: find_get_page(), find_lock_page(),
find_get_pages() and find_get_pages_contig().
So as not to slow their fast paths, tuck those checks inside the
existing checks for unlikely radix_tree_deref_slot(); except for
find_lock_page(), where it is an added test. And make it a BUG in
find_get_pages_tag(), which is not applied to tmpfs files.
A part of the reason for eliminating shmem_readpage() earlier, was to
minimize the places where common code would need to allow for swap
entries.
The swp_entry_t known to swapfile.c must be massaged into a slightly
different form when stored in the radix tree, just as it gets massaged
into a pte_t when stored in page tables.
In an i386 kernel this limits its information (type and page offset) to
30 bits: given 32 "types" of swapfile and 4kB pagesize, that's a maximum
swapfile size of 128GB. Which is less than the 512GB we previously
allowed with X86_PAE (where the swap entry can occupy the entire upper
32 bits of a pte_t), but not a new limitation on 32-bit without PAE; and
there's not a new limitation on 64-bit (where swap filesize is already
limited to 16TB by a 32-bit page offset). Thirty areas of 128GB is
probably still enough swap for a 64GB 32-bit machine.
Provide swp_to_radix_entry() and radix_to_swp_entry() conversions, and
enforce filesize limit in read_swap_header(), just as for ptes.
Signed-off-by: Hugh Dickins <hughd@google.com>
Acked-by: Rik van Riel <riel@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/filemap.c')
-rw-r--r-- | mm/filemap.c | 49 |
1 files changed, 31 insertions, 18 deletions
diff --git a/mm/filemap.c b/mm/filemap.c index b83aebfd0a00..76bfb6460f57 100644 --- a/mm/filemap.c +++ b/mm/filemap.c | |||
@@ -714,9 +714,12 @@ repeat: | |||
714 | page = radix_tree_deref_slot(pagep); | 714 | page = radix_tree_deref_slot(pagep); |
715 | if (unlikely(!page)) | 715 | if (unlikely(!page)) |
716 | goto out; | 716 | goto out; |
717 | if (radix_tree_deref_retry(page)) | 717 | if (radix_tree_exception(page)) { |
718 | if (radix_tree_exceptional_entry(page)) | ||
719 | goto out; | ||
720 | /* radix_tree_deref_retry(page) */ | ||
718 | goto repeat; | 721 | goto repeat; |
719 | 722 | } | |
720 | if (!page_cache_get_speculative(page)) | 723 | if (!page_cache_get_speculative(page)) |
721 | goto repeat; | 724 | goto repeat; |
722 | 725 | ||
@@ -753,7 +756,7 @@ struct page *find_lock_page(struct address_space *mapping, pgoff_t offset) | |||
753 | 756 | ||
754 | repeat: | 757 | repeat: |
755 | page = find_get_page(mapping, offset); | 758 | page = find_get_page(mapping, offset); |
756 | if (page) { | 759 | if (page && !radix_tree_exception(page)) { |
757 | lock_page(page); | 760 | lock_page(page); |
758 | /* Has the page been truncated? */ | 761 | /* Has the page been truncated? */ |
759 | if (unlikely(page->mapping != mapping)) { | 762 | if (unlikely(page->mapping != mapping)) { |
@@ -849,11 +852,14 @@ repeat: | |||
849 | if (unlikely(!page)) | 852 | if (unlikely(!page)) |
850 | continue; | 853 | continue; |
851 | 854 | ||
852 | /* | 855 | if (radix_tree_exception(page)) { |
853 | * This can only trigger when the entry at index 0 moves out | 856 | if (radix_tree_exceptional_entry(page)) |
854 | * of or back to the root: none yet gotten, safe to restart. | 857 | continue; |
855 | */ | 858 | /* |
856 | if (radix_tree_deref_retry(page)) { | 859 | * radix_tree_deref_retry(page): |
860 | * can only trigger when entry at index 0 moves out of | ||
861 | * or back to root: none yet gotten, safe to restart. | ||
862 | */ | ||
857 | WARN_ON(start | i); | 863 | WARN_ON(start | i); |
858 | goto restart; | 864 | goto restart; |
859 | } | 865 | } |
@@ -912,12 +918,16 @@ repeat: | |||
912 | if (unlikely(!page)) | 918 | if (unlikely(!page)) |
913 | continue; | 919 | continue; |
914 | 920 | ||
915 | /* | 921 | if (radix_tree_exception(page)) { |
916 | * This can only trigger when the entry at index 0 moves out | 922 | if (radix_tree_exceptional_entry(page)) |
917 | * of or back to the root: none yet gotten, safe to restart. | 923 | break; |
918 | */ | 924 | /* |
919 | if (radix_tree_deref_retry(page)) | 925 | * radix_tree_deref_retry(page): |
926 | * can only trigger when entry at index 0 moves out of | ||
927 | * or back to root: none yet gotten, safe to restart. | ||
928 | */ | ||
920 | goto restart; | 929 | goto restart; |
930 | } | ||
921 | 931 | ||
922 | if (!page_cache_get_speculative(page)) | 932 | if (!page_cache_get_speculative(page)) |
923 | goto repeat; | 933 | goto repeat; |
@@ -977,12 +987,15 @@ repeat: | |||
977 | if (unlikely(!page)) | 987 | if (unlikely(!page)) |
978 | continue; | 988 | continue; |
979 | 989 | ||
980 | /* | 990 | if (radix_tree_exception(page)) { |
981 | * This can only trigger when the entry at index 0 moves out | 991 | BUG_ON(radix_tree_exceptional_entry(page)); |
982 | * of or back to the root: none yet gotten, safe to restart. | 992 | /* |
983 | */ | 993 | * radix_tree_deref_retry(page): |
984 | if (radix_tree_deref_retry(page)) | 994 | * can only trigger when entry at index 0 moves out of |
995 | * or back to root: none yet gotten, safe to restart. | ||
996 | */ | ||
985 | goto restart; | 997 | goto restart; |
998 | } | ||
986 | 999 | ||
987 | if (!page_cache_get_speculative(page)) | 1000 | if (!page_cache_get_speculative(page)) |
988 | goto repeat; | 1001 | goto repeat; |