aboutsummaryrefslogtreecommitdiffstats
path: root/mm/filemap.c
diff options
context:
space:
mode:
authorHugh Dickins <hughd@google.com>2011-08-03 19:21:19 -0400
committerLinus Torvalds <torvalds@linux-foundation.org>2011-08-03 20:25:22 -0400
commita2c16d6cb0e478812829ca84aeabd02e36af35eb (patch)
tree7803a522da5deee7ce753dc5404dca01f42aa176 /mm/filemap.c
parent6328650bb4d854a7dc1498d1c0048b838b0d340c (diff)
mm: let swap use exceptional entries
If swap entries are to be stored along with struct page pointers in a radix tree, they need to be distinguished as exceptional entries. Most of the handling of swap entries in radix tree will be contained in shmem.c, but a few functions in filemap.c's common code need to check for their appearance: find_get_page(), find_lock_page(), find_get_pages() and find_get_pages_contig(). So as not to slow their fast paths, tuck those checks inside the existing checks for unlikely radix_tree_deref_slot(); except for find_lock_page(), where it is an added test. And make it a BUG in find_get_pages_tag(), which is not applied to tmpfs files. A part of the reason for eliminating shmem_readpage() earlier, was to minimize the places where common code would need to allow for swap entries. The swp_entry_t known to swapfile.c must be massaged into a slightly different form when stored in the radix tree, just as it gets massaged into a pte_t when stored in page tables. In an i386 kernel this limits its information (type and page offset) to 30 bits: given 32 "types" of swapfile and 4kB pagesize, that's a maximum swapfile size of 128GB. Which is less than the 512GB we previously allowed with X86_PAE (where the swap entry can occupy the entire upper 32 bits of a pte_t), but not a new limitation on 32-bit without PAE; and there's not a new limitation on 64-bit (where swap filesize is already limited to 16TB by a 32-bit page offset). Thirty areas of 128GB is probably still enough swap for a 64GB 32-bit machine. Provide swp_to_radix_entry() and radix_to_swp_entry() conversions, and enforce filesize limit in read_swap_header(), just as for ptes. Signed-off-by: Hugh Dickins <hughd@google.com> Acked-by: Rik van Riel <riel@redhat.com> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'mm/filemap.c')
-rw-r--r--mm/filemap.c49
1 files changed, 31 insertions, 18 deletions
diff --git a/mm/filemap.c b/mm/filemap.c
index b83aebfd0a00..76bfb6460f57 100644
--- a/mm/filemap.c
+++ b/mm/filemap.c
@@ -714,9 +714,12 @@ repeat:
714 page = radix_tree_deref_slot(pagep); 714 page = radix_tree_deref_slot(pagep);
715 if (unlikely(!page)) 715 if (unlikely(!page))
716 goto out; 716 goto out;
717 if (radix_tree_deref_retry(page)) 717 if (radix_tree_exception(page)) {
718 if (radix_tree_exceptional_entry(page))
719 goto out;
720 /* radix_tree_deref_retry(page) */
718 goto repeat; 721 goto repeat;
719 722 }
720 if (!page_cache_get_speculative(page)) 723 if (!page_cache_get_speculative(page))
721 goto repeat; 724 goto repeat;
722 725
@@ -753,7 +756,7 @@ struct page *find_lock_page(struct address_space *mapping, pgoff_t offset)
753 756
754repeat: 757repeat:
755 page = find_get_page(mapping, offset); 758 page = find_get_page(mapping, offset);
756 if (page) { 759 if (page && !radix_tree_exception(page)) {
757 lock_page(page); 760 lock_page(page);
758 /* Has the page been truncated? */ 761 /* Has the page been truncated? */
759 if (unlikely(page->mapping != mapping)) { 762 if (unlikely(page->mapping != mapping)) {
@@ -849,11 +852,14 @@ repeat:
849 if (unlikely(!page)) 852 if (unlikely(!page))
850 continue; 853 continue;
851 854
852 /* 855 if (radix_tree_exception(page)) {
853 * This can only trigger when the entry at index 0 moves out 856 if (radix_tree_exceptional_entry(page))
854 * of or back to the root: none yet gotten, safe to restart. 857 continue;
855 */ 858 /*
856 if (radix_tree_deref_retry(page)) { 859 * radix_tree_deref_retry(page):
860 * can only trigger when entry at index 0 moves out of
861 * or back to root: none yet gotten, safe to restart.
862 */
857 WARN_ON(start | i); 863 WARN_ON(start | i);
858 goto restart; 864 goto restart;
859 } 865 }
@@ -912,12 +918,16 @@ repeat:
912 if (unlikely(!page)) 918 if (unlikely(!page))
913 continue; 919 continue;
914 920
915 /* 921 if (radix_tree_exception(page)) {
916 * This can only trigger when the entry at index 0 moves out 922 if (radix_tree_exceptional_entry(page))
917 * of or back to the root: none yet gotten, safe to restart. 923 break;
918 */ 924 /*
919 if (radix_tree_deref_retry(page)) 925 * radix_tree_deref_retry(page):
926 * can only trigger when entry at index 0 moves out of
927 * or back to root: none yet gotten, safe to restart.
928 */
920 goto restart; 929 goto restart;
930 }
921 931
922 if (!page_cache_get_speculative(page)) 932 if (!page_cache_get_speculative(page))
923 goto repeat; 933 goto repeat;
@@ -977,12 +987,15 @@ repeat:
977 if (unlikely(!page)) 987 if (unlikely(!page))
978 continue; 988 continue;
979 989
980 /* 990 if (radix_tree_exception(page)) {
981 * This can only trigger when the entry at index 0 moves out 991 BUG_ON(radix_tree_exceptional_entry(page));
982 * of or back to the root: none yet gotten, safe to restart. 992 /*
983 */ 993 * radix_tree_deref_retry(page):
984 if (radix_tree_deref_retry(page)) 994 * can only trigger when entry at index 0 moves out of
995 * or back to root: none yet gotten, safe to restart.
996 */
985 goto restart; 997 goto restart;
998 }
986 999
987 if (!page_cache_get_speculative(page)) 1000 if (!page_cache_get_speculative(page))
988 goto repeat; 1001 goto repeat;