diff options
author | Hugh Dickins <hugh@veritas.com> | 2006-02-21 18:49:47 -0500 |
---|---|---|
committer | Linus Torvalds <torvalds@g5.osdl.org> | 2006-02-21 20:10:15 -0500 |
commit | b00dc3ad74fdb676552d46ee573b88e927240d0c (patch) | |
tree | 6dcf7806f1f0fc791d3455dcf233a11088b18b3a | |
parent | 808c783e9bfb217a90be5a996a867c41a69b40bd (diff) |
[PATCH] tmpfs: fix mount mpol nodelist parsing
I've been dissatisfied with the mpol_nodelist mount option which was
added to tmpfs earlier in -rc. Replace it by mpol=policy:nodelist.
And it was broken: a nodelist is a comma-separated list of numbers and
ranges; the mount options are a comma-separated list of token=values.
Whoops, blindly strsep'ing on commas doesn't work so well: since no mount
option token starts with a digit, and we're unlikely to add one, treat a
comma followed by a digit as part of the nodelist, not an option separator.
Move the mpol= parsing to shmem_parse_mpol under CONFIG_NUMA, reject
all its options as invalid if not NUMA. /proc shows MPOL_PREFERRED
as "prefer", so use that name for the policy instead of "preferred".
Enforce that mpol=default has no nodelist; that mpol=prefer has one
node only; that mpol=bind has a nodelist; but let mpol=interleave use
node_online_map if no nodelist given. Describe this in tmpfs.txt.
Signed-off-by: Hugh Dickins <hugh@veritas.com>
Acked-by: Robin Holt <holt@sgi.com>
Acked-by: Andi Kleen <ak@suse.de>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
-rw-r--r-- | Documentation/filesystems/tmpfs.txt | 21 | ||||
-rw-r--r-- | mm/shmem.c | 81 |
2 files changed, 81 insertions, 21 deletions
diff --git a/Documentation/filesystems/tmpfs.txt b/Documentation/filesystems/tmpfs.txt index dbe4d87d2615..8a155418c705 100644 --- a/Documentation/filesystems/tmpfs.txt +++ b/Documentation/filesystems/tmpfs.txt | |||
@@ -79,15 +79,18 @@ that instance in a system with many cpus making intensive use of it. | |||
79 | 79 | ||
80 | 80 | ||
81 | tmpfs has a mount option to set the NUMA memory allocation policy for | 81 | tmpfs has a mount option to set the NUMA memory allocation policy for |
82 | all files in that instance: | 82 | all files in that instance (if CONFIG_NUMA is enabled) - which can be |
83 | mpol=interleave prefers to allocate memory from each node in turn | 83 | adjusted on the fly via 'mount -o remount ...' |
84 | mpol=default prefers to allocate memory from the local node | ||
85 | mpol=bind prefers to allocate from mpol_nodelist | ||
86 | mpol=preferred prefers to allocate from first node in mpol_nodelist | ||
87 | 84 | ||
88 | The following mount option is used in conjunction with mpol=interleave, | 85 | mpol=default prefers to allocate memory from the local node |
89 | mpol=bind or mpol=preferred: | 86 | mpol=prefer:Node prefers to allocate memory from the given Node |
90 | mpol_nodelist: nodelist suitable for parsing with nodelist_parse. | 87 | mpol=bind:NodeList allocates memory only from nodes in NodeList |
88 | mpol=interleave prefers to allocate from each node in turn | ||
89 | mpol=interleave:NodeList allocates from each node of NodeList in turn | ||
90 | |||
91 | NodeList format is a comma-separated list of decimal numbers and ranges, | ||
92 | a range being two hyphen-separated decimal numbers, the smallest and | ||
93 | largest node numbers in the range. For example, mpol=bind:0-3,5,7,9-15 | ||
91 | 94 | ||
92 | 95 | ||
93 | To specify the initial root directory you can use the following mount | 96 | To specify the initial root directory you can use the following mount |
@@ -109,4 +112,4 @@ RAM/SWAP in 10240 inodes and it is only accessible by root. | |||
109 | Author: | 112 | Author: |
110 | Christoph Rohland <cr@sap.com>, 1.12.01 | 113 | Christoph Rohland <cr@sap.com>, 1.12.01 |
111 | Updated: | 114 | Updated: |
112 | Hugh Dickins <hugh@veritas.com>, 13 March 2005 | 115 | Hugh Dickins <hugh@veritas.com>, 19 February 2006 |
diff --git a/mm/shmem.c b/mm/shmem.c index f7ac7b812f92..7c455fbaff7b 100644 --- a/mm/shmem.c +++ b/mm/shmem.c | |||
@@ -45,6 +45,7 @@ | |||
45 | #include <linux/swapops.h> | 45 | #include <linux/swapops.h> |
46 | #include <linux/mempolicy.h> | 46 | #include <linux/mempolicy.h> |
47 | #include <linux/namei.h> | 47 | #include <linux/namei.h> |
48 | #include <linux/ctype.h> | ||
48 | #include <asm/uaccess.h> | 49 | #include <asm/uaccess.h> |
49 | #include <asm/div64.h> | 50 | #include <asm/div64.h> |
50 | #include <asm/pgtable.h> | 51 | #include <asm/pgtable.h> |
@@ -874,6 +875,51 @@ redirty: | |||
874 | } | 875 | } |
875 | 876 | ||
876 | #ifdef CONFIG_NUMA | 877 | #ifdef CONFIG_NUMA |
878 | static int shmem_parse_mpol(char *value, int *policy, nodemask_t *policy_nodes) | ||
879 | { | ||
880 | char *nodelist = strchr(value, ':'); | ||
881 | int err = 1; | ||
882 | |||
883 | if (nodelist) { | ||
884 | /* NUL-terminate policy string */ | ||
885 | *nodelist++ = '\0'; | ||
886 | if (nodelist_parse(nodelist, *policy_nodes)) | ||
887 | goto out; | ||
888 | } | ||
889 | if (!strcmp(value, "default")) { | ||
890 | *policy = MPOL_DEFAULT; | ||
891 | /* Don't allow a nodelist */ | ||
892 | if (!nodelist) | ||
893 | err = 0; | ||
894 | } else if (!strcmp(value, "prefer")) { | ||
895 | *policy = MPOL_PREFERRED; | ||
896 | /* Insist on a nodelist of one node only */ | ||
897 | if (nodelist) { | ||
898 | char *rest = nodelist; | ||
899 | while (isdigit(*rest)) | ||
900 | rest++; | ||
901 | if (!*rest) | ||
902 | err = 0; | ||
903 | } | ||
904 | } else if (!strcmp(value, "bind")) { | ||
905 | *policy = MPOL_BIND; | ||
906 | /* Insist on a nodelist */ | ||
907 | if (nodelist) | ||
908 | err = 0; | ||
909 | } else if (!strcmp(value, "interleave")) { | ||
910 | *policy = MPOL_INTERLEAVE; | ||
911 | /* Default to nodes online if no nodelist */ | ||
912 | if (!nodelist) | ||
913 | *policy_nodes = node_online_map; | ||
914 | err = 0; | ||
915 | } | ||
916 | out: | ||
917 | /* Restore string for error message */ | ||
918 | if (nodelist) | ||
919 | *--nodelist = ':'; | ||
920 | return err; | ||
921 | } | ||
922 | |||
877 | static struct page *shmem_swapin_async(struct shared_policy *p, | 923 | static struct page *shmem_swapin_async(struct shared_policy *p, |
878 | swp_entry_t entry, unsigned long idx) | 924 | swp_entry_t entry, unsigned long idx) |
879 | { | 925 | { |
@@ -926,6 +972,11 @@ shmem_alloc_page(gfp_t gfp, struct shmem_inode_info *info, | |||
926 | return page; | 972 | return page; |
927 | } | 973 | } |
928 | #else | 974 | #else |
975 | static inline int shmem_parse_mpol(char *value, int *policy, nodemask_t *policy_nodes) | ||
976 | { | ||
977 | return 1; | ||
978 | } | ||
979 | |||
929 | static inline struct page * | 980 | static inline struct page * |
930 | shmem_swapin(struct shmem_inode_info *info,swp_entry_t entry,unsigned long idx) | 981 | shmem_swapin(struct shmem_inode_info *info,swp_entry_t entry,unsigned long idx) |
931 | { | 982 | { |
@@ -1859,7 +1910,23 @@ static int shmem_parse_options(char *options, int *mode, uid_t *uid, | |||
1859 | { | 1910 | { |
1860 | char *this_char, *value, *rest; | 1911 | char *this_char, *value, *rest; |
1861 | 1912 | ||
1862 | while ((this_char = strsep(&options, ",")) != NULL) { | 1913 | while (options != NULL) { |
1914 | this_char = options; | ||
1915 | for (;;) { | ||
1916 | /* | ||
1917 | * NUL-terminate this option: unfortunately, | ||
1918 | * mount options form a comma-separated list, | ||
1919 | * but mpol's nodelist may also contain commas. | ||
1920 | */ | ||
1921 | options = strchr(options, ','); | ||
1922 | if (options == NULL) | ||
1923 | break; | ||
1924 | options++; | ||
1925 | if (!isdigit(*options)) { | ||
1926 | options[-1] = '\0'; | ||
1927 | break; | ||
1928 | } | ||
1929 | } | ||
1863 | if (!*this_char) | 1930 | if (!*this_char) |
1864 | continue; | 1931 | continue; |
1865 | if ((value = strchr(this_char,'=')) != NULL) { | 1932 | if ((value = strchr(this_char,'=')) != NULL) { |
@@ -1910,18 +1977,8 @@ static int shmem_parse_options(char *options, int *mode, uid_t *uid, | |||
1910 | if (*rest) | 1977 | if (*rest) |
1911 | goto bad_val; | 1978 | goto bad_val; |
1912 | } else if (!strcmp(this_char,"mpol")) { | 1979 | } else if (!strcmp(this_char,"mpol")) { |
1913 | if (!strcmp(value,"default")) | 1980 | if (shmem_parse_mpol(value,policy,policy_nodes)) |
1914 | *policy = MPOL_DEFAULT; | ||
1915 | else if (!strcmp(value,"preferred")) | ||
1916 | *policy = MPOL_PREFERRED; | ||
1917 | else if (!strcmp(value,"bind")) | ||
1918 | *policy = MPOL_BIND; | ||
1919 | else if (!strcmp(value,"interleave")) | ||
1920 | *policy = MPOL_INTERLEAVE; | ||
1921 | else | ||
1922 | goto bad_val; | 1981 | goto bad_val; |
1923 | } else if (!strcmp(this_char,"mpol_nodelist")) { | ||
1924 | nodelist_parse(value, *policy_nodes); | ||
1925 | } else { | 1982 | } else { |
1926 | printk(KERN_ERR "tmpfs: Bad mount option %s\n", | 1983 | printk(KERN_ERR "tmpfs: Bad mount option %s\n", |
1927 | this_char); | 1984 | this_char); |