diff options
author | Paul Mundt <lethal@linux-sh.org> | 2007-07-16 02:38:22 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@woody.linux-foundation.org> | 2007-07-16 12:05:36 -0400 |
commit | 6193a2ff180920f84ee06977165ebf32431fc2d2 (patch) | |
tree | d3c6423c50463ea741080a58a2e654cf103431f3 /include/linux/slab.h | |
parent | f7977793240d836e60ff413e94e6914f08e10941 (diff) |
slob: initial NUMA support
This adds preliminary NUMA support to SLOB, primarily aimed at systems with
small nodes (tested all the way down to a 128kB SRAM block), whether
asymmetric or otherwise.
We follow the same conventions as SLAB/SLUB, preferring current node
placement for new pages, or with explicit placement, if a node has been
specified. Presently on UP NUMA this has the side-effect of preferring
node#0 allocations (since numa_node_id() == 0, though this could be
reworked if we could hand off a pfn to determine node placement), so
single-CPU NUMA systems will want to place smaller nodes further out in
terms of node id. Once a page has been bound to a node (via explicit node
id typing), we only do block allocations from partial free pages that have
a matching node id in the page flags.
The current implementation does have some scalability problems, in that all
partial free pages are tracked in the global freelist (with contention due
to the single spinlock). However, these are things that are being reworked
for SMP scalability first, while things like per-node freelists can easily
be built on top of this sort of functionality once it's been added.
More background can be found in:
http://marc.info/?l=linux-mm&m=118117916022379&w=2
http://marc.info/?l=linux-mm&m=118170446306199&w=2
http://marc.info/?l=linux-mm&m=118187859420048&w=2
and subsequent threads.
Acked-by: Christoph Lameter <clameter@sgi.com>
Acked-by: Matt Mackall <mpm@selenic.com>
Signed-off-by: Paul Mundt <lethal@linux-sh.org>
Acked-by: Nick Piggin <nickpiggin@yahoo.com.au>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Diffstat (limited to 'include/linux/slab.h')
-rw-r--r-- | include/linux/slab.h | 126 |
1 files changed, 62 insertions, 64 deletions
diff --git a/include/linux/slab.h b/include/linux/slab.h index cd6ab658553f..27402fea9b79 100644 --- a/include/linux/slab.h +++ b/include/linux/slab.h | |||
@@ -42,7 +42,6 @@ struct kmem_cache *kmem_cache_create(const char *, size_t, size_t, | |||
42 | void (*)(void *, struct kmem_cache *, unsigned long)); | 42 | void (*)(void *, struct kmem_cache *, unsigned long)); |
43 | void kmem_cache_destroy(struct kmem_cache *); | 43 | void kmem_cache_destroy(struct kmem_cache *); |
44 | int kmem_cache_shrink(struct kmem_cache *); | 44 | int kmem_cache_shrink(struct kmem_cache *); |
45 | void *kmem_cache_alloc(struct kmem_cache *, gfp_t); | ||
46 | void *kmem_cache_zalloc(struct kmem_cache *, gfp_t); | 45 | void *kmem_cache_zalloc(struct kmem_cache *, gfp_t); |
47 | void kmem_cache_free(struct kmem_cache *, void *); | 46 | void kmem_cache_free(struct kmem_cache *, void *); |
48 | unsigned int kmem_cache_size(struct kmem_cache *); | 47 | unsigned int kmem_cache_size(struct kmem_cache *); |
@@ -61,16 +60,6 @@ int kmem_ptr_validate(struct kmem_cache *cachep, const void *ptr); | |||
61 | sizeof(struct __struct), __alignof__(struct __struct),\ | 60 | sizeof(struct __struct), __alignof__(struct __struct),\ |
62 | (__flags), NULL, NULL) | 61 | (__flags), NULL, NULL) |
63 | 62 | ||
64 | #ifdef CONFIG_NUMA | ||
65 | extern void *kmem_cache_alloc_node(struct kmem_cache *, gfp_t flags, int node); | ||
66 | #else | ||
67 | static inline void *kmem_cache_alloc_node(struct kmem_cache *cachep, | ||
68 | gfp_t flags, int node) | ||
69 | { | ||
70 | return kmem_cache_alloc(cachep, flags); | ||
71 | } | ||
72 | #endif | ||
73 | |||
74 | /* | 63 | /* |
75 | * The largest kmalloc size supported by the slab allocators is | 64 | * The largest kmalloc size supported by the slab allocators is |
76 | * 32 megabyte (2^25) or the maximum allocatable page order if that is | 65 | * 32 megabyte (2^25) or the maximum allocatable page order if that is |
@@ -89,7 +78,6 @@ static inline void *kmem_cache_alloc_node(struct kmem_cache *cachep, | |||
89 | /* | 78 | /* |
90 | * Common kmalloc functions provided by all allocators | 79 | * Common kmalloc functions provided by all allocators |
91 | */ | 80 | */ |
92 | void *__kmalloc(size_t, gfp_t); | ||
93 | void *__kzalloc(size_t, gfp_t); | 81 | void *__kzalloc(size_t, gfp_t); |
94 | void * __must_check krealloc(const void *, size_t, gfp_t); | 82 | void * __must_check krealloc(const void *, size_t, gfp_t); |
95 | void kfree(const void *); | 83 | void kfree(const void *); |
@@ -100,40 +88,6 @@ size_t ksize(const void *); | |||
100 | * @n: number of elements. | 88 | * @n: number of elements. |
101 | * @size: element size. | 89 | * @size: element size. |
102 | * @flags: the type of memory to allocate. | 90 | * @flags: the type of memory to allocate. |
103 | */ | ||
104 | static inline void *kcalloc(size_t n, size_t size, gfp_t flags) | ||
105 | { | ||
106 | if (n != 0 && size > ULONG_MAX / n) | ||
107 | return NULL; | ||
108 | return __kzalloc(n * size, flags); | ||
109 | } | ||
110 | |||
111 | /* | ||
112 | * Allocator specific definitions. These are mainly used to establish optimized | ||
113 | * ways to convert kmalloc() calls to kmem_cache_alloc() invocations by selecting | ||
114 | * the appropriate general cache at compile time. | ||
115 | */ | ||
116 | |||
117 | #if defined(CONFIG_SLAB) || defined(CONFIG_SLUB) | ||
118 | #ifdef CONFIG_SLUB | ||
119 | #include <linux/slub_def.h> | ||
120 | #else | ||
121 | #include <linux/slab_def.h> | ||
122 | #endif /* !CONFIG_SLUB */ | ||
123 | #else | ||
124 | |||
125 | /* | ||
126 | * Fallback definitions for an allocator not wanting to provide | ||
127 | * its own optimized kmalloc definitions (like SLOB). | ||
128 | */ | ||
129 | |||
130 | /** | ||
131 | * kmalloc - allocate memory | ||
132 | * @size: how many bytes of memory are required. | ||
133 | * @flags: the type of memory to allocate. | ||
134 | * | ||
135 | * kmalloc is the normal method of allocating memory | ||
136 | * in the kernel. | ||
137 | * | 91 | * |
138 | * The @flags argument may be one of: | 92 | * The @flags argument may be one of: |
139 | * | 93 | * |
@@ -141,7 +95,7 @@ static inline void *kcalloc(size_t n, size_t size, gfp_t flags) | |||
141 | * | 95 | * |
142 | * %GFP_KERNEL - Allocate normal kernel ram. May sleep. | 96 | * %GFP_KERNEL - Allocate normal kernel ram. May sleep. |
143 | * | 97 | * |
144 | * %GFP_ATOMIC - Allocation will not sleep. | 98 | * %GFP_ATOMIC - Allocation will not sleep. May use emergency pools. |
145 | * For example, use this inside interrupt handlers. | 99 | * For example, use this inside interrupt handlers. |
146 | * | 100 | * |
147 | * %GFP_HIGHUSER - Allocate pages from high memory. | 101 | * %GFP_HIGHUSER - Allocate pages from high memory. |
@@ -150,18 +104,22 @@ static inline void *kcalloc(size_t n, size_t size, gfp_t flags) | |||
150 | * | 104 | * |
151 | * %GFP_NOFS - Do not make any fs calls while trying to get memory. | 105 | * %GFP_NOFS - Do not make any fs calls while trying to get memory. |
152 | * | 106 | * |
107 | * %GFP_NOWAIT - Allocation will not sleep. | ||
108 | * | ||
109 | * %GFP_THISNODE - Allocate node-local memory only. | ||
110 | * | ||
111 | * %GFP_DMA - Allocation suitable for DMA. | ||
112 | * Should only be used for kmalloc() caches. Otherwise, use a | ||
113 | * slab created with SLAB_DMA. | ||
114 | * | ||
153 | * Also it is possible to set different flags by OR'ing | 115 | * Also it is possible to set different flags by OR'ing |
154 | * in one or more of the following additional @flags: | 116 | * in one or more of the following additional @flags: |
155 | * | 117 | * |
156 | * %__GFP_COLD - Request cache-cold pages instead of | 118 | * %__GFP_COLD - Request cache-cold pages instead of |
157 | * trying to return cache-warm pages. | 119 | * trying to return cache-warm pages. |
158 | * | 120 | * |
159 | * %__GFP_DMA - Request memory from the DMA-capable zone. | ||
160 | * | ||
161 | * %__GFP_HIGH - This allocation has high priority and may use emergency pools. | 121 | * %__GFP_HIGH - This allocation has high priority and may use emergency pools. |
162 | * | 122 | * |
163 | * %__GFP_HIGHMEM - Allocated memory may be from highmem. | ||
164 | * | ||
165 | * %__GFP_NOFAIL - Indicate that this allocation is in no way allowed to fail | 123 | * %__GFP_NOFAIL - Indicate that this allocation is in no way allowed to fail |
166 | * (think twice before using). | 124 | * (think twice before using). |
167 | * | 125 | * |
@@ -171,24 +129,57 @@ static inline void *kcalloc(size_t n, size_t size, gfp_t flags) | |||
171 | * %__GFP_NOWARN - If allocation fails, don't issue any warnings. | 129 | * %__GFP_NOWARN - If allocation fails, don't issue any warnings. |
172 | * | 130 | * |
173 | * %__GFP_REPEAT - If allocation fails initially, try once more before failing. | 131 | * %__GFP_REPEAT - If allocation fails initially, try once more before failing. |
132 | * | ||
133 | * There are other flags available as well, but these are not intended | ||
134 | * for general use, and so are not documented here. For a full list of | ||
135 | * potential flags, always refer to linux/gfp.h. | ||
174 | */ | 136 | */ |
175 | static inline void *kmalloc(size_t size, gfp_t flags) | 137 | static inline void *kcalloc(size_t n, size_t size, gfp_t flags) |
176 | { | 138 | { |
177 | return __kmalloc(size, flags); | 139 | if (n != 0 && size > ULONG_MAX / n) |
140 | return NULL; | ||
141 | return __kzalloc(n * size, flags); | ||
178 | } | 142 | } |
179 | 143 | ||
180 | /** | 144 | /* |
181 | * kzalloc - allocate memory. The memory is set to zero. | 145 | * Allocator specific definitions. These are mainly used to establish optimized |
182 | * @size: how many bytes of memory are required. | 146 | * ways to convert kmalloc() calls to kmem_cache_alloc() invocations by |
183 | * @flags: the type of memory to allocate (see kmalloc). | 147 | * selecting the appropriate general cache at compile time. |
148 | * | ||
149 | * Allocators must define at least: | ||
150 | * | ||
151 | * kmem_cache_alloc() | ||
152 | * __kmalloc() | ||
153 | * kmalloc() | ||
154 | * kzalloc() | ||
155 | * | ||
156 | * Those wishing to support NUMA must also define: | ||
157 | * | ||
158 | * kmem_cache_alloc_node() | ||
159 | * kmalloc_node() | ||
160 | * | ||
161 | * See each allocator definition file for additional comments and | ||
162 | * implementation notes. | ||
184 | */ | 163 | */ |
185 | static inline void *kzalloc(size_t size, gfp_t flags) | 164 | #ifdef CONFIG_SLUB |
186 | { | 165 | #include <linux/slub_def.h> |
187 | return __kzalloc(size, flags); | 166 | #elif defined(CONFIG_SLOB) |
188 | } | 167 | #include <linux/slob_def.h> |
168 | #else | ||
169 | #include <linux/slab_def.h> | ||
189 | #endif | 170 | #endif |
190 | 171 | ||
191 | #ifndef CONFIG_NUMA | 172 | #if !defined(CONFIG_NUMA) && !defined(CONFIG_SLOB) |
173 | /** | ||
174 | * kmalloc_node - allocate memory from a specific node | ||
175 | * @size: how many bytes of memory are required. | ||
176 | * @flags: the type of memory to allocate (see kcalloc). | ||
177 | * @node: node to allocate from. | ||
178 | * | ||
179 | * kmalloc() for non-local nodes, used to allocate from a specific node | ||
180 | * if available. Equivalent to kmalloc() in the non-NUMA single-node | ||
181 | * case. | ||
182 | */ | ||
192 | static inline void *kmalloc_node(size_t size, gfp_t flags, int node) | 183 | static inline void *kmalloc_node(size_t size, gfp_t flags, int node) |
193 | { | 184 | { |
194 | return kmalloc(size, flags); | 185 | return kmalloc(size, flags); |
@@ -198,7 +189,15 @@ static inline void *__kmalloc_node(size_t size, gfp_t flags, int node) | |||
198 | { | 189 | { |
199 | return __kmalloc(size, flags); | 190 | return __kmalloc(size, flags); |
200 | } | 191 | } |
201 | #endif /* !CONFIG_NUMA */ | 192 | |
193 | void *kmem_cache_alloc(struct kmem_cache *, gfp_t); | ||
194 | |||
195 | static inline void *kmem_cache_alloc_node(struct kmem_cache *cachep, | ||
196 | gfp_t flags, int node) | ||
197 | { | ||
198 | return kmem_cache_alloc(cachep, flags); | ||
199 | } | ||
200 | #endif /* !CONFIG_NUMA && !CONFIG_SLOB */ | ||
202 | 201 | ||
203 | /* | 202 | /* |
204 | * kmalloc_track_caller is a special version of kmalloc that records the | 203 | * kmalloc_track_caller is a special version of kmalloc that records the |
@@ -245,4 +244,3 @@ extern void *__kmalloc_node_track_caller(size_t, gfp_t, int, void *); | |||
245 | 244 | ||
246 | #endif /* __KERNEL__ */ | 245 | #endif /* __KERNEL__ */ |
247 | #endif /* _LINUX_SLAB_H */ | 246 | #endif /* _LINUX_SLAB_H */ |
248 | |||