path: root/include/linux/memcontrol.h
author     Linus Torvalds <torvalds@linux-foundation.org>    2012-12-18 18:08:12 -0500
committer  Linus Torvalds <torvalds@linux-foundation.org>    2012-12-18 18:08:12 -0500
commit     673ab8783b596cda5b616b317b1a1b47480c66fd (patch)
tree       d3fc9bb4279720c53d0dc69c2a34c40635cf05f3 /include/linux/memcontrol.h
parent     d7b96ca5d08a8f2f836feb2b3b3bd721d2837a8e (diff)
parent     3cf23841b4b76eb94d3f8d0fb3627690e4431413 (diff)
Merge branch 'akpm' (more patches from Andrew)
Merge patches from Andrew Morton:
 "Most of the rest of MM, plus a few dribs and drabs. I still have quite
  a few irritating patches left around: ones with dubious testing results,
  lack of review, ones which should have gone via maintainer trees but the
  maintainers are slack, etc. I need to be more activist in getting these
  things wrapped up outside the merge window, but they're such a PITA."

* emailed patches from Andrew Morton <akpm@linux-foundation.org>: (48 commits)
  mm/vmscan.c: avoid possible deadlock caused by too_many_isolated()
  vmscan: comment too_many_isolated()
  mm/kmemleak.c: remove obsolete simple_strtoul
  mm/memory_hotplug.c: improve comments
  mm/hugetlb: create hugetlb cgroup file in hugetlb_init
  mm/mprotect.c: coding-style cleanups
  Documentation: ABI: /sys/devices/system/node/
  slub: drop mutex before deleting sysfs entry
  memcg: add comments clarifying aspects of cache attribute propagation
  kmem: add slab-specific documentation about the kmem controller
  slub: slub-specific propagation changes
  slab: propagate tunable values
  memcg: aggregate memcg cache values in slabinfo
  memcg/sl[au]b: shrink dead caches
  memcg/sl[au]b: track all the memcg children of a kmem_cache
  memcg: destroy memcg caches
  sl[au]b: allocate objects from memcg cache
  sl[au]b: always get the cache from its page in kmem_cache_free()
  memcg: skip memcg kmem allocations in specified code regions
  memcg: infrastructure to match an allocation to the right cache
  ...
Diffstat (limited to 'include/linux/memcontrol.h')
-rw-r--r--    include/linux/memcontrol.h    209
1 file changed, 209 insertions, 0 deletions
diff --git a/include/linux/memcontrol.h b/include/linux/memcontrol.h
index e98a74c0c9c0..0108a56f814e 100644
--- a/include/linux/memcontrol.h
+++ b/include/linux/memcontrol.h
@@ -21,11 +21,14 @@
 #define _LINUX_MEMCONTROL_H
 #include <linux/cgroup.h>
 #include <linux/vm_event_item.h>
+#include <linux/hardirq.h>
+#include <linux/jump_label.h>
 
 struct mem_cgroup;
 struct page_cgroup;
 struct page;
 struct mm_struct;
+struct kmem_cache;
 
 /* Stats that can be updated by kernel. */
 enum mem_cgroup_page_stat_item {
@@ -414,5 +417,211 @@ static inline void sock_release_memcg(struct sock *sk)
 {
 }
 #endif /* CONFIG_INET && CONFIG_MEMCG_KMEM */
+
+#ifdef CONFIG_MEMCG_KMEM
+extern struct static_key memcg_kmem_enabled_key;
+
+extern int memcg_limited_groups_array_size;
+
+/*
+ * Helper macro to loop through all memcg-specific caches. Callers must still
+ * check if the cache is valid (it is either valid or NULL).
+ * The slab_mutex must be held when looping through those caches.
+ */
+#define for_each_memcg_cache_index(_idx) \
+        for ((_idx) = 0; (_idx) < memcg_limited_groups_array_size; (_idx)++)
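
For illustration only (not part of this patch), a minimal sketch of iterating the per-memcg children of a root cache with this macro; the cache_from_memcg() lookup helper and direct use of the slab-internal slab_mutex are assumptions for this example, not declarations from this header:

static void example_walk_memcg_caches(struct kmem_cache *root)
{
        int i;

        mutex_lock(&slab_mutex);                /* must be held while iterating */
        for_each_memcg_cache_index(i) {
                /* cache_from_memcg() is an assumed lookup helper in the slab code */
                struct kmem_cache *c = cache_from_memcg(root, i);

                if (!c)                         /* the slot may still be NULL */
                        continue;
                /* ... inspect or tune the child cache here ... */
        }
        mutex_unlock(&slab_mutex);
}
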
+
+static inline bool memcg_kmem_enabled(void)
+{
+        return static_key_false(&memcg_kmem_enabled_key);
+}
+
+/*
+ * In general, we'll do everything in our power to not incur any overhead
+ * for non-memcg users of the kmem functions. Not even a function call, if we
+ * can avoid it.
+ *
+ * Therefore, we'll inline all those functions so that in the best case, we'll
+ * see that kmemcg is off for everybody and proceed quickly. If it is on,
+ * we'll still do most of the flag checking inline. We check a lot of
+ * conditions, but because they are pretty simple, they are expected to be
+ * fast.
+ */
+bool __memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg,
+                                 int order);
+void __memcg_kmem_commit_charge(struct page *page,
+                                struct mem_cgroup *memcg, int order);
+void __memcg_kmem_uncharge_pages(struct page *page, int order);
+
+int memcg_cache_id(struct mem_cgroup *memcg);
+int memcg_register_cache(struct mem_cgroup *memcg, struct kmem_cache *s,
+                         struct kmem_cache *root_cache);
+void memcg_release_cache(struct kmem_cache *cachep);
+void memcg_cache_list_add(struct mem_cgroup *memcg, struct kmem_cache *cachep);
+
+int memcg_update_cache_size(struct kmem_cache *s, int num_groups);
+void memcg_update_array_size(int num_groups);
+
+struct kmem_cache *
+__memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp);
+
+void mem_cgroup_destroy_cache(struct kmem_cache *cachep);
+void kmem_cache_destroy_memcg_children(struct kmem_cache *s);
+
+/**
+ * memcg_kmem_newpage_charge: verify if a new kmem allocation is allowed.
+ * @gfp: the gfp allocation flags.
+ * @memcg: a pointer to the memcg this was charged against.
+ * @order: allocation order.
+ *
+ * Returns true if the memcg to which the current task belongs can hold this
+ * allocation.
+ *
+ * We return true automatically if this allocation is not to be accounted to
+ * any memcg.
+ */
+static inline bool
+memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
+{
+        if (!memcg_kmem_enabled())
+                return true;
+
+        /*
+         * __GFP_NOFAIL allocations will move on even if charging is not
+         * possible. Therefore we don't even try, and have this allocation
+         * unaccounted. We could in theory charge it with
+         * res_counter_charge_nofail, but we hope those allocations are rare,
+         * and won't be worth the trouble.
+         */
+        if (!(gfp & __GFP_KMEMCG) || (gfp & __GFP_NOFAIL))
+                return true;
+        if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
+                return true;
+
+        /* If the task is dying, just let it go. */
+        if (unlikely(fatal_signal_pending(current)))
+                return true;
+
+        return __memcg_kmem_newpage_charge(gfp, memcg, order);
+}
+
+/**
+ * memcg_kmem_uncharge_pages: uncharge pages from memcg
+ * @page: pointer to struct page being freed
+ * @order: allocation order.
+ *
+ * There is no need to specify the memcg here, since it is embedded in the
+ * page_cgroup.
+ */
+static inline void
+memcg_kmem_uncharge_pages(struct page *page, int order)
+{
+        if (memcg_kmem_enabled())
+                __memcg_kmem_uncharge_pages(page, order);
+}
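
For illustration only (not part of this patch), a sketch of the matching free path, pairing the uncharge with the actual page free; free_accounted_pages_example() is a hypothetical wrapper, not something declared in this header:

static void free_accounted_pages_example(struct page *page, unsigned int order)
{
        /* No-op unless kmemcg accounting is enabled and the page was charged. */
        memcg_kmem_uncharge_pages(page, order);
        __free_pages(page, order);
}
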
+
+/**
+ * memcg_kmem_commit_charge: embeds correct memcg in a page
+ * @page: pointer to struct page recently allocated
+ * @memcg: the memcg structure we charged against
+ * @order: allocation order.
+ *
+ * Needs to be called after memcg_kmem_newpage_charge, regardless of success or
+ * failure of the allocation. If @page is NULL, this function will revert the
+ * charges. Otherwise, it will commit the memcg given by @memcg to the
+ * corresponding page_cgroup.
+ */
+static inline void
+memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
+{
+        if (memcg_kmem_enabled() && memcg)
+                __memcg_kmem_commit_charge(page, memcg, order);
+}
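
For illustration only (not part of this patch), a sketch of the allocation side, pairing memcg_kmem_newpage_charge() with memcg_kmem_commit_charge() around the actual page allocation; alloc_accounted_pages_example() is a hypothetical wrapper, and the real call sites live in the page allocator rather than in this header:

static struct page *alloc_accounted_pages_example(gfp_t gfp, unsigned int order)
{
        struct mem_cgroup *memcg = NULL;
        struct page *page;

        /* Returns true immediately when the allocation needs no accounting. */
        if (!memcg_kmem_newpage_charge(gfp, &memcg, order))
                return NULL;            /* the charge was refused: fail early */

        page = alloc_pages(gfp, order);

        /* Commit the charge to @page, or revert it if the allocation failed. */
        memcg_kmem_commit_charge(page, memcg, order);
        return page;
}
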
+
+/**
+ * memcg_kmem_get_cache: selects the correct per-memcg cache for allocation
+ * @cachep: the original global kmem cache
+ * @gfp: allocation flags.
+ *
+ * This function assumes that the task allocating, which determines the memcg
+ * in the page allocator, belongs to the same cgroup throughout the whole
+ * process. Misaccounting can happen if the task calls memcg_kmem_get_cache()
+ * while belonging to a cgroup and later changes cgroups. This is considered
+ * acceptable, and should only happen upon task migration.
+ *
+ * Before the cache is created by the memcg core, there is also a possible
+ * imbalance: the task belongs to a memcg, but the cache being allocated from
+ * is the global cache, since the child cache is not yet guaranteed to be
+ * ready. This case is also fine, since in this case __GFP_KMEMCG will not be
+ * passed and the page allocator will not attempt any cgroup accounting.
+ */
+static __always_inline struct kmem_cache *
+memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
+{
+        if (!memcg_kmem_enabled())
+                return cachep;
+        if (gfp & __GFP_NOFAIL)
+                return cachep;
+        if (in_interrupt() || (!current->mm) || (current->flags & PF_KTHREAD))
+                return cachep;
+        if (unlikely(fatal_signal_pending(current)))
+                return cachep;
+
+        return __memcg_kmem_get_cache(cachep, gfp);
+}
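
For illustration only (not part of this patch), a sketch of how a slab allocation entry point might route through memcg_kmem_get_cache() before allocating; example_kmalloc_from_cache() is a hypothetical wrapper, and kmem_cache_alloc() stands in for the allocator-internal fast path used by the real slab code:

static void *example_kmalloc_from_cache(struct kmem_cache *cachep, gfp_t gfp)
{
        /*
         * Swap in the current task's per-memcg copy of the cache when kmemcg
         * is enabled; otherwise this returns the original cache unchanged.
         */
        cachep = memcg_kmem_get_cache(cachep, gfp);

        return kmem_cache_alloc(cachep, gfp);
}
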
+#else
+#define for_each_memcg_cache_index(_idx) \
+        for (; NULL; )
+
+static inline bool memcg_kmem_enabled(void)
+{
+        return false;
+}
+
+static inline bool
+memcg_kmem_newpage_charge(gfp_t gfp, struct mem_cgroup **memcg, int order)
+{
+        return true;
+}
+
+static inline void memcg_kmem_uncharge_pages(struct page *page, int order)
+{
+}
+
+static inline void
+memcg_kmem_commit_charge(struct page *page, struct mem_cgroup *memcg, int order)
+{
+}
+
+static inline int memcg_cache_id(struct mem_cgroup *memcg)
+{
+        return -1;
+}
+
+static inline int
+memcg_register_cache(struct mem_cgroup *memcg, struct kmem_cache *s,
+                     struct kmem_cache *root_cache)
+{
+        return 0;
+}
+
+static inline void memcg_release_cache(struct kmem_cache *cachep)
+{
+}
+
+static inline void memcg_cache_list_add(struct mem_cgroup *memcg,
+                                        struct kmem_cache *s)
+{
+}
+
+static inline struct kmem_cache *
+memcg_kmem_get_cache(struct kmem_cache *cachep, gfp_t gfp)
+{
+        return cachep;
+}
+
+static inline void kmem_cache_destroy_memcg_children(struct kmem_cache *s)
+{
+}
+#endif /* CONFIG_MEMCG_KMEM */
 #endif /* _LINUX_MEMCONTROL_H */
 