author     Peter Zijlstra <a.p.zijlstra@chello.nl>          2011-05-24 20:12:01 -0400
committer  Linus Torvalds <torvalds@linux-foundation.org>   2011-05-25 11:39:16 -0400
commit     e303297e6c3a7b847c4731eb14006ca6b435ecca
tree       c2bbec8fb0cad1405f4a3ff908cd1d22abcd3e77 /include/asm-generic
parent     267239116987d64850ad2037d8e0f3071dc3b5ce
mm: extended batches for generic mmu_gather
Instead of using a single batch (the small on-stack array, or an allocated page), try to extend the batch every time it runs out, and only flush once the extension fails or we're done.
Signed-off-by: Peter Zijlstra <a.p.zijlstra@chello.nl>
Requested-by: Nick Piggin <npiggin@kernel.dk>
Reviewed-by: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Acked-by: Hugh Dickins <hughd@google.com>
Cc: Benjamin Herrenschmidt <benh@kernel.crashing.org>
Cc: David Miller <davem@davemloft.net>
Cc: Martin Schwidefsky <schwidefsky@de.ibm.com>
Cc: Russell King <rmk@arm.linux.org.uk>
Cc: Paul Mundt <lethal@linux-sh.org>
Cc: Jeff Dike <jdike@addtoit.com>
Cc: Richard Weinberger <richard@nod.at>
Cc: Tony Luck <tony.luck@intel.com>
Cc: Mel Gorman <mel@csn.ul.ie>
Cc: KOSAKI Motohiro <kosaki.motohiro@jp.fujitsu.com>
Cc: Nick Piggin <npiggin@kernel.dk>
Cc: Namhyung Kim <namhyung@gmail.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
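
The data structure at the heart of the change is small enough to model on its own. Below is a hedged, user-space sketch of the chained-batch extension that the patch's tlb_next_batch() implements; struct batch, next_batch(), and the capacity of 64 are illustrative stand-ins, not kernel identifiers. For scale, the kernel sizes each batch to a whole page, so MAX_GATHER_BATCH works out to roughly (4096 - 16) / 8 = 510 page pointers per batch on a typical 64-bit configuration with 4 KiB pages.

```c
#include <stdlib.h>

/* Illustrative stand-in for struct mmu_gather_batch; the kernel version
 * ends in a flexible array sized to fill the rest of a page. */
struct batch {
	struct batch *next;
	unsigned int nr;	/* pages queued so far */
	unsigned int max;	/* capacity of pages[] */
	void *pages[64];	/* fixed capacity, for the sketch only */
};

/*
 * Model of tlb_next_batch(): first reuse a batch already chained from a
 * previous gather/flush cycle, otherwise try to allocate a fresh one.
 * Returns 0 on allocation failure, which tells the caller to flush now
 * rather than extend further.
 */
static int next_batch(struct batch **active)
{
	struct batch *b = *active;

	if (b->next) {			/* left over from an earlier cycle */
		*active = b->next;
		return 1;
	}

	b = malloc(sizeof(*b));		/* kernel: __get_free_pages(GFP_NOWAIT) */
	if (!b)
		return 0;

	b->next = NULL;
	b->nr = 0;
	b->max = 64;

	(*active)->next = b;		/* extend the chain, make it current */
	*active = b;
	return 1;
}
```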
Diffstat (limited to 'include/asm-generic'):

 -rw-r--r--  include/asm-generic/tlb.h | 129
 1 file changed, 83 insertions(+), 46 deletions(-)
```diff
diff --git a/include/asm-generic/tlb.h b/include/asm-generic/tlb.h
index 74f80f6b6cf1..5a946a08ff9d 100644
--- a/include/asm-generic/tlb.h
+++ b/include/asm-generic/tlb.h
@@ -19,16 +19,6 @@
 #include <asm/pgalloc.h>
 #include <asm/tlbflush.h>
 
-/*
- * For UP we don't need to worry about TLB flush
- * and page free order so much..
- */
-#ifdef CONFIG_SMP
-  #define tlb_fast_mode(tlb) ((tlb)->nr == ~0U)
-#else
-  #define tlb_fast_mode(tlb) 1
-#endif
-
 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
 /*
  * Semi RCU freeing of the page directories.
@@ -78,6 +68,16 @@ extern void tlb_remove_table(struct mmu_gather *tlb, void *table);
  */
 #define MMU_GATHER_BUNDLE	8
 
+struct mmu_gather_batch {
+	struct mmu_gather_batch	*next;
+	unsigned int		nr;
+	unsigned int		max;
+	struct page		*pages[0];
+};
+
+#define MAX_GATHER_BATCH	\
+	((PAGE_SIZE - sizeof(struct mmu_gather_batch)) / sizeof(void *))
+
 /* struct mmu_gather is an opaque type used by the mm code for passing around
  * any data needed by arch specific code for tlb_remove_page.
  */
@@ -86,22 +86,48 @@ struct mmu_gather {
 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
 	struct mmu_table_batch	*batch;
 #endif
-	unsigned int		nr;	/* set to ~0U means fast mode */
-	unsigned int		max;	/* nr < max */
-	unsigned int		need_flush;/* Really unmapped some ptes? */
-	unsigned int		fullmm; /* non-zero means full mm flush */
-	struct page		**pages;
-	struct page		*local[MMU_GATHER_BUNDLE];
+	unsigned int		need_flush : 1,	/* Did free PTEs */
+				fast_mode  : 1; /* No batching */
+
+	unsigned int		fullmm;
+
+	struct mmu_gather_batch *active;
+	struct mmu_gather_batch	local;
+	struct page		*__pages[MMU_GATHER_BUNDLE];
 };
 
-static inline void __tlb_alloc_page(struct mmu_gather *tlb)
+/*
+ * For UP we don't need to worry about TLB flush
+ * and page free order so much..
+ */
+#ifdef CONFIG_SMP
+  #define tlb_fast_mode(tlb) (tlb->fast_mode)
+#else
+  #define tlb_fast_mode(tlb) 1
+#endif
+
+static inline int tlb_next_batch(struct mmu_gather *tlb)
 {
-	unsigned long addr = __get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);
+	struct mmu_gather_batch *batch;
 
-	if (addr) {
-		tlb->pages = (void *)addr;
-		tlb->max = PAGE_SIZE / sizeof(struct page *);
+	batch = tlb->active;
+	if (batch->next) {
+		tlb->active = batch->next;
+		return 1;
 	}
+
+	batch = (void *)__get_free_pages(GFP_NOWAIT | __GFP_NOWARN, 0);
+	if (!batch)
+		return 0;
+
+	batch->next = NULL;
+	batch->nr   = 0;
+	batch->max  = MAX_GATHER_BATCH;
+
+	tlb->active->next = batch;
+	tlb->active = batch;
+
+	return 1;
 }
 
 /* tlb_gather_mmu
@@ -114,16 +140,13 @@ tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, bool fullmm)
 {
 	tlb->mm = mm;
 
-	tlb->max = ARRAY_SIZE(tlb->local);
-	tlb->pages = tlb->local;
-
-	if (num_online_cpus() > 1) {
-		tlb->nr = 0;
-		__tlb_alloc_page(tlb);
-	} else /* Use fast mode if only one CPU is online */
-		tlb->nr = ~0U;
-
-	tlb->fullmm = fullmm;
+	tlb->fullmm     = fullmm;
+	tlb->need_flush = 0;
+	tlb->fast_mode  = (num_possible_cpus() == 1);
+	tlb->local.next = NULL;
+	tlb->local.nr   = 0;
+	tlb->local.max  = ARRAY_SIZE(tlb->__pages);
+	tlb->active     = &tlb->local;
 
 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
 	tlb->batch = NULL;
@@ -133,6 +156,8 @@ tlb_gather_mmu(struct mmu_gather *tlb, struct mm_struct *mm, bool fullmm)
 static inline void
 tlb_flush_mmu(struct mmu_gather *tlb)
 {
+	struct mmu_gather_batch *batch;
+
 	if (!tlb->need_flush)
 		return;
 	tlb->need_flush = 0;
@@ -140,17 +165,15 @@ tlb_flush_mmu(struct mmu_gather *tlb)
 #ifdef CONFIG_HAVE_RCU_TABLE_FREE
 	tlb_table_flush(tlb);
 #endif
-	if (!tlb_fast_mode(tlb)) {
-		free_pages_and_swap_cache(tlb->pages, tlb->nr);
-		tlb->nr = 0;
-		/*
-		 * If we are using the local on-stack array of pages for MMU
-		 * gather, try allocating an off-stack array again as we have
-		 * recently freed pages.
-		 */
-		if (tlb->pages == tlb->local)
-			__tlb_alloc_page(tlb);
+
+	if (tlb_fast_mode(tlb))
+		return;
+
+	for (batch = &tlb->local; batch; batch = batch->next) {
+		free_pages_and_swap_cache(batch->pages, batch->nr);
+		batch->nr = 0;
 	}
+	tlb->active = &tlb->local;
 }
 
 /* tlb_finish_mmu
@@ -160,13 +183,18 @@ tlb_flush_mmu(struct mmu_gather *tlb)
 static inline void
 tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
 {
+	struct mmu_gather_batch *batch, *next;
+
 	tlb_flush_mmu(tlb);
 
 	/* keep the page table cache within bounds */
 	check_pgt_cache();
 
-	if (tlb->pages != tlb->local)
-		free_pages((unsigned long)tlb->pages, 0);
+	for (batch = tlb->local.next; batch; batch = next) {
+		next = batch->next;
+		free_pages((unsigned long)batch, 0);
+	}
+	tlb->local.next = NULL;
 }
 
 /* __tlb_remove_page
@@ -177,15 +205,24 @@ tlb_finish_mmu(struct mmu_gather *tlb, unsigned long start, unsigned long end)
  */
 static inline int __tlb_remove_page(struct mmu_gather *tlb, struct page *page)
 {
+	struct mmu_gather_batch *batch;
+
 	tlb->need_flush = 1;
+
 	if (tlb_fast_mode(tlb)) {
 		free_page_and_swap_cache(page);
 		return 1; /* avoid calling tlb_flush_mmu() */
 	}
-	tlb->pages[tlb->nr++] = page;
-	VM_BUG_ON(tlb->nr > tlb->max);
 
-	return tlb->max - tlb->nr;
+	batch = tlb->active;
+	batch->pages[batch->nr++] = page;
+	VM_BUG_ON(batch->nr > batch->max);
+	if (batch->nr == batch->max) {
+		if (!tlb_next_batch(tlb))
+			return 0;
+	}
+
+	return batch->max - batch->nr;
 }
 
 /* tlb_remove_page
```
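
For context, here is a hedged sketch of how a caller drives this API after the patch. tlb_gather_mmu(), __tlb_remove_page(), tlb_flush_mmu(), and tlb_finish_mmu() are the functions from the diff above; unmap_one_sketch() and unmap_range_sketch() are hypothetical stand-ins for the real pte walk in the unmap path, not kernel code.

```c
#include <asm-generic/tlb.h>

/* Hypothetical helper: clears the pte at addr and returns the page that
 * backed it, or NULL if none was present. Stands in for the pte walk. */
static struct page *unmap_one_sketch(struct mm_struct *mm, unsigned long addr);

static void unmap_range_sketch(struct mm_struct *mm,
			       unsigned long start, unsigned long end)
{
	struct mmu_gather tlb;
	unsigned long addr;
	struct page *page;

	tlb_gather_mmu(&tlb, mm, false);	/* partial unmap, not full-mm */

	for (addr = start; addr < end; addr += PAGE_SIZE) {
		page = unmap_one_sketch(mm, addr);
		if (!page)
			continue;
		/*
		 * __tlb_remove_page() queues the page and returns the room
		 * left in the (possibly freshly extended) active batch; 0
		 * means the extension failed, so flush before queueing more.
		 */
		if (!__tlb_remove_page(&tlb, page))
			tlb_flush_mmu(&tlb);
	}

	tlb_finish_mmu(&tlb, start, end);	/* final flush, frees the chain */
}
```

This queue-then-flush-on-zero pattern is what the header's tlb_remove_page() wrapper (which follows the shown region) encodes; the difference after the patch is that a return of 0 now means "batch extension failed" rather than "the single batch is full".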