1 files changed, 64 insertions, 3 deletions
diff --git a/arch/x86/mm/gup.c b/arch/x86/mm/gup.c
index 6340cef6798a..71da1bca13cb 100644
--- a/arch/x86/mm/gup.c
+++ b/arch/x86/mm/gup.c
@@ -14,7 +14,7 @@
 static inline pte_t gup_get_pte(pte_t *ptep)
 {
 #ifndef CONFIG_X86_PAE
-        return *ptep;
+        return ACCESS_ONCE(*ptep);
 #else
        /*
         * With get_user_pages_fast, we walk down the pagetables without taking
@@ -219,6 +219,62 @@ static int gup_pud_range(pgd_t pgd, unsigned long addr, unsigned long end,
        return 1;
 }
+/*
+ * Like get_user_pages_fast() except its IRQ-safe in that it won't fall
+ * back to the regular GUP.
+ */
+int __get_user_pages_fast(unsigned long start, int nr_pages, int write,
+                          struct page **pages)
+{
+        struct mm_struct *mm = current->mm;
+        unsigned long addr, len, end;
+        unsigned long next;
+        unsigned long flags;
+        pgd_t *pgdp;
+        int nr = 0;
+        start &= PAGE_MASK;
+        addr = start;
+        len = (unsigned long) nr_pages << PAGE_SHIFT;
+        end = start + len;
+        if (unlikely(!access_ok(write ? VERIFY_WRITE : VERIFY_READ,
+                                        (void __user *)start, len)))
+                return 0;
+        /*
+         * XXX: batch / limit 'nr', to avoid large irq off latency
+         * needs some instrumenting to determine the common sizes used by
+         * important workloads (eg. DB2), and whether limiting the batch size
+         * will decrease performance.
+         *
+         * It seems like we're in the clear for the moment. Direct-IO is
+         * the main guy that batches up lots of get_user_pages, and even
+         * they are limited to 64-at-a-time which is not so many.
+         */
+        /*
+         * This doesn't prevent pagetable teardown, but does prevent
+         * the pagetables and pages from being freed on x86.
+         *
+         * So long as we atomically load page table pointers versus teardown
+         * (which we do on x86, with the above PAE exception), we can follow the
+         * address down to the the page and take a ref on it.
+         */
+        local_irq_save(flags);
+        pgdp = pgd_offset(mm, addr);
+        do {
+                pgd_t pgd = *pgdp;
+                next = pgd_addr_end(addr, end);
+                if (pgd_none(pgd))
+                        break;
+                if (!gup_pud_range(pgd, addr, next, write, pages, &nr))
+                        break;
+        } while (pgdp++, addr = next, addr != end);
+        local_irq_restore(flags);
+        return nr;
+}
 /**
 * get_user_pages_fast() - pin user pages in memory
 * @start:      starting user address
@@ -247,11 +303,16 @@ int get_user_pages_fast(unsigned long start, int nr_pages, int write,
        start &= PAGE_MASK;
        addr = start;
        len = (unsigned long) nr_pages << PAGE_SHIFT;
        end = start + len;
-        if (unlikely(!access_ok(write ? VERIFY_WRITE : VERIFY_READ,
+        if (end < start)
-                                        (void __user *)start, len)))
                goto slow_irqon;
+#ifdef CONFIG_X86_64
+        if (end >> __VIRTUAL_MASK_SHIFT)
+                goto slow_irqon;
+#endif
        /*
         * XXX: batch / limit 'nr', to avoid large irq off latency
         * needs some instrumenting to determine the common sizes used by

diff --git a/arch/x86/mm/gup.c b/arch/x86/mm/gup.c index 6340cef6798a..71da1bca13cb 100644 --- a/arch/x86/mm/gup.c +++ b/arch/x86/mm/gup.c
@@ -14,7 +14,7 @@
14	static inline pte_t gup_get_pte(pte_t *ptep)	14	static inline pte_t gup_get_pte(pte_t *ptep)
15	{	15	{
16	#ifndef CONFIG_X86_PAE	16	#ifndef CONFIG_X86_PAE
17	return *ptep;	17	return ACCESS_ONCE(*ptep);
18	#else	18	#else
19	/*	19	/*
20	* With get_user_pages_fast, we walk down the pagetables without taking	20	* With get_user_pages_fast, we walk down the pagetables without taking
@@ -219,6 +219,62 @@ static int gup_pud_range(pgd_t pgd, unsigned long addr, unsigned long end,
219	return 1;	219	return 1;
220	}	220	}
221		221
		222	/*
		223	* Like get_user_pages_fast() except its IRQ-safe in that it won't fall
		224	* back to the regular GUP.
		225	*/
		226	int __get_user_pages_fast(unsigned long start, int nr_pages, int write,
		227	struct page **pages)
		228	{
		229	struct mm_struct *mm = current->mm;
		230	unsigned long addr, len, end;
		231	unsigned long next;
		232	unsigned long flags;
		233	pgd_t *pgdp;
		234	int nr = 0;
		235
		236	start &= PAGE_MASK;
		237	addr = start;
		238	len = (unsigned long) nr_pages << PAGE_SHIFT;
		239	end = start + len;
		240	if (unlikely(!access_ok(write ? VERIFY_WRITE : VERIFY_READ,
		241	(void __user *)start, len)))
		242	return 0;
		243
		244	/*
		245	* XXX: batch / limit 'nr', to avoid large irq off latency
		246	* needs some instrumenting to determine the common sizes used by
		247	* important workloads (eg. DB2), and whether limiting the batch size
		248	* will decrease performance.
		249	*
		250	* It seems like we're in the clear for the moment. Direct-IO is
		251	* the main guy that batches up lots of get_user_pages, and even
		252	* they are limited to 64-at-a-time which is not so many.
		253	*/
		254	/*
		255	* This doesn't prevent pagetable teardown, but does prevent
		256	* the pagetables and pages from being freed on x86.
		257	*
		258	* So long as we atomically load page table pointers versus teardown
		259	* (which we do on x86, with the above PAE exception), we can follow the
		260	* address down to the the page and take a ref on it.
		261	*/
		262	local_irq_save(flags);
		263	pgdp = pgd_offset(mm, addr);
		264	do {
		265	pgd_t pgd = *pgdp;
		266
		267	next = pgd_addr_end(addr, end);
		268	if (pgd_none(pgd))
		269	break;
		270	if (!gup_pud_range(pgd, addr, next, write, pages, &nr))
		271	break;
		272	} while (pgdp++, addr = next, addr != end);
		273	local_irq_restore(flags);
		274
		275	return nr;
		276	}
		277
222	/**	278	/**
223	* get_user_pages_fast() - pin user pages in memory	279	* get_user_pages_fast() - pin user pages in memory
224	* @start: starting user address	280	* @start: starting user address
@@ -247,11 +303,16 @@ int get_user_pages_fast(unsigned long start, int nr_pages, int write,
247	start &= PAGE_MASK;	303	start &= PAGE_MASK;
248	addr = start;	304	addr = start;
249	len = (unsigned long) nr_pages << PAGE_SHIFT;	305	len = (unsigned long) nr_pages << PAGE_SHIFT;
		306
250	end = start + len;	307	end = start + len;
251	if (unlikely(!access_ok(write ? VERIFY_WRITE : VERIFY_READ,	308	if (end < start)
252	(void __user *)start, len)))
253	goto slow_irqon;	309	goto slow_irqon;
254		310
		311	#ifdef CONFIG_X86_64
		312	if (end >> __VIRTUAL_MASK_SHIFT)
		313	goto slow_irqon;
		314	#endif
		315
255	/*	316	/*
256	* XXX: batch / limit 'nr', to avoid large irq off latency	317	* XXX: batch / limit 'nr', to avoid large irq off latency
257	* needs some instrumenting to determine the common sizes used by	318	* needs some instrumenting to determine the common sizes used by