2 files changed, 420 insertions, 0 deletions
diff --git a/arch/powerpc/lib/Makefile b/arch/powerpc/lib/Makefile
index a0360ae10d0c..e2d414160c83 100644
--- a/arch/powerpc/lib/Makefile
+++ b/arch/powerpc/lib/Makefile
@@ -16,6 +16,7 @@ obj-$(CONFIG_PPC64)	+= checksum_64.o copypage_64.o copyuser_64.o \
                           strcase.o
 obj-$(CONFIG_QUICC_ENGINE) += rheap.o
 obj-$(CONFIG_XMON)      += sstep.o
+obj-$(CONFIG_NOT_COHERENT_CACHE)        += dma-noncoherent.o
 ifeq ($(CONFIG_PPC64),y)
 obj-$(CONFIG_SMP)       += locks.o
@@ -24,5 +25,6 @@ endif
 # Temporary hack until we have migrated to asm-powerpc
 ifeq ($(CONFIG_PPC_MERGE),y)
+obj-$(CONFIG_8xx)       += rheap.o
 obj-$(CONFIG_CPM2)      += rheap.o
 endif
diff --git a/arch/powerpc/lib/dma-noncoherent.c b/arch/powerpc/lib/dma-noncoherent.c
new file mode 100644
index 000000000000..48f3d13a3de5
--- /dev/null
+++ b/arch/powerpc/lib/dma-noncoherent.c
@@ -0,0 +1,418 @@
+/*
+ *  PowerPC version derived from arch/arm/mm/consistent.c
+ *    Copyright (C) 2001 Dan Malek (dmalek@jlc.net)
+ *
+ *  Copyright (C) 2000 Russell King
+ *
+ * Consistent memory allocators.  Used for DMA devices that want to
+ * share uncached memory with the processor core.  The function return
+ * is the virtual address and 'dma_handle' is the physical address.
+ * Mostly stolen from the ARM port, with some changes for PowerPC.
+ *                                              -- Dan
+ *
+ * Reorganized to get rid of the arch-specific consistent_* functions
+ * and provide non-coherent implementations for the DMA API. -Matt
+ *
+ * Added in_interrupt() safe dma_alloc_coherent()/dma_free_coherent()
+ * implementation. This is pulled straight from ARM and barely
+ * modified. -Matt
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License version 2 as
+ * published by the Free Software Foundation.
+ */
+#include <linux/sched.h>
+#include <linux/kernel.h>
+#include <linux/errno.h>
+#include <linux/string.h>
+#include <linux/types.h>
+#include <linux/highmem.h>
+#include <linux/dma-mapping.h>
+#include <asm/tlbflush.h>
+/*
+ * This address range defaults to a value that is safe for all
+ * platforms which currently set CONFIG_NOT_COHERENT_CACHE. It
+ * can be further configured for specific applications under
+ * the "Advanced Setup" menu. -Matt
+ */
+#define CONSISTENT_BASE (CONFIG_CONSISTENT_START)
+#define CONSISTENT_END  (CONFIG_CONSISTENT_START + CONFIG_CONSISTENT_SIZE)
+#define CONSISTENT_OFFSET(x)    (((unsigned long)(x) - CONSISTENT_BASE) >> PAGE_SHIFT)
+/*
+ * This is the page table (2MB) covering uncached, DMA consistent allocations
+ */
+static pte_t *consistent_pte;
+static DEFINE_SPINLOCK(consistent_lock);
+/*
+ * VM region handling support.
+ *
+ * This should become something generic, handling VM region allocations for
+ * vmalloc and similar (ioremap, module space, etc).
+ *
+ * I envisage vmalloc()'s supporting vm_struct becoming:
+ *
+ *  struct vm_struct {
+ *    struct vm_region  region;
+ *    unsigned long     flags;
+ *    struct page       **pages;
+ *    unsigned int      nr_pages;
+ *    unsigned long     phys_addr;
+ *  };
+ *
+ * get_vm_area() would then call vm_region_alloc with an appropriate
+ * struct vm_region head (eg):
+ *
+ *  struct vm_region vmalloc_head = {
+ *      .vm_list        = LIST_HEAD_INIT(vmalloc_head.vm_list),
+ *      .vm_start       = VMALLOC_START,
+ *      .vm_end         = VMALLOC_END,
+ *  };
+ *
+ * However, vmalloc_head.vm_start is variable (typically, it is dependent on
+ * the amount of RAM found at boot time.)  I would imagine that get_vm_area()
+ * would have to initialise this each time prior to calling vm_region_alloc().
+ */
+/*
+ * One address range tracked by the region allocator. The same structure is
+ * used both for the list head describing the whole managed window and for
+ * each individual allocation linked on that head's vm_list.
+ */
+struct vm_region {
+        /* Link in the owning head's list (or the list anchor, for a head). */
+        struct list_head        vm_list;
+        /* First address of the range. */
+        unsigned long           vm_start;
+        /* End of the range; vm_region_alloc() sets it to vm_start + size. */
+        unsigned long           vm_end;
+};
+/*
+ * Head of the consistent-mapping window: spans CONSISTENT_BASE up to
+ * CONSISTENT_END and starts out with an empty allocation list.
+ */
+static struct vm_region consistent_head = {
+        .vm_list        = LIST_HEAD_INIT(consistent_head.vm_list),
+        .vm_start       = CONSISTENT_BASE,
+        .vm_end         = CONSISTENT_END,
+};
+/*
+ * Reserve a 'size'-byte address range inside the window described by 'head'.
+ *
+ * The search is first-fit over head->vm_list. New entries are always linked
+ * in front of the entry that follows the chosen gap, so the list stays in
+ * ascending address order. The list is walked and modified with
+ * consistent_lock held and interrupts disabled.
+ *
+ * head: window to allocate from (vm_start/vm_end bound the search).
+ * size: number of bytes to reserve.
+ * gfp:  flags handed to kmalloc() for the tracking structure.
+ *
+ * Returns the new tracking structure, or NULL when the request cannot fit
+ * or the tracking structure cannot be allocated.
+ */
+static struct vm_region *
+vm_region_alloc(struct vm_region *head, size_t size, gfp_t gfp)
+{
+        unsigned long addr = head->vm_start, end;
+        unsigned long flags;
+        struct vm_region *c, *new;
+        /*
+         * A request bigger than the whole window can never fit. Reject it
+         * here instead of relying on the caller: with an empty list the
+         * loop below performs no bounds check at all, and for large sizes
+         * 'head->vm_end - size' would wrap around.
+         */
+        if (size > head->vm_end - head->vm_start)
+                goto out;
+        /* Highest start address at which 'size' bytes still fit. */
+        end = head->vm_end - size;
+        new = kmalloc(sizeof(*new), gfp);
+        if (!new)
+                goto out;
+        spin_lock_irqsave(&consistent_lock, flags);
+        list_for_each_entry(c, &head->vm_list, vm_list) {
+                /* addr + size wrapped: nothing above here can fit. */
+                if ((addr + size) < addr)
+                        goto nospc;
+                /* The gap in front of 'c' is large enough. */
+                if ((addr + size) <= c->vm_start)
+                        goto found;
+                /* Otherwise continue the search just past 'c'. */
+                addr = c->vm_end;
+                if (addr > end)
+                        goto nospc;
+        }
+        /*
+         * Falling out of the loop leaves 'c' referring to the entry that
+         * embeds the list head, so the insertion below appends at the tail.
+         */
+ found:
+        /*
+         * Insert this entry _before_ the one we found.
+         */
+        list_add_tail(&new->vm_list, &c->vm_list);
+        new->vm_start = addr;
+        new->vm_end = addr + size;
+        spin_unlock_irqrestore(&consistent_lock, flags);
+        return new;
+ nospc:
+        spin_unlock_irqrestore(&consistent_lock, flags);
+        kfree(new);
+ out:
+        return NULL;
+}
+/*
+ * Look up the allocation on head->vm_list whose vm_start equals 'addr'.
+ * Returns the matching entry, or NULL when no entry starts at that address.
+ * The function takes no lock itself.
+ */
+static struct vm_region *vm_region_find(struct vm_region *head, unsigned long addr)
+{
+        struct vm_region *region;
+        list_for_each_entry(region, &head->vm_list, vm_list) {
+                if (region->vm_start == addr)
+                        return region;
+        }
+        return NULL;
+}
+/*
+ * Allocate DMA-coherent memory space and return both the kernel remapped
+ * virtual and bus address for that space.
+ *
+ * size:   requested length in bytes; rounded up to a whole number of pages.
+ * handle: receives the bus address of the first page (page_to_bus()).
+ * gfp:    allocation flags; GFP_DMA is always added because the mask used
+ *         here is fixed at the ISA default and never equals 0xffffffff.
+ *
+ * Returns the address of the mapping inside the consistent window, or NULL
+ * if the allocator is not initialised, the size is zero or too large, or
+ * either the pages or the address range cannot be obtained.
+ */
+void *
+__dma_alloc_coherent(size_t size, dma_addr_t *handle, gfp_t gfp)
+{
+        struct page *page;
+        struct vm_region *c;
+        unsigned long order;
+        u64 mask = 0x00ffffff, limit; /* ISA default */
+        if (!consistent_pte) {
+                printk(KERN_ERR "%s: not initialised\n", __func__);
+                dump_stack();
+                return NULL;
+        }
+        size = PAGE_ALIGN(size);
+        /*
+         * Nothing to map for a zero length (or a length that wrapped to
+         * zero when page-aligned). The mapping loop below counts 'size'
+         * down by PAGE_SIZE and would wrap if it started from zero.
+         */
+        if (!size)
+                return NULL;
+        limit = (mask + 1) & ~mask;
+        if ((limit && size >= limit) || size >= (CONSISTENT_END - CONSISTENT_BASE)) {
+                printk(KERN_WARNING "coherent allocation too big (requested %#zx mask %#Lx)\n",
+                       size, (unsigned long long)mask);
+                return NULL;
+        }
+        order = get_order(size);
+        if (mask != 0xffffffff)
+                gfp |= GFP_DMA;
+        page = alloc_pages(gfp, order);
+        if (!page)
+                goto no_page;
+        /*
+         * Invalidate any data that might be lurking in the
+         * kernel direct-mapped region for device DMA.
+         */
+        {
+                unsigned long kaddr = (unsigned long)page_address(page);
+                memset(page_address(page), 0, size);
+                flush_dcache_range(kaddr, kaddr + size);
+        }
+        /*
+         * Allocate a virtual address in the consistent mapping region.
+         * The zone modifiers are stripped because these flags are only
+         * used for the small tracking structure.
+         */
+        c = vm_region_alloc(&consistent_head, size,
+                            gfp & ~(__GFP_DMA | __GFP_HIGHMEM));
+        if (c) {
+                unsigned long vaddr = c->vm_start;
+                pte_t *pte = consistent_pte + CONSISTENT_OFFSET(vaddr);
+                struct page *end = page + (1 << order);
+                /* Break the high-order block into individual pages. */
+                split_page(page, order);
+                /*
+                 * Set the "dma handle"
+                 */
+                *handle = page_to_bus(page);
+                /* Map one page per iteration with a non-cached protection. */
+                do {
+                        BUG_ON(!pte_none(*pte));
+                        SetPageReserved(page);
+                        set_pte_at(&init_mm, vaddr,
+                                   pte, mk_pte(page, pgprot_noncached(PAGE_KERNEL)));
+                        page++;
+                        pte++;
+                        vaddr += PAGE_SIZE;
+                } while (size -= PAGE_SIZE);
+                /*
+                 * Free the otherwise unused pages.
+                 */
+                while (page < end) {
+                        __free_page(page);
+                        page++;
+                }
+                return (void *)c->vm_start;
+        }
+        /* No address range available: 'page' is still one unsplit block. */
+        __free_pages(page, order);
+ no_page:
+        return NULL;
+}
+EXPORT_SYMBOL(__dma_alloc_coherent);
+/*
+ * Free a mapping previously set up in the consistent window.
+ *
+ * size:  length the caller believes the mapping has; rounded up to pages.
+ *        If it disagrees with the recorded length, an error is logged and
+ *        the recorded length is used instead.
+ * vaddr: start address of the mapping; it must equal the vm_start of a
+ *        tracked region, otherwise an error is logged and nothing is freed.
+ *
+ * The lookup, page-table teardown and list removal all run with
+ * consistent_lock held and interrupts disabled.
+ */
+void __dma_free_coherent(size_t size, void *vaddr)
+{
+        struct vm_region *c;
+        unsigned long flags, addr;
+        pte_t *ptep;
+        size = PAGE_ALIGN(size);
+        spin_lock_irqsave(&consistent_lock, flags);
+        c = vm_region_find(&consistent_head, (unsigned long)vaddr);
+        if (!c)
+                goto no_area;
+        if ((c->vm_end - c->vm_start) != size) {
+                /* %lu / %zu match the unsigned long and size_t arguments. */
+                printk(KERN_ERR "%s: freeing wrong coherent size (%lu != %zu)\n",
+                       __func__, c->vm_end - c->vm_start, size);
+                dump_stack();
+                size = c->vm_end - c->vm_start;
+        }
+        ptep = consistent_pte + CONSISTENT_OFFSET(c->vm_start);
+        addr = c->vm_start;
+        do {
+                pte_t pte = ptep_get_and_clear(&init_mm, addr, ptep);
+                unsigned long pfn;
+                ptep++;
+                addr += PAGE_SIZE;
+                if (!pte_none(pte) && pte_present(pte)) {
+                        pfn = pte_pfn(pte);
+                        if (pfn_valid(pfn)) {
+                                struct page *page = pfn_to_page(pfn);
+                                ClearPageReserved(page);
+                                __free_page(page);
+                                /* Skips the complaint; loop test still runs. */
+                                continue;
+                        }
+                }
+                printk(KERN_CRIT "%s: bad page in kernel page table\n",
+                       __func__);
+        } while (size -= PAGE_SIZE);
+        /* Flush the TLB for the range whose PTEs were just cleared. */
+        flush_tlb_kernel_range(c->vm_start, c->vm_end);
+        list_del(&c->vm_list);
+        spin_unlock_irqrestore(&consistent_lock, flags);
+        kfree(c);
+        return;
+ no_area:
+        spin_unlock_irqrestore(&consistent_lock, flags);
+        printk(KERN_ERR "%s: trying to free invalid coherent area: %p\n",
+               __func__, vaddr);
+        dump_stack();
+}
+EXPORT_SYMBOL(__dma_free_coherent);
+/*
+ * Set up the page table used for consistent allocations.
+ *
+ * Obtains the pmd and then the kernel pte table covering CONSISTENT_BASE
+ * in init_mm and records the pte table in consistent_pte. Returns 0 on
+ * success or -ENOMEM when either table cannot be obtained. Registered as
+ * a core initcall.
+ */
+static int __init dma_alloc_init(void)
+{
+        pgd_t *pgd = pgd_offset(&init_mm, CONSISTENT_BASE);
+        pmd_t *pmd = pmd_alloc(&init_mm, pgd, CONSISTENT_BASE);
+        pte_t *pte;
+        if (!pmd) {
+                printk(KERN_ERR "%s: no pmd tables\n", __func__);
+                return -ENOMEM;
+        }
+        /* Warn if the pmd entry is already populated. */
+        WARN_ON(!pmd_none(*pmd));
+        pte = pte_alloc_kernel(pmd, CONSISTENT_BASE);
+        if (!pte) {
+                printk(KERN_ERR "%s: no pte tables\n", __func__);
+                return -ENOMEM;
+        }
+        consistent_pte = pte;
+        return 0;
+}
+core_initcall(dma_alloc_init);
+/*
+ * Make the byte range [vaddr, vaddr + size) consistent for a DMA transfer.
+ * The cache operation applied depends on 'direction'; DMA_NONE is a bug.
+ * Any other value of 'direction' does nothing.
+ */
+void __dma_sync(void *vaddr, size_t size, int direction)
+{
+        const unsigned long first = (unsigned long)vaddr;
+        const unsigned long limit = first + size;
+        switch (direction) {
+        case DMA_BIDIRECTIONAL: /* writeback and invalidate */
+                flush_dcache_range(first, limit);
+                break;
+        case DMA_TO_DEVICE:     /* writeback only */
+                clean_dcache_range(first, limit);
+                break;
+        case DMA_NONE:
+                BUG();
+                /* no break here: control continues into the next case */
+        case DMA_FROM_DEVICE:   /* invalidate only */
+                invalidate_dcache_range(first, limit);
+                break;
+        }
+}
+EXPORT_SYMBOL(__dma_sync);
+#ifdef CONFIG_HIGHMEM
+/*
+ * __dma_sync_page() implementation for systems using highmem.
+ * In this case, each page of a buffer must be kmapped/kunmapped
+ * in order to have a virtual address for __dma_sync(). This must
+ * not sleep so kmap_atomic()/kunmap_atomic() are used.
+ *
+ * Note: yes, it is possible and correct to have a buffer extend
+ * beyond the first page.
+ */
+/*
+ * Sync a buffer that starts 'offset' bytes into 'page' and is 'size' bytes
+ * long, one page-sized segment at a time. Each segment's page is mapped with
+ * kmap_atomic(), passed to __dma_sync() with 'direction', and unmapped.
+ * The whole walk runs with local interrupts disabled.
+ */
+static inline void __dma_sync_page_highmem(struct page *page,
+                unsigned long offset, size_t size, int direction)
+{
+        /* First segment: from 'offset' to the end of the first page, or less. */
+        size_t seg_size = min((size_t)(PAGE_SIZE - offset), size);
+        /* Bytes accounted for so far, including the segment about to be synced. */
+        size_t cur_size = seg_size;
+        unsigned long flags, start, seg_offset = offset;
+        /* One for the first segment, plus the remainder rounded up to pages. */
+        int nr_segs = 1 + ((size - seg_size) + PAGE_SIZE - 1)/PAGE_SIZE;
+        int seg_nr = 0;
+        /* NOTE(review): presumably protects the KM_PPC_SYNC_PAGE slot - confirm */
+        local_irq_save(flags);
+        do {
+                start = (unsigned long)kmap_atomic(page + seg_nr,
+                                KM_PPC_SYNC_PAGE) + seg_offset;
+                /* Sync this buffer segment */
+                __dma_sync((void *)start, seg_size, direction);
+                /*
+                 * NOTE(review): 'start' still includes seg_offset here, so
+                 * this assumes kunmap_atomic() accepts any address inside
+                 * the mapped page - confirm.
+                 */
+                kunmap_atomic((void *)start, KM_PPC_SYNC_PAGE);
+                seg_nr++;
+                /* Calculate next buffer segment size */
+                seg_size = min((size_t)PAGE_SIZE, size - cur_size);
+                /* Add the segment size to our running total */
+                cur_size += seg_size;
+                /* Only the first segment starts part-way into its page. */
+                seg_offset = 0;
+        } while (seg_nr < nr_segs);
+        local_irq_restore(flags);
+}
+#endif /* CONFIG_HIGHMEM */
+/*
+ * __dma_sync_page: page-based counterpart of __dma_sync(). Makes 'size'
+ * bytes starting 'offset' bytes into 'page' consistent for 'direction'.
+ * With CONFIG_HIGHMEM the work is delegated to __dma_sync_page_highmem();
+ * otherwise the address is derived from page_address(page).
+ */
+void __dma_sync_page(struct page *page, unsigned long offset,
+        size_t size, int direction)
+{
+#ifndef CONFIG_HIGHMEM
+        void *kaddr = (void *)((unsigned long)page_address(page) + offset);
+        __dma_sync(kaddr, size, direction);
+#else
+        __dma_sync_page_highmem(page, offset, size, direction);
+#endif
+}
+EXPORT_SYMBOL(__dma_sync_page);

diff --git a/arch/powerpc/lib/Makefile b/arch/powerpc/lib/Makefile index a0360ae10d0c..e2d414160c83 100644 --- a/arch/powerpc/lib/Makefile +++ b/arch/powerpc/lib/Makefile
@@ -16,6 +16,7 @@ obj-$(CONFIG_PPC64) += checksum_64.o copypage_64.o copyuser_64.o \
16	strcase.o	16	strcase.o
17	obj-$(CONFIG_QUICC_ENGINE) += rheap.o	17	obj-$(CONFIG_QUICC_ENGINE) += rheap.o
18	obj-$(CONFIG_XMON) += sstep.o	18	obj-$(CONFIG_XMON) += sstep.o
		19	obj-$(CONFIG_NOT_COHERENT_CACHE) += dma-noncoherent.o
19		20
20	ifeq ($(CONFIG_PPC64),y)	21	ifeq ($(CONFIG_PPC64),y)
21	obj-$(CONFIG_SMP) += locks.o	22	obj-$(CONFIG_SMP) += locks.o
@@ -24,5 +25,6 @@ endif
24		25
25	# Temporary hack until we have migrated to asm-powerpc	26	# Temporary hack until we have migrated to asm-powerpc
26	ifeq ($(CONFIG_PPC_MERGE),y)	27	ifeq ($(CONFIG_PPC_MERGE),y)
		28	obj-$(CONFIG_8xx) += rheap.o
27	obj-$(CONFIG_CPM2) += rheap.o	29	obj-$(CONFIG_CPM2) += rheap.o
28	endif	30	endif


diff --git a/arch/powerpc/lib/dma-noncoherent.c b/arch/powerpc/lib/dma-noncoherent.c new file mode 100644 index 000000000000..48f3d13a3de5 --- /dev/null +++ b/arch/powerpc/lib/dma-noncoherent.c
@@ -0,0 +1,418 @@
		1	/*
		2	* PowerPC version derived from arch/arm/mm/consistent.c
		3	* Copyright (C) 2001 Dan Malek (dmalek@jlc.net)
		4	*
		5	* Copyright (C) 2000 Russell King
		6	*
		7	* Consistent memory allocators. Used for DMA devices that want to
		8	* share uncached memory with the processor core. The function return
		9	* is the virtual address and 'dma_handle' is the physical address.
		10	* Mostly stolen from the ARM port, with some changes for PowerPC.
		11	* -- Dan
		12	*
		13	* Reorganized to get rid of the arch-specific consistent_* functions
		14	* and provide non-coherent implementations for the DMA API. -Matt
		15	*
		16	* Added in_interrupt() safe dma_alloc_coherent()/dma_free_coherent()
		17	* implementation. This is pulled straight from ARM and barely
		18	* modified. -Matt
		19	*
		20	* This program is free software; you can redistribute it and/or modify
		21	* it under the terms of the GNU General Public License version 2 as
		22	* published by the Free Software Foundation.
		23	*/
		24
		25	#include <linux/sched.h>
		26	#include <linux/kernel.h>
		27	#include <linux/errno.h>
		28	#include <linux/string.h>
		29	#include <linux/types.h>
		30	#include <linux/highmem.h>
		31	#include <linux/dma-mapping.h>
		32
		33	#include <asm/tlbflush.h>
		34
		35	/*
		36	* This address range defaults to a value that is safe for all
		37	* platforms which currently set CONFIG_NOT_COHERENT_CACHE. It
		38	* can be further configured for specific applications under
		39	* the "Advanced Setup" menu. -Matt
		40	*/
		41	#define CONSISTENT_BASE (CONFIG_CONSISTENT_START)
		42	#define CONSISTENT_END (CONFIG_CONSISTENT_START + CONFIG_CONSISTENT_SIZE)
		43	#define CONSISTENT_OFFSET(x) (((unsigned long)(x) - CONSISTENT_BASE) >> PAGE_SHIFT)
		44
		45	/*
		46	* This is the page table (2MB) covering uncached, DMA consistent allocations
		47	*/
		48	static pte_t *consistent_pte;
		49	static DEFINE_SPINLOCK(consistent_lock);
		50
		51	/*
		52	* VM region handling support.
		53	*
		54	* This should become something generic, handling VM region allocations for
		55	* vmalloc and similar (ioremap, module space, etc).
		56	*
		57	* I envisage vmalloc()'s supporting vm_struct becoming:
		58	*
		59	* struct vm_struct {
		60	* struct vm_region region;
		61	* unsigned long flags;
		62	* struct page **pages;
		63	* unsigned int nr_pages;
		64	* unsigned long phys_addr;
		65	* };
		66	*
		67	* get_vm_area() would then call vm_region_alloc with an appropriate
		68	* struct vm_region head (eg):
		69	*
		70	* struct vm_region vmalloc_head = {
		71	* .vm_list = LIST_HEAD_INIT(vmalloc_head.vm_list),
		72	* .vm_start = VMALLOC_START,
		73	* .vm_end = VMALLOC_END,
		74	* };
		75	*
		76	* However, vmalloc_head.vm_start is variable (typically, it is dependent on
		77	* the amount of RAM found at boot time.) I would imagine that get_vm_area()
		78	* would have to initialise this each time prior to calling vm_region_alloc().
		79	*/
		80	struct vm_region {
		81	struct list_head vm_list;
		82	unsigned long vm_start;
		83	unsigned long vm_end;
		84	};
		85
		86	static struct vm_region consistent_head = {
		87	.vm_list = LIST_HEAD_INIT(consistent_head.vm_list),
		88	.vm_start = CONSISTENT_BASE,
		89	.vm_end = CONSISTENT_END,
		90	};
		91
		92	static struct vm_region *
		93	vm_region_alloc(struct vm_region *head, size_t size, gfp_t gfp)
		94	{
		95	unsigned long addr = head->vm_start, end = head->vm_end - size;
		96	unsigned long flags;
		97	struct vm_region *c, *new;
		98
		99	new = kmalloc(sizeof(struct vm_region), gfp);
		100	if (!new)
		101	goto out;
		102
		103	spin_lock_irqsave(&consistent_lock, flags);
		104
		105	list_for_each_entry(c, &head->vm_list, vm_list) {
		106	if ((addr + size) < addr)
		107	goto nospc;
		108	if ((addr + size) <= c->vm_start)
		109	goto found;
		110	addr = c->vm_end;
		111	if (addr > end)
		112	goto nospc;
		113	}
		114
		115	found:
		116	/*
		117	* Insert this entry _before_ the one we found.
		118	*/
		119	list_add_tail(&new->vm_list, &c->vm_list);
		120	new->vm_start = addr;
		121	new->vm_end = addr + size;
		122
		123	spin_unlock_irqrestore(&consistent_lock, flags);
		124	return new;
		125
		126	nospc:
		127	spin_unlock_irqrestore(&consistent_lock, flags);
		128	kfree(new);
		129	out:
		130	return NULL;
		131	}
		132
		133	static struct vm_region *vm_region_find(struct vm_region *head, unsigned long addr)
		134	{
		135	struct vm_region *c;
		136
		137	list_for_each_entry(c, &head->vm_list, vm_list) {
		138	if (c->vm_start == addr)
		139	goto out;
		140	}
		141	c = NULL;
		142	out:
		143	return c;
		144	}
		145
		146	/*
		147	* Allocate DMA-coherent memory space and return both the kernel remapped
		148	* virtual and bus address for that space.
		149	*/
		150	void *
		151	__dma_alloc_coherent(size_t size, dma_addr_t *handle, gfp_t gfp)
		152	{
		153	struct page *page;
		154	struct vm_region *c;
		155	unsigned long order;
		156	u64 mask = 0x00ffffff, limit; /* ISA default */
		157
		158	if (!consistent_pte) {
		159	printk(KERN_ERR "%s: not initialised\n", __func__);
		160	dump_stack();
		161	return NULL;
		162	}
		163
		164	size = PAGE_ALIGN(size);
		165	limit = (mask + 1) & ~mask;
		166	if ((limit && size >= limit) || size >= (CONSISTENT_END - CONSISTENT_BASE)) {
		167	printk(KERN_WARNING "coherent allocation too big (requested %#x mask %#Lx)\n",
		168	size, mask);
		169	return NULL;
		170	}
		171
		172	order = get_order(size);
		173
		174	if (mask != 0xffffffff)
		175	gfp |= GFP_DMA;
		176
		177	page = alloc_pages(gfp, order);
		178	if (!page)
		179	goto no_page;
		180
		181	/*
		182	* Invalidate any data that might be lurking in the
		183	* kernel direct-mapped region for device DMA.
		184	*/
		185	{
		186	unsigned long kaddr = (unsigned long)page_address(page);
		187	memset(page_address(page), 0, size);
		188	flush_dcache_range(kaddr, kaddr + size);
		189	}
		190
		191	/*
		192	* Allocate a virtual address in the consistent mapping region.
		193	*/
		194	c = vm_region_alloc(&consistent_head, size,
		195	gfp & ~(__GFP_DMA | __GFP_HIGHMEM));
		196	if (c) {
		197	unsigned long vaddr = c->vm_start;
		198	pte_t *pte = consistent_pte + CONSISTENT_OFFSET(vaddr);
		199	struct page *end = page + (1 << order);
		200
		201	split_page(page, order);
		202
		203	/*
		204	* Set the "dma handle"
		205	*/
		206	*handle = page_to_bus(page);
		207
		208	do {
		209	BUG_ON(!pte_none(*pte));
		210
		211	SetPageReserved(page);
		212	set_pte_at(&init_mm, vaddr,
		213	pte, mk_pte(page, pgprot_noncached(PAGE_KERNEL)));
		214	page++;
		215	pte++;
		216	vaddr += PAGE_SIZE;
		217	} while (size -= PAGE_SIZE);
		218
		219	/*
		220	* Free the otherwise unused pages.
		221	*/
		222	while (page < end) {
		223	__free_page(page);
		224	page++;
		225	}
		226
		227	return (void *)c->vm_start;
		228	}
		229
		230	if (page)
		231	__free_pages(page, order);
		232	no_page:
		233	return NULL;
		234	}
		235	EXPORT_SYMBOL(__dma_alloc_coherent);
		236
		237	/*
		238	* free a page as defined by the above mapping.
		239	*/
		240	void __dma_free_coherent(size_t size, void *vaddr)
		241	{
		242	struct vm_region *c;
		243	unsigned long flags, addr;
		244	pte_t *ptep;
		245
		246	size = PAGE_ALIGN(size);
		247
		248	spin_lock_irqsave(&consistent_lock, flags);
		249
		250	c = vm_region_find(&consistent_head, (unsigned long)vaddr);
		251	if (!c)
		252	goto no_area;
		253
		254	if ((c->vm_end - c->vm_start) != size) {
		255	printk(KERN_ERR "%s: freeing wrong coherent size (%ld != %d)\n",
		256	__func__, c->vm_end - c->vm_start, size);
		257	dump_stack();
		258	size = c->vm_end - c->vm_start;
		259	}
		260
		261	ptep = consistent_pte + CONSISTENT_OFFSET(c->vm_start);
		262	addr = c->vm_start;
		263	do {
		264	pte_t pte = ptep_get_and_clear(&init_mm, addr, ptep);
		265	unsigned long pfn;
		266
		267	ptep++;
		268	addr += PAGE_SIZE;
		269
		270	if (!pte_none(pte) && pte_present(pte)) {
		271	pfn = pte_pfn(pte);
		272
		273	if (pfn_valid(pfn)) {
		274	struct page *page = pfn_to_page(pfn);
		275	ClearPageReserved(page);
		276
		277	__free_page(page);
		278	continue;
		279	}
		280	}
		281
		282	printk(KERN_CRIT "%s: bad page in kernel page table\n",
		283	__func__);
		284	} while (size -= PAGE_SIZE);
		285
		286	flush_tlb_kernel_range(c->vm_start, c->vm_end);
		287
		288	list_del(&c->vm_list);
		289
		290	spin_unlock_irqrestore(&consistent_lock, flags);
		291
		292	kfree(c);
		293	return;
		294
		295	no_area:
		296	spin_unlock_irqrestore(&consistent_lock, flags);
		297	printk(KERN_ERR "%s: trying to free invalid coherent area: %p\n",
		298	__func__, vaddr);
		299	dump_stack();
		300	}
		301	EXPORT_SYMBOL(__dma_free_coherent);
		302
		303	/*
		304	* Initialise the consistent memory allocation.
		305	*/
		306	static int __init dma_alloc_init(void)
		307	{
		308	pgd_t *pgd;
		309	pmd_t *pmd;
		310	pte_t *pte;
		311	int ret = 0;
		312
		313	do {
		314	pgd = pgd_offset(&init_mm, CONSISTENT_BASE);
		315	pmd = pmd_alloc(&init_mm, pgd, CONSISTENT_BASE);
		316	if (!pmd) {
		317	printk(KERN_ERR "%s: no pmd tables\n", __func__);
		318	ret = -ENOMEM;
		319	break;
		320	}
		321	WARN_ON(!pmd_none(*pmd));
		322
		323	pte = pte_alloc_kernel(pmd, CONSISTENT_BASE);
		324	if (!pte) {
		325	printk(KERN_ERR "%s: no pte tables\n", __func__);
		326	ret = -ENOMEM;
		327	break;
		328	}
		329
		330	consistent_pte = pte;
		331	} while (0);
		332
		333	return ret;
		334	}
		335
		336	core_initcall(dma_alloc_init);
		337
		338	/*
		339	* make an area consistent.
		340	*/
		341	void __dma_sync(void *vaddr, size_t size, int direction)
		342	{
		343	unsigned long start = (unsigned long)vaddr;
		344	unsigned long end = start + size;
		345
		346	switch (direction) {
		347	case DMA_NONE:
		348	BUG();
		349	case DMA_FROM_DEVICE: /* invalidate only */
		350	invalidate_dcache_range(start, end);
		351	break;
		352	case DMA_TO_DEVICE: /* writeback only */
		353	clean_dcache_range(start, end);
		354	break;
		355	case DMA_BIDIRECTIONAL: /* writeback and invalidate */
		356	flush_dcache_range(start, end);
		357	break;
		358	}
		359	}
		360	EXPORT_SYMBOL(__dma_sync);
		361
		362	#ifdef CONFIG_HIGHMEM
		363	/*
		364	* __dma_sync_page() implementation for systems using highmem.
		365	* In this case, each page of a buffer must be kmapped/kunmapped
		366	* in order to have a virtual address for __dma_sync(). This must
		367	* not sleep so kmap_atomic()/kunmap_atomic() are used.
		368	*
		369	* Note: yes, it is possible and correct to have a buffer extend
		370	* beyond the first page.
		371	*/
		372	static inline void __dma_sync_page_highmem(struct page *page,
		373	unsigned long offset, size_t size, int direction)
		374	{
		375	size_t seg_size = min((size_t)(PAGE_SIZE - offset), size);
		376	size_t cur_size = seg_size;
		377	unsigned long flags, start, seg_offset = offset;
		378	int nr_segs = 1 + ((size - seg_size) + PAGE_SIZE - 1)/PAGE_SIZE;
		379	int seg_nr = 0;
		380
		381	local_irq_save(flags);
		382
		383	do {
		384	start = (unsigned long)kmap_atomic(page + seg_nr,
		385	KM_PPC_SYNC_PAGE) + seg_offset;
		386
		387	/* Sync this buffer segment */
		388	__dma_sync((void *)start, seg_size, direction);
		389	kunmap_atomic((void *)start, KM_PPC_SYNC_PAGE);
		390	seg_nr++;
		391
		392	/* Calculate next buffer segment size */
		393	seg_size = min((size_t)PAGE_SIZE, size - cur_size);
		394
		395	/* Add the segment size to our running total */
		396	cur_size += seg_size;
		397	seg_offset = 0;
		398	} while (seg_nr < nr_segs);
		399
		400	local_irq_restore(flags);
		401	}
		402	#endif /* CONFIG_HIGHMEM */
		403
		404	/*
		405	* __dma_sync_page makes memory consistent. identical to __dma_sync, but
		406	* takes a struct page instead of a virtual address
		407	*/
		408	void __dma_sync_page(struct page *page, unsigned long offset,
		409	size_t size, int direction)
		410	{
		411	#ifdef CONFIG_HIGHMEM
		412	__dma_sync_page_highmem(page, offset, size, direction);
		413	#else
		414	unsigned long start = (unsigned long)page_address(page) + offset;
		415	__dma_sync((void *)start, size, direction);
		416	#endif
		417	}
		418	EXPORT_SYMBOL(__dma_sync_page);