diff options
Diffstat (limited to 'drivers/gpu/nvgpu/common')
-rw-r--r-- | drivers/gpu/nvgpu/common/linux/dma.c | 415 | ||||
-rw-r--r-- | drivers/gpu/nvgpu/common/semaphore.c | 1 |
2 files changed, 416 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/linux/dma.c b/drivers/gpu/nvgpu/common/linux/dma.c new file mode 100644 index 00000000..755848ea --- /dev/null +++ b/drivers/gpu/nvgpu/common/linux/dma.c | |||
@@ -0,0 +1,415 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. | ||
3 | * | ||
4 | * This program is free software; you can redistribute it and/or modify it | ||
5 | * under the terms and conditions of the GNU General Public License, | ||
6 | * version 2, as published by the Free Software Foundation. | ||
7 | * | ||
8 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
11 | * more details. | ||
12 | * | ||
13 | * You should have received a copy of the GNU General Public License | ||
14 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
15 | */ | ||
16 | |||
17 | #include <linux/dma-attrs.h> | ||
18 | #include <linux/dma-mapping.h> | ||
19 | |||
20 | #include <nvgpu/dma.h> | ||
21 | #include <nvgpu/lock.h> | ||
22 | |||
23 | #include "gk20a/gk20a.h" | ||
24 | |||
#if defined(CONFIG_GK20A_VIDMEM)
/*
 * Carve @size bytes out of @allocator.  A non-zero @at requests a fixed
 * placement at that exact address; zero lets the allocator pick.  Returns
 * the allocated address, or 0 on failure.
 */
static u64 __gk20a_gmmu_alloc(struct nvgpu_allocator *allocator, dma_addr_t at,
			      size_t size)
{
	return at ? nvgpu_alloc_fixed(allocator, at, size, 0)
		  : nvgpu_alloc(allocator, size);
}
#endif
39 | |||
/*
 * Translate NVGPU_DMA_* allocation flags into the kernel's DMA attribute
 * representation.  The DMA-attrs API changed in Linux 4.9: newer kernels
 * pass a plain unsigned long bitmask, older ones a struct dma_attrs.  The
 * ATTR_ARG macro hides the resulting by-pointer vs. by-value difference so
 * one function body serves both kernel generations; it is #undef'd at the
 * end to keep it local to this function.
 */
#if LINUX_VERSION_CODE >= KERNEL_VERSION(4, 9, 0)
static void gk20a_dma_flags_to_attrs(unsigned long *attrs,
		unsigned long flags)
#define ATTR_ARG(x) *x
#else
static void gk20a_dma_flags_to_attrs(struct dma_attrs *attrs,
		unsigned long flags)
#define ATTR_ARG(x) x
#endif
{
	if (flags & NVGPU_DMA_NO_KERNEL_MAPPING)
		dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, ATTR_ARG(attrs));
	if (flags & NVGPU_DMA_FORCE_CONTIGUOUS)
		dma_set_attr(DMA_ATTR_FORCE_CONTIGUOUS, ATTR_ARG(attrs));
	if (flags & NVGPU_DMA_READ_ONLY)
		dma_set_attr(DMA_ATTR_READ_ONLY, ATTR_ARG(attrs));
#undef ATTR_ARG
}
58 | |||
59 | int gk20a_gmmu_alloc(struct gk20a *g, size_t size, struct nvgpu_mem *mem) | ||
60 | { | ||
61 | return gk20a_gmmu_alloc_flags(g, 0, size, mem); | ||
62 | } | ||
63 | |||
64 | int gk20a_gmmu_alloc_flags(struct gk20a *g, unsigned long flags, size_t size, | ||
65 | struct nvgpu_mem *mem) | ||
66 | { | ||
67 | if (g->mm.vidmem_is_vidmem) { | ||
68 | /* | ||
69 | * Force the no-kernel-mapping flag on because we don't support | ||
70 | * the lack of it for vidmem - the user should not care when | ||
71 | * using gk20a_gmmu_alloc_map and it's vidmem, or if there's a | ||
72 | * difference, the user should use the flag explicitly anyway. | ||
73 | */ | ||
74 | int err = gk20a_gmmu_alloc_flags_vid(g, | ||
75 | flags | NVGPU_DMA_NO_KERNEL_MAPPING, | ||
76 | size, mem); | ||
77 | |||
78 | if (!err) | ||
79 | return 0; | ||
80 | /* | ||
81 | * Fall back to sysmem (which may then also fail) in case | ||
82 | * vidmem is exhausted. | ||
83 | */ | ||
84 | } | ||
85 | |||
86 | return gk20a_gmmu_alloc_flags_sys(g, flags, size, mem); | ||
87 | } | ||
88 | |||
89 | int gk20a_gmmu_alloc_sys(struct gk20a *g, size_t size, struct nvgpu_mem *mem) | ||
90 | { | ||
91 | return gk20a_gmmu_alloc_flags_sys(g, 0, size, mem); | ||
92 | } | ||
93 | |||
94 | int gk20a_gmmu_alloc_flags_sys(struct gk20a *g, unsigned long flags, | ||
95 | size_t size, struct nvgpu_mem *mem) | ||
96 | { | ||
97 | struct device *d = dev_from_gk20a(g); | ||
98 | int err; | ||
99 | dma_addr_t iova; | ||
100 | |||
101 | gk20a_dbg_fn(""); | ||
102 | |||
103 | if (flags) { | ||
104 | DEFINE_DMA_ATTRS(dma_attrs); | ||
105 | |||
106 | gk20a_dma_flags_to_attrs(&dma_attrs, flags); | ||
107 | |||
108 | if (flags & NVGPU_DMA_NO_KERNEL_MAPPING) { | ||
109 | mem->pages = dma_alloc_attrs(d, | ||
110 | size, &iova, GFP_KERNEL, | ||
111 | __DMA_ATTR(dma_attrs)); | ||
112 | if (!mem->pages) | ||
113 | return -ENOMEM; | ||
114 | } else { | ||
115 | mem->cpu_va = dma_alloc_attrs(d, | ||
116 | size, &iova, GFP_KERNEL, | ||
117 | __DMA_ATTR(dma_attrs)); | ||
118 | if (!mem->cpu_va) | ||
119 | return -ENOMEM; | ||
120 | } | ||
121 | } else { | ||
122 | mem->cpu_va = dma_alloc_coherent(d, size, &iova, GFP_KERNEL); | ||
123 | if (!mem->cpu_va) | ||
124 | return -ENOMEM; | ||
125 | } | ||
126 | |||
127 | if (flags & NVGPU_DMA_NO_KERNEL_MAPPING) | ||
128 | err = gk20a_get_sgtable_from_pages(d, &mem->sgt, mem->pages, | ||
129 | iova, size); | ||
130 | else { | ||
131 | err = gk20a_get_sgtable(d, &mem->sgt, mem->cpu_va, iova, size); | ||
132 | memset(mem->cpu_va, 0, size); | ||
133 | } | ||
134 | if (err) | ||
135 | goto fail_free; | ||
136 | |||
137 | mem->size = size; | ||
138 | mem->aperture = APERTURE_SYSMEM; | ||
139 | mem->flags = flags; | ||
140 | |||
141 | gk20a_dbg_fn("done"); | ||
142 | |||
143 | return 0; | ||
144 | |||
145 | fail_free: | ||
146 | dma_free_coherent(d, size, mem->cpu_va, iova); | ||
147 | mem->cpu_va = NULL; | ||
148 | mem->sgt = NULL; | ||
149 | return err; | ||
150 | } | ||
151 | |||
152 | int gk20a_gmmu_alloc_vid(struct gk20a *g, size_t size, struct nvgpu_mem *mem) | ||
153 | { | ||
154 | return gk20a_gmmu_alloc_flags_vid(g, | ||
155 | NVGPU_DMA_NO_KERNEL_MAPPING, size, mem); | ||
156 | } | ||
157 | |||
158 | int gk20a_gmmu_alloc_flags_vid(struct gk20a *g, unsigned long flags, | ||
159 | size_t size, struct nvgpu_mem *mem) | ||
160 | { | ||
161 | return gk20a_gmmu_alloc_flags_vid_at(g, flags, size, mem, 0); | ||
162 | } | ||
163 | |||
/*
 * Allocate @size bytes of vidmem, optionally at the fixed address @at
 * (0 = allocator's choice), and describe the allocation with a one-entry
 * sg_table in @mem.  Returns 0 on success, -ENOSYS when vidmem is not
 * available/compiled in, -EAGAIN when the allocation failed but pending
 * frees suggest retrying later, -ENOMEM otherwise.
 */
int gk20a_gmmu_alloc_flags_vid_at(struct gk20a *g, unsigned long flags,
		size_t size, struct nvgpu_mem *mem, dma_addr_t at)
{
#if defined(CONFIG_GK20A_VIDMEM)
	u64 addr;
	int err;
	/*
	 * Until the main vidmem pool has been cleared, allocations come
	 * from the bootstrap allocator instead.
	 */
	struct nvgpu_allocator *vidmem_alloc = g->mm.vidmem.cleared ?
		&g->mm.vidmem.allocator :
		&g->mm.vidmem.bootstrap_allocator;
	int before_pending;

	gk20a_dbg_fn("");

	if (!nvgpu_alloc_initialized(&g->mm.vidmem.allocator))
		return -ENOSYS;

	/*
	 * Our own allocator doesn't have any flags yet, and we can't
	 * kernel-map these, so require explicit flags.
	 */
	WARN_ON(flags != NVGPU_DMA_NO_KERNEL_MAPPING);

	/*
	 * Sample bytes_pending and attempt the allocation under the
	 * clear-list lock so a failure can tell whether frees were still in
	 * flight at that moment (and hence whether a retry may succeed).
	 */
	nvgpu_mutex_acquire(&g->mm.vidmem.clear_list_mutex);
	before_pending = atomic64_read(&g->mm.vidmem.bytes_pending);
	addr = __gk20a_gmmu_alloc(vidmem_alloc, at, size);
	nvgpu_mutex_release(&g->mm.vidmem.clear_list_mutex);
	if (!addr) {
		/*
		 * If memory is known to be freed soon, let the user know that
		 * it may be available after a while.
		 */
		if (before_pending)
			return -EAGAIN;
		else
			return -ENOMEM;
	}

	if (at)
		mem->fixed = true;
	else
		mem->fixed = false;

	/* One-entry sg_table; vidmem has no struct pages backing it. */
	mem->sgt = nvgpu_kzalloc(g, sizeof(struct sg_table));
	if (!mem->sgt) {
		err = -ENOMEM;
		goto fail_physfree;
	}

	err = sg_alloc_table(mem->sgt, 1, GFP_KERNEL);
	if (err)
		goto fail_kfree;

	/* Stash the vidmem allocation handle in the page-less sg entry. */
	set_vidmem_page_alloc(mem->sgt->sgl, addr);
	sg_set_page(mem->sgt->sgl, NULL, size, 0);

	mem->size = size;
	mem->aperture = APERTURE_VIDMEM;
	mem->allocator = vidmem_alloc;
	mem->flags = flags;

	nvgpu_init_list_node(&mem->clear_list_entry);

	gk20a_dbg_fn("done at 0x%llx size %zu", addr, size);

	return 0;

fail_kfree:
	nvgpu_kfree(g, mem->sgt);
fail_physfree:
	/*
	 * NOTE(review): addr may have come from the bootstrap allocator
	 * (vidmem_alloc above), yet is returned to the main allocator here -
	 * confirm this asymmetry is intentional.
	 */
	nvgpu_free(&g->mm.vidmem.allocator, addr);
	return err;
#else
	return -ENOSYS;
#endif
}
239 | |||
240 | int gk20a_gmmu_alloc_map(struct vm_gk20a *vm, size_t size, | ||
241 | struct nvgpu_mem *mem) | ||
242 | { | ||
243 | return gk20a_gmmu_alloc_map_flags(vm, 0, size, mem); | ||
244 | } | ||
245 | |||
246 | int gk20a_gmmu_alloc_map_flags(struct vm_gk20a *vm, unsigned long flags, | ||
247 | size_t size, struct nvgpu_mem *mem) | ||
248 | { | ||
249 | if (vm->mm->vidmem_is_vidmem) { | ||
250 | /* | ||
251 | * Force the no-kernel-mapping flag on because we don't support | ||
252 | * the lack of it for vidmem - the user should not care when | ||
253 | * using gk20a_gmmu_alloc_map and it's vidmem, or if there's a | ||
254 | * difference, the user should use the flag explicitly anyway. | ||
255 | */ | ||
256 | int err = gk20a_gmmu_alloc_map_flags_vid(vm, | ||
257 | flags | NVGPU_DMA_NO_KERNEL_MAPPING, | ||
258 | size, mem); | ||
259 | |||
260 | if (!err) | ||
261 | return 0; | ||
262 | /* | ||
263 | * Fall back to sysmem (which may then also fail) in case | ||
264 | * vidmem is exhausted. | ||
265 | */ | ||
266 | } | ||
267 | |||
268 | return gk20a_gmmu_alloc_map_flags_sys(vm, flags, size, mem); | ||
269 | } | ||
270 | |||
271 | int gk20a_gmmu_alloc_map_sys(struct vm_gk20a *vm, size_t size, | ||
272 | struct nvgpu_mem *mem) | ||
273 | { | ||
274 | return gk20a_gmmu_alloc_map_flags_sys(vm, 0, size, mem); | ||
275 | } | ||
276 | |||
277 | int gk20a_gmmu_alloc_map_flags_sys(struct vm_gk20a *vm, unsigned long flags, | ||
278 | size_t size, struct nvgpu_mem *mem) | ||
279 | { | ||
280 | int err = gk20a_gmmu_alloc_flags_sys(vm->mm->g, flags, size, mem); | ||
281 | |||
282 | if (err) | ||
283 | return err; | ||
284 | |||
285 | mem->gpu_va = gk20a_gmmu_map(vm, &mem->sgt, size, 0, | ||
286 | gk20a_mem_flag_none, false, | ||
287 | mem->aperture); | ||
288 | if (!mem->gpu_va) { | ||
289 | err = -ENOMEM; | ||
290 | goto fail_free; | ||
291 | } | ||
292 | |||
293 | return 0; | ||
294 | |||
295 | fail_free: | ||
296 | gk20a_gmmu_free(vm->mm->g, mem); | ||
297 | return err; | ||
298 | } | ||
299 | |||
300 | int gk20a_gmmu_alloc_map_vid(struct vm_gk20a *vm, size_t size, | ||
301 | struct nvgpu_mem *mem) | ||
302 | { | ||
303 | return gk20a_gmmu_alloc_map_flags_vid(vm, | ||
304 | NVGPU_DMA_NO_KERNEL_MAPPING, size, mem); | ||
305 | } | ||
306 | |||
307 | int gk20a_gmmu_alloc_map_flags_vid(struct vm_gk20a *vm, unsigned long flags, | ||
308 | size_t size, struct nvgpu_mem *mem) | ||
309 | { | ||
310 | int err = gk20a_gmmu_alloc_flags_vid(vm->mm->g, flags, size, mem); | ||
311 | |||
312 | if (err) | ||
313 | return err; | ||
314 | |||
315 | mem->gpu_va = gk20a_gmmu_map(vm, &mem->sgt, size, 0, | ||
316 | gk20a_mem_flag_none, false, | ||
317 | mem->aperture); | ||
318 | if (!mem->gpu_va) { | ||
319 | err = -ENOMEM; | ||
320 | goto fail_free; | ||
321 | } | ||
322 | |||
323 | return 0; | ||
324 | |||
325 | fail_free: | ||
326 | gk20a_gmmu_free(vm->mm->g, mem); | ||
327 | return err; | ||
328 | } | ||
329 | |||
330 | static void gk20a_gmmu_free_sys(struct gk20a *g, struct nvgpu_mem *mem) | ||
331 | { | ||
332 | struct device *d = dev_from_gk20a(g); | ||
333 | |||
334 | if (mem->cpu_va || mem->pages) { | ||
335 | if (mem->flags) { | ||
336 | DEFINE_DMA_ATTRS(dma_attrs); | ||
337 | |||
338 | gk20a_dma_flags_to_attrs(&dma_attrs, mem->flags); | ||
339 | |||
340 | if (mem->flags & NVGPU_DMA_NO_KERNEL_MAPPING) { | ||
341 | dma_free_attrs(d, mem->size, mem->pages, | ||
342 | sg_dma_address(mem->sgt->sgl), | ||
343 | __DMA_ATTR(dma_attrs)); | ||
344 | } else { | ||
345 | dma_free_attrs(d, mem->size, mem->cpu_va, | ||
346 | sg_dma_address(mem->sgt->sgl), | ||
347 | __DMA_ATTR(dma_attrs)); | ||
348 | } | ||
349 | } else { | ||
350 | dma_free_coherent(d, mem->size, mem->cpu_va, | ||
351 | sg_dma_address(mem->sgt->sgl)); | ||
352 | } | ||
353 | mem->cpu_va = NULL; | ||
354 | mem->pages = NULL; | ||
355 | } | ||
356 | |||
357 | if (mem->sgt) | ||
358 | gk20a_free_sgtable(g, &mem->sgt); | ||
359 | |||
360 | mem->size = 0; | ||
361 | mem->aperture = APERTURE_INVALID; | ||
362 | } | ||
363 | |||
/*
 * Release a vidmem allocation.  User-owned buffers must be scrubbed
 * before their memory can be reused, so they are queued on the clear
 * list and handed to the clear_mem_worker; kernel-owned buffers are
 * cleared synchronously and freed immediately.
 */
static void gk20a_gmmu_free_vid(struct gk20a *g, struct nvgpu_mem *mem)
{
#if defined(CONFIG_GK20A_VIDMEM)
	bool was_empty;

	/* Sanity check - only this supported when allocating. */
	WARN_ON(mem->flags != NVGPU_DMA_NO_KERNEL_MAPPING);

	if (mem->user_mem) {
		/* Queue for deferred clear + free under the list lock. */
		nvgpu_mutex_acquire(&g->mm.vidmem.clear_list_mutex);
		was_empty = nvgpu_list_empty(&g->mm.vidmem.clear_list_head);
		nvgpu_list_add_tail(&mem->clear_list_entry,
			      &g->mm.vidmem.clear_list_head);
		atomic64_add(mem->size, &g->mm.vidmem.bytes_pending);
		nvgpu_mutex_release(&g->mm.vidmem.clear_list_mutex);

		if (was_empty) {
			/*
			 * NOTE(review): the worker is only kicked when the
			 * list went from empty to non-empty; presumably the
			 * cancel_work_sync() flushes a stale pending item
			 * before rescheduling - confirm the intent.
			 */
			cancel_work_sync(&g->mm.vidmem.clear_mem_worker);
			schedule_work(&g->mm.vidmem.clear_mem_worker);
		}
	} else {
		/* Kernel memory: scrub now, free now. */
		nvgpu_memset(g, mem, 0, 0, mem->size);
		nvgpu_free(mem->allocator,
			   (u64)get_vidmem_page_alloc(mem->sgt->sgl));
		gk20a_free_sgtable(g, &mem->sgt);

		mem->size = 0;
		mem->aperture = APERTURE_INVALID;
	}
#endif
}
395 | |||
396 | void gk20a_gmmu_free(struct gk20a *g, struct nvgpu_mem *mem) | ||
397 | { | ||
398 | switch (mem->aperture) { | ||
399 | case APERTURE_SYSMEM: | ||
400 | return gk20a_gmmu_free_sys(g, mem); | ||
401 | case APERTURE_VIDMEM: | ||
402 | return gk20a_gmmu_free_vid(g, mem); | ||
403 | default: | ||
404 | break; /* like free() on "null" memory */ | ||
405 | } | ||
406 | } | ||
407 | |||
408 | void gk20a_gmmu_unmap_free(struct vm_gk20a *vm, struct nvgpu_mem *mem) | ||
409 | { | ||
410 | if (mem->gpu_va) | ||
411 | gk20a_gmmu_unmap(vm, mem->gpu_va, mem->size, gk20a_mem_flag_none); | ||
412 | mem->gpu_va = 0; | ||
413 | |||
414 | gk20a_gmmu_free(vm->mm->g, mem); | ||
415 | } | ||
diff --git a/drivers/gpu/nvgpu/common/semaphore.c b/drivers/gpu/nvgpu/common/semaphore.c index 6fb6c27e..cfe1149f 100644 --- a/drivers/gpu/nvgpu/common/semaphore.c +++ b/drivers/gpu/nvgpu/common/semaphore.c | |||
@@ -18,6 +18,7 @@ | |||
18 | #include <linux/dma-mapping.h> | 18 | #include <linux/dma-mapping.h> |
19 | #include <linux/highmem.h> | 19 | #include <linux/highmem.h> |
20 | 20 | ||
21 | #include <nvgpu/dma.h> | ||
21 | #include <nvgpu/semaphore.h> | 22 | #include <nvgpu/semaphore.h> |
22 | #include <nvgpu/kmem.h> | 23 | #include <nvgpu/kmem.h> |
23 | 24 | ||