summaryrefslogtreecommitdiffstats
path: root/drivers/gpu/nvgpu/common
diff options
context:
space:
mode:
authorAlex Waterman <alexw@nvidia.com>2017-03-21 17:32:13 -0400
committermobile promotions <svcmobile_promotions@nvidia.com>2017-04-06 21:14:58 -0400
commit8f2d4a3f4a0acc81bae6725d30506e92651a42b5 (patch)
tree5cfe8a72fc824d167d3ce0f207621e1e4eb88391 /drivers/gpu/nvgpu/common
parentc9665079d7b12f22a847c62587724b4ee120ca6e (diff)
gpu: nvgpu: Move DMA API to dma.h
Make an nvgpu DMA API include file so that the intricacies of the Linux DMA API can be hidden from the calling code. Also document the nvgpu DMA API. JIRA NVGPU-12 Change-Id: I7578e4c726ad46344b7921179d95861858e9a27e Signed-off-by: Alex Waterman <alexw@nvidia.com> Reviewed-on: http://git-master/r/1323326 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Diffstat (limited to 'drivers/gpu/nvgpu/common')
-rw-r--r--drivers/gpu/nvgpu/common/linux/dma.c415
-rw-r--r--drivers/gpu/nvgpu/common/semaphore.c1
2 files changed, 416 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/linux/dma.c b/drivers/gpu/nvgpu/common/linux/dma.c
new file mode 100644
index 00000000..755848ea
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/linux/dma.c
@@ -0,0 +1,415 @@
1/*
2 * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
3 *
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms and conditions of the GNU General Public License,
6 * version 2, as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
11 * more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17#include <linux/dma-attrs.h>
18#include <linux/dma-mapping.h>
19
20#include <nvgpu/dma.h>
21#include <nvgpu/lock.h>
22
23#include "gk20a/gk20a.h"
24
#if defined(CONFIG_GK20A_VIDMEM)
/*
 * Carve @size bytes out of @allocator. A non-zero @at requests a fixed
 * allocation at that exact offset; otherwise any free range is used.
 * Returns the allocated address, or 0 on failure.
 */
static u64 __gk20a_gmmu_alloc(struct nvgpu_allocator *allocator, dma_addr_t at,
			      size_t size)
{
	return at ? nvgpu_alloc_fixed(allocator, at, size, 0)
		  : nvgpu_alloc(allocator, size);
}
#endif
39
/*
 * Translate NVGPU_DMA_* flags into Linux DMA attributes.
 *
 * Kernels >= 4.9 pass DMA attributes as a plain unsigned long bitmask;
 * older kernels use a struct dma_attrs. The function signature is chosen
 * by the version check below, and the ATTR_ARG() helper hides the extra
 * dereference the newer API needs, so one body serves both variants.
 */
#if LINUX_VERSION_CODE >= KERNEL_VERSION(4, 9, 0)
static void gk20a_dma_flags_to_attrs(unsigned long *attrs,
				     unsigned long flags)
#define ATTR_ARG(x) *x
#else
static void gk20a_dma_flags_to_attrs(struct dma_attrs *attrs,
				     unsigned long flags)
#define ATTR_ARG(x) x
#endif
{
	if (flags & NVGPU_DMA_NO_KERNEL_MAPPING)
		dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, ATTR_ARG(attrs));
	if (flags & NVGPU_DMA_FORCE_CONTIGUOUS)
		dma_set_attr(DMA_ATTR_FORCE_CONTIGUOUS, ATTR_ARG(attrs));
	if (flags & NVGPU_DMA_READ_ONLY)
		dma_set_attr(DMA_ATTR_READ_ONLY, ATTR_ARG(attrs));
/* ATTR_ARG is scoped to this function only. */
#undef ATTR_ARG
}
58
59int gk20a_gmmu_alloc(struct gk20a *g, size_t size, struct nvgpu_mem *mem)
60{
61 return gk20a_gmmu_alloc_flags(g, 0, size, mem);
62}
63
64int gk20a_gmmu_alloc_flags(struct gk20a *g, unsigned long flags, size_t size,
65 struct nvgpu_mem *mem)
66{
67 if (g->mm.vidmem_is_vidmem) {
68 /*
69 * Force the no-kernel-mapping flag on because we don't support
70 * the lack of it for vidmem - the user should not care when
71 * using gk20a_gmmu_alloc_map and it's vidmem, or if there's a
72 * difference, the user should use the flag explicitly anyway.
73 */
74 int err = gk20a_gmmu_alloc_flags_vid(g,
75 flags | NVGPU_DMA_NO_KERNEL_MAPPING,
76 size, mem);
77
78 if (!err)
79 return 0;
80 /*
81 * Fall back to sysmem (which may then also fail) in case
82 * vidmem is exhausted.
83 */
84 }
85
86 return gk20a_gmmu_alloc_flags_sys(g, flags, size, mem);
87}
88
89int gk20a_gmmu_alloc_sys(struct gk20a *g, size_t size, struct nvgpu_mem *mem)
90{
91 return gk20a_gmmu_alloc_flags_sys(g, 0, size, mem);
92}
93
94int gk20a_gmmu_alloc_flags_sys(struct gk20a *g, unsigned long flags,
95 size_t size, struct nvgpu_mem *mem)
96{
97 struct device *d = dev_from_gk20a(g);
98 int err;
99 dma_addr_t iova;
100
101 gk20a_dbg_fn("");
102
103 if (flags) {
104 DEFINE_DMA_ATTRS(dma_attrs);
105
106 gk20a_dma_flags_to_attrs(&dma_attrs, flags);
107
108 if (flags & NVGPU_DMA_NO_KERNEL_MAPPING) {
109 mem->pages = dma_alloc_attrs(d,
110 size, &iova, GFP_KERNEL,
111 __DMA_ATTR(dma_attrs));
112 if (!mem->pages)
113 return -ENOMEM;
114 } else {
115 mem->cpu_va = dma_alloc_attrs(d,
116 size, &iova, GFP_KERNEL,
117 __DMA_ATTR(dma_attrs));
118 if (!mem->cpu_va)
119 return -ENOMEM;
120 }
121 } else {
122 mem->cpu_va = dma_alloc_coherent(d, size, &iova, GFP_KERNEL);
123 if (!mem->cpu_va)
124 return -ENOMEM;
125 }
126
127 if (flags & NVGPU_DMA_NO_KERNEL_MAPPING)
128 err = gk20a_get_sgtable_from_pages(d, &mem->sgt, mem->pages,
129 iova, size);
130 else {
131 err = gk20a_get_sgtable(d, &mem->sgt, mem->cpu_va, iova, size);
132 memset(mem->cpu_va, 0, size);
133 }
134 if (err)
135 goto fail_free;
136
137 mem->size = size;
138 mem->aperture = APERTURE_SYSMEM;
139 mem->flags = flags;
140
141 gk20a_dbg_fn("done");
142
143 return 0;
144
145fail_free:
146 dma_free_coherent(d, size, mem->cpu_va, iova);
147 mem->cpu_va = NULL;
148 mem->sgt = NULL;
149 return err;
150}
151
152int gk20a_gmmu_alloc_vid(struct gk20a *g, size_t size, struct nvgpu_mem *mem)
153{
154 return gk20a_gmmu_alloc_flags_vid(g,
155 NVGPU_DMA_NO_KERNEL_MAPPING, size, mem);
156}
157
158int gk20a_gmmu_alloc_flags_vid(struct gk20a *g, unsigned long flags,
159 size_t size, struct nvgpu_mem *mem)
160{
161 return gk20a_gmmu_alloc_flags_vid_at(g, flags, size, mem, 0);
162}
163
/*
 * Allocate @size bytes of vidmem for @mem, optionally at fixed address @at.
 *
 * Only NVGPU_DMA_NO_KERNEL_MAPPING is supported (vidmem is never CPU
 * mapped). On success a one-entry sg_table carrying the vidmem address is
 * attached to mem->sgt.
 *
 * Returns 0 on success, -ENOSYS when vidmem is absent/uninitialized,
 * -EAGAIN when the space may free up soon, -ENOMEM otherwise.
 */
int gk20a_gmmu_alloc_flags_vid_at(struct gk20a *g, unsigned long flags,
		size_t size, struct nvgpu_mem *mem, dma_addr_t at)
{
#if defined(CONFIG_GK20A_VIDMEM)
	u64 addr;
	int err;
	/*
	 * Until the main allocator's backing store has been cleared, carve
	 * allocations out of the bootstrap allocator instead.
	 */
	struct nvgpu_allocator *vidmem_alloc = g->mm.vidmem.cleared ?
		&g->mm.vidmem.allocator :
		&g->mm.vidmem.bootstrap_allocator;
	int before_pending;

	gk20a_dbg_fn("");

	if (!nvgpu_alloc_initialized(&g->mm.vidmem.allocator))
		return -ENOSYS;

	/*
	 * Our own allocator doesn't have any flags yet, and we can't
	 * kernel-map these, so require explicit flags.
	 */
	WARN_ON(flags != NVGPU_DMA_NO_KERNEL_MAPPING);

	/*
	 * Snapshot bytes_pending under the clear-list lock together with the
	 * allocation attempt, so a failure can be classified below: if frees
	 * were pending at that moment, retrying later may succeed.
	 */
	nvgpu_mutex_acquire(&g->mm.vidmem.clear_list_mutex);
	before_pending = atomic64_read(&g->mm.vidmem.bytes_pending);
	addr = __gk20a_gmmu_alloc(vidmem_alloc, at, size);
	nvgpu_mutex_release(&g->mm.vidmem.clear_list_mutex);
	if (!addr) {
		/*
		 * If memory is known to be freed soon, let the user know that
		 * it may be available after a while.
		 */
		if (before_pending)
			return -EAGAIN;
		else
			return -ENOMEM;
	}

	if (at)
		mem->fixed = true;
	else
		mem->fixed = false;

	mem->sgt = nvgpu_kzalloc(g, sizeof(struct sg_table));
	if (!mem->sgt) {
		err = -ENOMEM;
		goto fail_physfree;
	}

	err = sg_alloc_table(mem->sgt, 1, GFP_KERNEL);
	if (err)
		goto fail_kfree;

	/*
	 * Vidmem has no struct page backing; stash the vidmem address in the
	 * single scatterlist entry instead (page pointer stays NULL).
	 */
	set_vidmem_page_alloc(mem->sgt->sgl, addr);
	sg_set_page(mem->sgt->sgl, NULL, size, 0);

	mem->size = size;
	mem->aperture = APERTURE_VIDMEM;
	mem->allocator = vidmem_alloc;
	mem->flags = flags;

	nvgpu_init_list_node(&mem->clear_list_entry);

	gk20a_dbg_fn("done at 0x%llx size %zu", addr, size);

	return 0;

fail_kfree:
	nvgpu_kfree(g, mem->sgt);
fail_physfree:
	nvgpu_free(&g->mm.vidmem.allocator, addr);
	return err;
#else
	return -ENOSYS;
#endif
}
239
240int gk20a_gmmu_alloc_map(struct vm_gk20a *vm, size_t size,
241 struct nvgpu_mem *mem)
242{
243 return gk20a_gmmu_alloc_map_flags(vm, 0, size, mem);
244}
245
246int gk20a_gmmu_alloc_map_flags(struct vm_gk20a *vm, unsigned long flags,
247 size_t size, struct nvgpu_mem *mem)
248{
249 if (vm->mm->vidmem_is_vidmem) {
250 /*
251 * Force the no-kernel-mapping flag on because we don't support
252 * the lack of it for vidmem - the user should not care when
253 * using gk20a_gmmu_alloc_map and it's vidmem, or if there's a
254 * difference, the user should use the flag explicitly anyway.
255 */
256 int err = gk20a_gmmu_alloc_map_flags_vid(vm,
257 flags | NVGPU_DMA_NO_KERNEL_MAPPING,
258 size, mem);
259
260 if (!err)
261 return 0;
262 /*
263 * Fall back to sysmem (which may then also fail) in case
264 * vidmem is exhausted.
265 */
266 }
267
268 return gk20a_gmmu_alloc_map_flags_sys(vm, flags, size, mem);
269}
270
271int gk20a_gmmu_alloc_map_sys(struct vm_gk20a *vm, size_t size,
272 struct nvgpu_mem *mem)
273{
274 return gk20a_gmmu_alloc_map_flags_sys(vm, 0, size, mem);
275}
276
277int gk20a_gmmu_alloc_map_flags_sys(struct vm_gk20a *vm, unsigned long flags,
278 size_t size, struct nvgpu_mem *mem)
279{
280 int err = gk20a_gmmu_alloc_flags_sys(vm->mm->g, flags, size, mem);
281
282 if (err)
283 return err;
284
285 mem->gpu_va = gk20a_gmmu_map(vm, &mem->sgt, size, 0,
286 gk20a_mem_flag_none, false,
287 mem->aperture);
288 if (!mem->gpu_va) {
289 err = -ENOMEM;
290 goto fail_free;
291 }
292
293 return 0;
294
295fail_free:
296 gk20a_gmmu_free(vm->mm->g, mem);
297 return err;
298}
299
300int gk20a_gmmu_alloc_map_vid(struct vm_gk20a *vm, size_t size,
301 struct nvgpu_mem *mem)
302{
303 return gk20a_gmmu_alloc_map_flags_vid(vm,
304 NVGPU_DMA_NO_KERNEL_MAPPING, size, mem);
305}
306
307int gk20a_gmmu_alloc_map_flags_vid(struct vm_gk20a *vm, unsigned long flags,
308 size_t size, struct nvgpu_mem *mem)
309{
310 int err = gk20a_gmmu_alloc_flags_vid(vm->mm->g, flags, size, mem);
311
312 if (err)
313 return err;
314
315 mem->gpu_va = gk20a_gmmu_map(vm, &mem->sgt, size, 0,
316 gk20a_mem_flag_none, false,
317 mem->aperture);
318 if (!mem->gpu_va) {
319 err = -ENOMEM;
320 goto fail_free;
321 }
322
323 return 0;
324
325fail_free:
326 gk20a_gmmu_free(vm->mm->g, mem);
327 return err;
328}
329
/*
 * Free a sysmem nvgpu_mem allocated by gk20a_gmmu_alloc_flags_sys().
 *
 * The buffer must be released through the same DMA API variant (and with
 * the same attributes) that allocated it, so mem->flags is translated
 * back into DMA attrs here before freeing.
 */
static void gk20a_gmmu_free_sys(struct gk20a *g, struct nvgpu_mem *mem)
{
	struct device *d = dev_from_gk20a(g);

	if (mem->cpu_va || mem->pages) {
		if (mem->flags) {
			DEFINE_DMA_ATTRS(dma_attrs);

			gk20a_dma_flags_to_attrs(&dma_attrs, mem->flags);

			if (mem->flags & NVGPU_DMA_NO_KERNEL_MAPPING) {
				/* No CPU mapping: the pages array is handed back. */
				dma_free_attrs(d, mem->size, mem->pages,
					sg_dma_address(mem->sgt->sgl),
					__DMA_ATTR(dma_attrs));
			} else {
				dma_free_attrs(d, mem->size, mem->cpu_va,
					sg_dma_address(mem->sgt->sgl),
					__DMA_ATTR(dma_attrs));
			}
		} else {
			/* Flag-less allocations came from dma_alloc_coherent(). */
			dma_free_coherent(d, mem->size, mem->cpu_va,
					sg_dma_address(mem->sgt->sgl));
		}
		mem->cpu_va = NULL;
		mem->pages = NULL;
	}

	if (mem->sgt)
		gk20a_free_sgtable(g, &mem->sgt);

	/* Mark the descriptor as no longer backing any allocation. */
	mem->size = 0;
	mem->aperture = APERTURE_INVALID;
}
363
/*
 * Free a vidmem nvgpu_mem allocated by gk20a_gmmu_alloc_flags_vid_at().
 *
 * User-owned buffers are not freed synchronously: they are queued on the
 * vidmem clear list and released by the clear_mem_worker after their
 * contents have been scrubbed. Kernel-owned buffers are cleared and freed
 * inline. No-op when CONFIG_GK20A_VIDMEM is disabled.
 */
static void gk20a_gmmu_free_vid(struct gk20a *g, struct nvgpu_mem *mem)
{
#if defined(CONFIG_GK20A_VIDMEM)
	bool was_empty;

	/* Sanity check - only this supported when allocating. */
	WARN_ON(mem->flags != NVGPU_DMA_NO_KERNEL_MAPPING);

	if (mem->user_mem) {
		/*
		 * Queue under the clear-list lock; bytes_pending lets the
		 * allocator report -EAGAIN while frees are in flight.
		 */
		nvgpu_mutex_acquire(&g->mm.vidmem.clear_list_mutex);
		was_empty = nvgpu_list_empty(&g->mm.vidmem.clear_list_head);
		nvgpu_list_add_tail(&mem->clear_list_entry,
			      &g->mm.vidmem.clear_list_head);
		atomic64_add(mem->size, &g->mm.vidmem.bytes_pending);
		nvgpu_mutex_release(&g->mm.vidmem.clear_list_mutex);

		/*
		 * Only kick the worker when the list went from empty to
		 * non-empty; a running worker drains the whole list itself.
		 * NOTE(review): cancel before schedule — presumably to force
		 * a fresh run rather than rely on a finishing one; confirm.
		 */
		if (was_empty) {
			cancel_work_sync(&g->mm.vidmem.clear_mem_worker);
			schedule_work(&g->mm.vidmem.clear_mem_worker);
		}
	} else {
		/* Kernel-owned memory: scrub and release immediately. */
		nvgpu_memset(g, mem, 0, 0, mem->size);
		nvgpu_free(mem->allocator,
			   (u64)get_vidmem_page_alloc(mem->sgt->sgl));
		gk20a_free_sgtable(g, &mem->sgt);

		mem->size = 0;
		mem->aperture = APERTURE_INVALID;
	}
#endif
}
395
396void gk20a_gmmu_free(struct gk20a *g, struct nvgpu_mem *mem)
397{
398 switch (mem->aperture) {
399 case APERTURE_SYSMEM:
400 return gk20a_gmmu_free_sys(g, mem);
401 case APERTURE_VIDMEM:
402 return gk20a_gmmu_free_vid(g, mem);
403 default:
404 break; /* like free() on "null" memory */
405 }
406}
407
408void gk20a_gmmu_unmap_free(struct vm_gk20a *vm, struct nvgpu_mem *mem)
409{
410 if (mem->gpu_va)
411 gk20a_gmmu_unmap(vm, mem->gpu_va, mem->size, gk20a_mem_flag_none);
412 mem->gpu_va = 0;
413
414 gk20a_gmmu_free(vm->mm->g, mem);
415}
diff --git a/drivers/gpu/nvgpu/common/semaphore.c b/drivers/gpu/nvgpu/common/semaphore.c
index 6fb6c27e..cfe1149f 100644
--- a/drivers/gpu/nvgpu/common/semaphore.c
+++ b/drivers/gpu/nvgpu/common/semaphore.c
@@ -18,6 +18,7 @@
18#include <linux/dma-mapping.h> 18#include <linux/dma-mapping.h>
19#include <linux/highmem.h> 19#include <linux/highmem.h>
20 20
21#include <nvgpu/dma.h>
21#include <nvgpu/semaphore.h> 22#include <nvgpu/semaphore.h>
22#include <nvgpu/kmem.h> 23#include <nvgpu/kmem.h>
23 24