gpu: nvgpu: Split out pramin code

Split out the pramin interface code in preparation for splitting out the mem_desc code.

JIRA NVGPU-12

Change-Id: I3f03447ea213cc15669b0934fa706e7cb22599b7
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: http://git-master/r/1323323
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
author: Alex Waterman <alexw@nvidia.com> 2017-03-15 18:49:18 -0400
committer: mobile promotions <svcmobile_promotions@nvidia.com> 2017-03-31 20:21:34 -0400
commit: dd88aed5cc3088285c5d0b900aebf705f52178c5 (patch)
tree: 371ffb74c97305be99fe312b45e30793dab36926 /drivers/gpu/nvgpu/common
parent: 56df8c58088b5c8b4a09ce6f5e195614251bf8d0 (diff)
1 files changed, 129 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/pramin.c b/drivers/gpu/nvgpu/common/pramin.c
new file mode 100644
index 00000000..b9216309
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/pramin.c
@@ -0,0 +1,129 @@
+/*
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+#include <nvgpu/pramin.h>
+#include <nvgpu/page_allocator.h>
+#include "gk20a/gk20a.h"
+/*
+ * Set this to true to force all gk20a_mem* accesses to go via PRAMIN from the
+ * start of boot, even for buffers that would work via cpu_va. At runtime, the
+ * same flag is available in debugfs under the name "force_pramin".
+ */
+#define GK20A_FORCE_PRAMIN_DEFAULT false
+/*
+ * Batch callback: read "words" consecutive 32-bit registers, beginning at
+ * register offset "start", into the buffer that *arg points at.
+ *
+ * On success *arg is advanced past the last word stored, so a following call
+ * continues in the same buffer. If g->regs is not set,
+ * __gk20a_warn_on_no_regs() is called and neither the buffer nor *arg is
+ * touched.
+ */
+void pramin_access_batch_rd_n(struct gk20a *g, u32 start, u32 words, u32 **arg)
+{
+        u32 *out = *arg;
+        u32 reg = start;
+        u32 i;
+
+        if (!g->regs) {
+                __gk20a_warn_on_no_regs();
+                return;
+        }
+
+        for (i = 0; i < words; i++, reg += sizeof(u32))
+                out[i] = gk20a_readl(g, reg);
+
+        *arg = out + words;
+}
+/*
+ * Batch callback: write "words" 32-bit values taken from the buffer that *arg
+ * points at to consecutive registers, beginning at register offset "start".
+ *
+ * The stores use writel_relaxed(); this function itself issues no read-back.
+ * On success *arg is advanced past the last word consumed. If g->regs is not
+ * set, __gk20a_warn_on_no_regs() is called and nothing is written or
+ * advanced.
+ */
+void pramin_access_batch_wr_n(struct gk20a *g, u32 start, u32 words, u32 **arg)
+{
+        u32 *in = *arg;
+        u32 reg = start;
+        u32 i;
+
+        if (!g->regs) {
+                __gk20a_warn_on_no_regs();
+                return;
+        }
+
+        for (i = 0; i < words; i++, reg += sizeof(u32))
+                writel_relaxed(in[i], g->regs + reg);
+
+        *arg = in + words;
+}
+/*
+ * Batch callback: fill "words" consecutive 32-bit registers, beginning at
+ * register offset "start", with one repeated value.
+ *
+ * The fill value is the u32 that *arg points at; unlike the read and write
+ * callbacks, *arg is left unchanged. The stores use writel_relaxed(). If
+ * g->regs is not set, __gk20a_warn_on_no_regs() is called and nothing is
+ * written.
+ */
+void pramin_access_batch_set(struct gk20a *g, u32 start, u32 words, u32 **arg)
+{
+        u32 fill = **arg;
+        u32 reg = start;
+        u32 i;
+
+        if (!g->regs) {
+                __gk20a_warn_on_no_regs();
+                return;
+        }
+
+        for (i = 0; i < words; i++, reg += sizeof(u32))
+                writel_relaxed(fill, g->regs + reg);
+}
+/*
+ * Walk a vidmem buffer through the PRAMIN window and call "loop" once for
+ * every contiguous piece of it.
+ *
+ * The PRAMIN range is 1 MB, so the window base must change whenever the
+ * access crosses that; a piece is also cut at the end of the current
+ * allocator chunk. This same walk is used for read/write/memset.
+ *
+ * @g:      GPU whose pramin ops and registers are used
+ * @mem:    buffer to access; mem->sgt->sgl is handed to
+ *          get_vidmem_page_alloc() to find its chunk list
+ * @offset: byte offset into the buffer at which the access starts
+ * @size:   number of bytes to access
+ * @loop:   batch callback, invoked per piece as
+ *          loop(g, first_register, word_count, arg)
+ * @arg:    passed through unchanged to every "loop" call
+ *
+ * NOTE(review): nothing here checks offset + size against the total length
+ * of the chunks; the caller must guarantee the range lies inside the buffer,
+ * otherwise "chunk" walks off the end of the list.
+ */
+void nvgpu_pramin_access_batched(struct gk20a *g, struct mem_desc *mem,
+                u32 offset, u32 size, pramin_access_batch_fn loop, u32 **arg)
+{
+        struct nvgpu_page_alloc *alloc = NULL;
+        struct page_alloc_chunk *chunk = NULL;
+        u32 byteoff, start_reg, until_end, n;
+
+        /* Find the chunk holding "offset"; offset becomes chunk-relative. */
+        alloc = get_vidmem_page_alloc(mem->sgt->sgl);
+        list_for_each_entry(chunk, &alloc->alloc_chunks, list_entry) {
+                if (offset >= chunk->length)
+                        offset -= chunk->length;
+                else
+                        break;
+        }
+
+        /*
+         * "offset" stays in bytes for the whole walk so that it can be
+         * compared against chunk->length, which is in bytes as well. It used
+         * to be converted to words up front, which made the
+         * "chunk->length - offset" remainder too large for any non-zero
+         * offset: accesses could run past the chunk and the end-of-chunk test
+         * below never matched.
+         */
+        while (size) {
+                /* enter() is given the chunk-relative offset in u32 words. */
+                byteoff = g->ops.pramin.enter(g, mem, chunk,
+                                              offset / sizeof(u32));
+                start_reg = g->ops.pramin.data032_r(byteoff / sizeof(u32));
+                /* bytes left before the end of the 1 MB window */
+                until_end = SZ_1M - (byteoff & (SZ_1M - 1));
+
+                /* Stop at whichever ends first: request, window or chunk. */
+                n = min3(size, until_end, (u32)(chunk->length - offset));
+
+                loop(g, start_reg, n / sizeof(u32), arg);
+
+                /* read back to synchronize accesses */
+                gk20a_readl(g, start_reg);
+                g->ops.pramin.exit(g, mem, chunk);
+
+                size -= n;
+
+                if (n == (chunk->length - offset)) {
+                        /* Chunk exhausted: continue at the next one. */
+                        chunk = list_next_entry(chunk, list_entry);
+                        offset = 0;
+                } else {
+                        offset += n;
+                }
+        }
+}
+/*
+ * Put the PRAMIN bookkeeping in "mm" into its initial state: window value 0,
+ * an initialised window spinlock, and force_pramin set to the compile-time
+ * default GK20A_FORCE_PRAMIN_DEFAULT.
+ */
+void nvgpu_init_pramin(struct mm_gk20a *mm)
+{
+        mm->force_pramin = GK20A_FORCE_PRAMIN_DEFAULT;
+
+        nvgpu_spinlock_init(&mm->pramin_window_lock);
+        mm->pramin_window = 0;
+}
author	Alex Waterman <alexw@nvidia.com>	2017-03-15 18:49:18 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2017-03-31 20:21:34 -0400
commit	dd88aed5cc3088285c5d0b900aebf705f52178c5 (patch)
tree	371ffb74c97305be99fe312b45e30793dab36926 /drivers/gpu/nvgpu/common
parent	56df8c58088b5c8b4a09ce6f5e195614251bf8d0 (diff)

diff --git a/drivers/gpu/nvgpu/common/pramin.c b/drivers/gpu/nvgpu/common/pramin.c
new file mode 100644
index 00000000..b9216309
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/pramin.c
@@ -0,0 +1,129 @@
	1	/*
	2	* Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
	3	*
	4	* This program is free software; you can redistribute it and/or modify it
	5	* under the terms and conditions of the GNU General Public License,
	6	* version 2, as published by the Free Software Foundation.
	7	*
	8	* This program is distributed in the hope it will be useful, but WITHOUT
	9	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	10	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
	11	* more details.
	12	*
	13	* You should have received a copy of the GNU General Public License
	14	* along with this program. If not, see <http://www.gnu.org/licenses/>.
	15	*/
	16
	17	#include <nvgpu/pramin.h>
	18	#include <nvgpu/page_allocator.h>
	19
	20	#include "gk20a/gk20a.h"
	21
	22	/*
	23	* Flip this to force all gk20a_mem* accesses via PRAMIN from the start of the
	24	* boot, even for buffers that would work via cpu_va. In runtime, the flag is
	25	* in debugfs, called "force_pramin".
	26	*/
	27	#define GK20A_FORCE_PRAMIN_DEFAULT false
	28
	29	void pramin_access_batch_rd_n(struct gk20a *g, u32 start, u32 words, u32 **arg)
	30	{
	31	u32 r = start, *dest_u32 = *arg;
	32
	33	if (!g->regs) {
	34	__gk20a_warn_on_no_regs();
	35	return;
	36	}
	37
	38	while (words--) {
	39	*dest_u32++ = gk20a_readl(g, r);
	40	r += sizeof(u32);
	41	}
	42
	43	*arg = dest_u32;
	44	}
	45
	46	void pramin_access_batch_wr_n(struct gk20a *g, u32 start, u32 words, u32 **arg)
	47	{
	48	u32 r = start, *src_u32 = *arg;
	49
	50	if (!g->regs) {
	51	__gk20a_warn_on_no_regs();
	52	return;
	53	}
	54
	55	while (words--) {
	56	writel_relaxed(*src_u32++, g->regs + r);
	57	r += sizeof(u32);
	58	}
	59
	60	*arg = src_u32;
	61	}
	62
	63	void pramin_access_batch_set(struct gk20a *g, u32 start, u32 words, u32 **arg)
	64	{
	65	u32 r = start, repeat = **arg;
	66
	67	if (!g->regs) {
	68	__gk20a_warn_on_no_regs();
	69	return;
	70	}
	71
	72	while (words--) {
	73	writel_relaxed(repeat, g->regs + r);
	74	r += sizeof(u32);
	75	}
	76	}
	77
	78	/*
	79	* The PRAMIN range is 1 MB, must change base addr if a buffer crosses that.
	80	* This same loop is used for read/write/memset. Offset and size in bytes.
	81	* One call to "loop" is done per range, with "arg" supplied.
	82	*/
	83	void nvgpu_pramin_access_batched(struct gk20a *g, struct mem_desc *mem,
	84	u32 offset, u32 size, pramin_access_batch_fn loop, u32 **arg)
	85	{
	86	struct nvgpu_page_alloc *alloc = NULL;
	87	struct page_alloc_chunk *chunk = NULL;
	88	u32 byteoff, start_reg, until_end, n;
	89
	90	alloc = get_vidmem_page_alloc(mem->sgt->sgl);
	91	list_for_each_entry(chunk, &alloc->alloc_chunks, list_entry) {
	92	if (offset >= chunk->length)
	93	offset -= chunk->length;
	94	else
	95	break;
	96	}
	97
	98	offset /= sizeof(u32);
	99
	100	while (size) {
	101	byteoff = g->ops.pramin.enter(g, mem, chunk, offset);
	102	start_reg = g->ops.pramin.data032_r(byteoff / sizeof(u32));
	103	until_end = SZ_1M - (byteoff & (SZ_1M - 1));
	104
	105	n = min3(size, until_end, (u32)(chunk->length - offset));
	106
	107	loop(g, start_reg, n / sizeof(u32), arg);
	108
	109	/* read back to synchronize accesses */
	110	gk20a_readl(g, start_reg);
	111	g->ops.pramin.exit(g, mem, chunk);
	112
	113	size -= n;
	114
	115	if (n == (chunk->length - offset)) {
	116	chunk = list_next_entry(chunk, list_entry);
	117	offset = 0;
	118	} else {
	119	offset += n / sizeof(u32);
	120	}
	121	}
	122	}
	123
	124	void nvgpu_init_pramin(struct mm_gk20a *mm)
	125	{
	126	mm->pramin_window = 0;
	127	nvgpu_spinlock_init(&mm->pramin_window_lock);
	128	mm->force_pramin = GK20A_FORCE_PRAMIN_DEFAULT;
	129	}