gpu: nvgpu: Update Linux side VM code for API solidification

Update the Linux specific code to match the MM API docs in the previous patch. The user-passed page size is plumbed through the Linux VM mapping calls but is ultimately ignored once the core VM code is called. This will be handled in the next patch.

This also adds some code to make the CDE page size picking happen semi-intelligently. In many cases the CDE buffers can be mapped with large pages.

Bug 2011640

Change-Id: I20e78e7d5a841e410864b474179e71da1c2482f4
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1740610
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
author: Alex Waterman <alexw@nvidia.com> 2018-06-05 15:53:16 -0400
committer: mobile promotions <svcmobile_promotions@nvidia.com> 2018-06-22 13:04:16 -0400
commit: 840e039d57d4acfb2be2a82c4b95a6d25c7aacd4 (patch)
tree: a4a358cf6bb5d005e8f6db159d1b3b03ddbf94df /drivers/gpu/nvgpu/os/linux/cde.c
parent: 46666ed101847d9b87ea60cd432dea97afbef0b1 (diff)
1 files changed, 28 insertions, 1 deletions
diff --git a/drivers/gpu/nvgpu/os/linux/cde.c b/drivers/gpu/nvgpu/os/linux/cde.c
index 66a80403..052a1d21 100644
--- a/drivers/gpu/nvgpu/os/linux/cde.c
+++ b/drivers/gpu/nvgpu/os/linux/cde.c
@@ -975,6 +975,30 @@ static struct gk20a_cde_ctx *gk20a_cde_allocate_context(struct nvgpu_os_linux *l
        return cde_ctx;
 }
+static u32 gk20a_cde_mapping_page_size(struct vm_gk20a *vm,
+                                       u32 map_offset, u32 map_size)
+{
+        struct gk20a *g = gk20a_from_vm(vm);
+        /*
+         * Pick the page size for a CDE mapping. To keep this simple, the
+         * choice hinges on whether the GPU is IOMMU'able: with an IOMMU we
+         * can rely on buffers being contiguous; without one, fall back to
+         * 4K pages, since those work for any buffer.
+         */
+        if (!nvgpu_iommuable(g))
+                return SZ_4K;
+        /*
+         * Use small pages unless map size and offset are big-page aligned.
+         */
+        if (map_size & (vm->big_page_size - 1) ||
+            map_offset & (vm->big_page_size - 1))
+                return SZ_4K;
+        return vm->big_page_size;
+}
 int gk20a_cde_convert(struct nvgpu_os_linux *l,
                      struct dma_buf *compbits_scatter_buf,
                      u64 compbits_byte_offset,
@@ -1071,7 +1095,10 @@ __releases(&l->cde_app->mutex)
        err = nvgpu_vm_map_linux(cde_ctx->vm, compbits_scatter_buf, 0,
                                 NVGPU_VM_MAP_CACHEABLE |
                                 NVGPU_VM_MAP_DIRECT_KIND_CTRL,
-                                 NVGPU_KIND_INVALID,
+                                 gk20a_cde_mapping_page_size(cde_ctx->vm,
+                                                             map_offset,
+                                                             map_size),
+                                 NV_KIND_INVALID,
                                 compbits_kind, /* incompressible kind */
                                 gk20a_mem_flag_none,
                                 map_offset, map_size,
author	Alex Waterman <alexw@nvidia.com>	2018-06-05 15:53:16 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2018-06-22 13:04:16 -0400
commit	840e039d57d4acfb2be2a82c4b95a6d25c7aacd4 (patch)
tree	a4a358cf6bb5d005e8f6db159d1b3b03ddbf94df /drivers/gpu/nvgpu/os/linux/cde.c
parent	46666ed101847d9b87ea60cd432dea97afbef0b1 (diff)

diff --git a/drivers/gpu/nvgpu/os/linux/cde.c b/drivers/gpu/nvgpu/os/linux/cde.c
index 66a80403..052a1d21 100644
--- a/drivers/gpu/nvgpu/os/linux/cde.c
+++ b/drivers/gpu/nvgpu/os/linux/cde.c
@@ -975,6 +975,30 @@ static struct gk20a_cde_ctx *gk20a_cde_allocate_context(struct nvgpu_os_linux *l
975	return cde_ctx;	975	return cde_ctx;
976	}	976	}
977		977
		978	static u32 gk20a_cde_mapping_page_size(struct vm_gk20a *vm,
		979	u32 map_offset, u32 map_size)
		980	{
		981	struct gk20a *g = gk20a_from_vm(vm);
		982
		983	/*
		984	* To be simple we will just make the map size depend on the
		985	* iommu'ability of the driver. If there's an IOMMU we can rely on
		986	* buffers being contiguous. If not, then we'll use 4k pages since we
		987	* know that will work for any buffer.
		988	*/
		989	if (!nvgpu_iommuable(g))
		990	return SZ_4K;
		991
		992	/*
		993	* If map size or offset is not 64K aligned then use small pages.
		994	*/
		995	if (map_size & (vm->big_page_size - 1) ||
		996	map_offset & (vm->big_page_size - 1))
		997	return SZ_4K;
		998
		999	return vm->big_page_size;
		1000	}
		1001
978	int gk20a_cde_convert(struct nvgpu_os_linux *l,	1002	int gk20a_cde_convert(struct nvgpu_os_linux *l,
979	struct dma_buf *compbits_scatter_buf,	1003	struct dma_buf *compbits_scatter_buf,
980	u64 compbits_byte_offset,	1004	u64 compbits_byte_offset,
@@ -1071,7 +1095,10 @@ __releases(&l->cde_app->mutex)
1071	err = nvgpu_vm_map_linux(cde_ctx->vm, compbits_scatter_buf, 0,	1095	err = nvgpu_vm_map_linux(cde_ctx->vm, compbits_scatter_buf, 0,
1072	NVGPU_VM_MAP_CACHEABLE |	1096	NVGPU_VM_MAP_CACHEABLE |
1073	NVGPU_VM_MAP_DIRECT_KIND_CTRL,	1097	NVGPU_VM_MAP_DIRECT_KIND_CTRL,
1074	NVGPU_KIND_INVALID,	1098	gk20a_cde_mapping_page_size(cde_ctx->vm,
		1099	map_offset,
		1100	map_size),
		1101	NV_KIND_INVALID,
1075	compbits_kind, /* incompressible kind */	1102	compbits_kind, /* incompressible kind */
1076	gk20a_mem_flag_none,	1103	gk20a_mem_flag_none,
1077	map_offset, map_size,	1104	map_offset, map_size,