path: root/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
author    Terje Bergstrom <tbergstrom@nvidia.com>    2015-04-22 15:47:15 -0400
committer Deepak Nibade <dnibade@nvidia.com>    2016-12-27 04:52:05 -0500
commit    4b02177fd3c84e84a3e6894f3696feecf8f5c508 (patch)
tree      b573668dc14096ec76d85998530da46f581dd2d4 /drivers/gpu/nvgpu/gp10b/mm_gp10b.c
parent    faa1e5d82b8c3a2d125f04788f8146ba9b9b186c (diff)
gpu: nvgpu: gp10b: Make page mapping scatter aware
Augment new page mapping code to be aware of scattered buffers.

Bug 1605769

Change-Id: Ifdb326563d28ccf07fc4d3d76a24492a68493fe3
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: http://git-master/r/734355
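In rough terms, the patch stops treating the buffer as one contiguous IOVA range: after each PTE is written, the current address and chunk offset are advanced by the page size, and when the next page would fall outside the current scatterlist entry the code steps to the next one. Below is a minimal user-space sketch of that advance logic; the simplified chunk struct, the map_pages() helper and the example addresses are illustrative stand-ins for the kernel's struct scatterlist, sg_next() and sg_phys(), not the driver's actual types.

#include <stdio.h>
#include <stdint.h>
#include <stddef.h>

/* Simplified stand-in for struct scatterlist: one physically
 * contiguous chunk of the buffer. */
struct chunk {
        uint64_t phys;   /* start address of the chunk */
        uint64_t length; /* size of the chunk in bytes */
};

/* Walk a chunk list one page at a time, mirroring the
 * iova/offset/sgl advance done after each PTE write. */
static void map_pages(struct chunk *chunks, size_t nchunks, uint64_t page_size)
{
        size_t ci = 0;
        uint64_t iova = chunks[0].phys;
        uint64_t offset = 0;
        unsigned int pte = 0;

        while (ci < nchunks) {
                /* Here the real code would write the PTE for 'iova'. */
                printf("pte=%u -> 0x%llx\n", pte++, (unsigned long long)iova);

                iova += page_size;
                offset += page_size;
                /* If the next page would run past the current chunk,
                 * move on to the next one (like sg_next()/sg_phys()). */
                if (offset + page_size > chunks[ci].length) {
                        ci++;
                        if (ci < nchunks) {
                                iova = chunks[ci].phys;
                                offset = 0;
                        }
                }
        }
}

int main(void)
{
        struct chunk buf[] = {
                { 0x100000, 0x2000 }, /* two 4 KiB pages */
                { 0x800000, 0x1000 }, /* one 4 KiB page, discontiguous */
        };

        map_pages(buf, sizeof(buf) / sizeof(buf[0]), 0x1000);
        return 0;
}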
Diffstat (limited to 'drivers/gpu/nvgpu/gp10b/mm_gp10b.c')
-rw-r--r--    drivers/gpu/nvgpu/gp10b/mm_gp10b.c    49
1 file changed, 40 insertions(+), 9 deletions(-)
diff --git a/drivers/gpu/nvgpu/gp10b/mm_gp10b.c b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
index 1608b176..3633e9d9 100644
--- a/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
+++ b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
@@ -148,7 +148,9 @@ u32 *pde3_from_index(struct gk20a_mm_entry *entry, u32 i)
 static int update_gmmu_pde3_locked(struct vm_gk20a *vm,
                 struct gk20a_mm_entry *parent,
                 u32 i, u32 gmmu_pgsz_idx,
-                u64 iova,
+                struct scatterlist **sgl,
+                u64 *offset,
+                u64 *iova,
                 u32 kind_v, u32 *ctag,
                 bool cacheable, bool unmapped_pte,
                 int rw_flag, bool sparse, u32 flags)
@@ -188,7 +190,9 @@ u32 *pde0_from_index(struct gk20a_mm_entry *entry, u32 i)
 static int update_gmmu_pde0_locked(struct vm_gk20a *vm,
                 struct gk20a_mm_entry *pte,
                 u32 i, u32 gmmu_pgsz_idx,
-                u64 iova,
+                struct scatterlist **sgl,
+                u64 *offset,
+                u64 *iova,
                 u32 kind_v, u32 *ctag,
                 bool cacheable, bool unmapped_pte,
                 int rw_flag, bool sparse, u32 flags)
@@ -241,7 +245,9 @@ static int update_gmmu_pde0_locked(struct vm_gk20a *vm,
 static int update_gmmu_pte_locked(struct vm_gk20a *vm,
                 struct gk20a_mm_entry *pte,
                 u32 i, u32 gmmu_pgsz_idx,
-                u64 iova,
+                struct scatterlist **sgl,
+                u64 *offset,
+                u64 *iova,
                 u32 kind_v, u32 *ctag,
                 bool cacheable, bool unmapped_pte,
                 int rw_flag, bool sparse, u32 flags)
@@ -251,23 +257,31 @@ static int update_gmmu_pte_locked(struct vm_gk20a *vm,
 
         gk20a_dbg_fn("");
 
-        if (iova) {
-                pte_w[0] = gmmu_new_pte_valid_true_f() |
-                        gmmu_new_pte_address_sys_f(iova
-                        >> gmmu_new_pte_address_shift_v());
+        if (*iova) {
+                if (unmapped_pte)
+                        pte_w[0] = gmmu_new_pte_valid_false_f() |
+                                gmmu_new_pte_address_sys_f(*iova
+                                >> gmmu_new_pte_address_shift_v());
+                else
+                        pte_w[0] = gmmu_new_pte_valid_true_f() |
+                                gmmu_new_pte_address_sys_f(*iova
+                                >> gmmu_new_pte_address_shift_v());
+
                 pte_w[1] = gmmu_new_pte_aperture_video_memory_f() |
                         gmmu_new_pte_kind_f(kind_v) |
                         gmmu_new_pte_comptagline_f(*ctag / SZ_128K);
 
                 if (rw_flag == gk20a_mem_flag_read_only)
                         pte_w[0] |= gmmu_new_pte_read_only_true_f();
-                if (!cacheable)
+                if (unmapped_pte && !cacheable)
+                        pte_w[0] |= gmmu_new_pte_read_only_true_f();
+                else if (!cacheable)
                         pte_w[1] |= gmmu_new_pte_vol_true_f();
 
                 gk20a_dbg(gpu_dbg_pte, "pte=%d iova=0x%llx kind=%d"
                         " ctag=%d vol=%d"
                         " [0x%08x, 0x%08x]",
-                        i, iova,
+                        i, *iova,
                         kind_v, *ctag, !cacheable,
                         pte_w[1], pte_w[0]);
 
@@ -283,6 +297,23 @@ static int update_gmmu_pte_locked(struct vm_gk20a *vm,
         gk20a_mem_wr32(pte->cpu_va + i*8, 0, pte_w[0]);
         gk20a_mem_wr32(pte->cpu_va + i*8, 1, pte_w[1]);
 
+        if (*iova) {
+                *iova += page_size;
+                *offset += page_size;
+                if (*sgl && *offset + page_size > (*sgl)->length) {
+                        u64 new_iova;
+                        *sgl = sg_next(*sgl);
+                        if (*sgl) {
+                                new_iova = sg_phys(*sgl);
+                                gk20a_dbg(gpu_dbg_pte, "chunk address %llx, size %d",
+                                          new_iova, (*sgl)->length);
+                                if (new_iova) {
+                                        *offset = 0;
+                                        *iova = new_iova;
+                                }
+                        }
+                }
+        }
         gk20a_dbg_fn("done");
         return 0;
 }
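For context, the per-PTE helpers now take struct scatterlist **sgl, u64 *offset and u64 *iova rather than a plain u64 iova because the page-table walker calls them once per page, and the scatterlist cursor has to persist from one call to the next. A hedged sketch of how a walker might thread those pointers through is below; walk_and_map(), write_one_pte and the loop itself are illustrative stand-ins under that assumption, not the actual gk20a walker.

#include <linux/scatterlist.h>
#include <linux/types.h>

/* Illustrative per-PTE callback with the same cursor-style parameters
 * as update_gmmu_pte_locked(): pointers let each call advance the
 * scatterlist position for the next one. */
typedef int (*pte_fn_t)(u32 i, struct scatterlist **sgl,
                        u64 *offset, u64 *iova);

/* Hypothetical walker: maps 'num_pages' pages starting from the first
 * scatterlist entry, letting the callback advance sgl/offset/iova. */
static int walk_and_map(struct scatterlist *sgl, u32 num_pages,
                        pte_fn_t write_one_pte)
{
        u64 offset = 0;
        u64 iova = sgl ? sg_phys(sgl) : 0;
        u32 i;
        int err;

        for (i = 0; i < num_pages; i++) {
                err = write_one_pte(i, &sgl, &offset, &iova);
                if (err)
                        return err;
        }
        return 0;
}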