Diffstat (limited to 'drivers')
-rw-r--r--  drivers/gpu/nvgpu/gk20a/gr_gk20a.c | 95
-rw-r--r--  drivers/gpu/nvgpu/gk20a/mm_gk20a.c |  1
-rw-r--r--  drivers/gpu/nvgpu/gk20a/mm_gk20a.h |  6
-rw-r--r--  drivers/gpu/nvgpu/vgpu/gr_vgpu.c   | 21
4 files changed, 37 insertions(+), 86 deletions(-)
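
In short, this change collapses the graphics patch-context's hand-rolled DMA bookkeeping (pages, iova, size, cpu_va, gpu_va) into a single embedded mem_desc, so allocation and teardown can go through the common gmmu helpers instead of open-coded dma_alloc_attrs/sg_table handling. A rough before/after of the descriptor, using stand-in field types rather than the real nvgpu headers:

	/* Stand-in sketch only; field types approximate the nvgpu structures. */
	#include <stddef.h>

	struct page;
	struct sg_table;

	/* Before: patch_desc tracked every piece of the allocation itself. */
	struct patch_desc_before {
		struct page **pages;
		unsigned long long iova;
		size_t size;
		void *cpu_va;
		unsigned long long gpu_va;
		unsigned int data_count;
	};

	/* After: everything except the write counter lives in one mem_desc. */
	struct mem_desc_sketch {
		struct page **pages;
		struct sg_table *sgt;
		void *cpu_va;
		unsigned long long gpu_va;
		size_t size;
	};

	struct patch_desc_after {
		struct mem_desc_sketch mem;
		unsigned int data_count;
	};
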
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 49b70767..293ccd97 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -597,16 +597,16 @@ int gr_gk20a_ctx_patch_write_begin(struct gk20a *g,
 		  struct channel_ctx_gk20a *ch_ctx)
 {
 	/* being defensive still... */
-	if (WARN_ON(ch_ctx->patch_ctx.cpu_va)) {
+	if (WARN_ON(ch_ctx->patch_ctx.mem.cpu_va)) {
 		gk20a_err(dev_from_gk20a(g), "nested ctx patch begin?");
 		return -EBUSY;
 	}
 
-	ch_ctx->patch_ctx.cpu_va = vmap(ch_ctx->patch_ctx.pages,
-			PAGE_ALIGN(ch_ctx->patch_ctx.size) >> PAGE_SHIFT,
+	ch_ctx->patch_ctx.mem.cpu_va = vmap(ch_ctx->patch_ctx.mem.pages,
+			PAGE_ALIGN(ch_ctx->patch_ctx.mem.size) >> PAGE_SHIFT,
 			0, pgprot_writecombine(PAGE_KERNEL));
 
-	if (!ch_ctx->patch_ctx.cpu_va)
+	if (!ch_ctx->patch_ctx.mem.cpu_va)
 		return -ENOMEM;
 
 	return 0;
@@ -616,13 +616,13 @@ int gr_gk20a_ctx_patch_write_end(struct gk20a *g,
 		  struct channel_ctx_gk20a *ch_ctx)
 {
 	/* being defensive still... */
-	if (!ch_ctx->patch_ctx.cpu_va) {
+	if (!ch_ctx->patch_ctx.mem.cpu_va) {
 		gk20a_err(dev_from_gk20a(g), "dangling ctx patch end?");
 		return -EINVAL;
 	}
 
-	vunmap(ch_ctx->patch_ctx.cpu_va);
-	ch_ctx->patch_ctx.cpu_va = NULL;
+	vunmap(ch_ctx->patch_ctx.mem.cpu_va);
+	ch_ctx->patch_ctx.mem.cpu_va = NULL;
 	return 0;
 }
 
@@ -642,7 +642,7 @@ int gr_gk20a_ctx_patch_write(struct gk20a *g,
 	/* we added an optimization prolog, epilog
 	 * to get rid of unnecessary maps and l2 invals.
 	 * but be defensive still... */
-	if (!ch_ctx->patch_ctx.cpu_va) {
+	if (!ch_ctx->patch_ctx.mem.cpu_va) {
 		int err;
 		gk20a_err(dev_from_gk20a(g),
 			  "per-write ctx patch begin?");
@@ -654,7 +654,7 @@ int gr_gk20a_ctx_patch_write(struct gk20a *g,
 	} else
 		mapped_here = false;
 
-	patch_ptr = ch_ctx->patch_ctx.cpu_va;
+	patch_ptr = ch_ctx->patch_ctx.mem.cpu_va;
 	patch_slot = ch_ctx->patch_ctx.data_count * 2;
 
 	gk20a_mem_wr32(patch_ptr, patch_slot++, addr);
@@ -1622,8 +1622,8 @@ int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
 	gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_num_save_ops_o(), 0, 0);
 	gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_num_restore_ops_o(), 0, 0);
 
-	virt_addr_lo = u64_lo32(ch_ctx->patch_ctx.gpu_va);
-	virt_addr_hi = u64_hi32(ch_ctx->patch_ctx.gpu_va);
+	virt_addr_lo = u64_lo32(ch_ctx->patch_ctx.mem.gpu_va);
+	virt_addr_hi = u64_hi32(ch_ctx->patch_ctx.mem.gpu_va);
 
 	gk20a_mem_wr32(ctx_ptr + ctxsw_prog_main_image_patch_count_o(), 0,
 		 ch_ctx->patch_ctx.data_count);
@@ -2568,82 +2568,33 @@ static int gr_gk20a_alloc_channel_patch_ctx(struct gk20a *g,
 		struct channel_gk20a *c)
 {
 	struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
-	struct device *d = dev_from_gk20a(g);
 	struct vm_gk20a *ch_vm = c->vm;
-	DEFINE_DMA_ATTRS(attrs);
-	struct sg_table *sgt;
 	int err = 0;
-	dma_addr_t iova;
 
 	gk20a_dbg_fn("");
 
-	patch_ctx->size = 128 * sizeof(u32);
-	dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, &attrs);
-	patch_ctx->pages = dma_alloc_attrs(d, patch_ctx->size,
-				&iova, GFP_KERNEL,
-				&attrs);
-	if (!patch_ctx->pages)
-		return -ENOMEM;
-
-	patch_ctx->iova = iova;
-	err = gk20a_get_sgtable_from_pages(d, &sgt, patch_ctx->pages,
-			patch_ctx->iova, patch_ctx->size);
+	err = gk20a_gmmu_alloc_map_attr(ch_vm, DMA_ATTR_NO_KERNEL_MAPPING,
+			128 * sizeof(u32), &patch_ctx->mem);
 	if (err)
-		goto err_free;
-
-	patch_ctx->gpu_va = gk20a_gmmu_map(ch_vm, &sgt, patch_ctx->size,
-					0, gk20a_mem_flag_none);
-	if (!patch_ctx->gpu_va)
-		goto err_free_sgtable;
-
-	gk20a_free_sgtable(&sgt);
+		return err;
 
 	gk20a_dbg_fn("done");
 	return 0;
-
-err_free_sgtable:
-	gk20a_free_sgtable(&sgt);
-err_free:
-	dma_free_attrs(d, patch_ctx->size,
-		patch_ctx->pages, patch_ctx->iova, &attrs);
-	patch_ctx->pages = NULL;
-	patch_ctx->iova = 0;
-	gk20a_err(dev_from_gk20a(g), "fail");
-	return err;
-}
-
-static void gr_gk20a_unmap_channel_patch_ctx(struct channel_gk20a *c)
-{
-	struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
-	struct vm_gk20a *ch_vm = c->vm;
-
-	gk20a_dbg_fn("");
-
-	if (patch_ctx->gpu_va)
-		gk20a_gmmu_unmap(ch_vm, patch_ctx->gpu_va,
-			patch_ctx->size, gk20a_mem_flag_none);
-	patch_ctx->gpu_va = 0;
-	patch_ctx->data_count = 0;
 }
 
 static void gr_gk20a_free_channel_patch_ctx(struct channel_gk20a *c)
 {
 	struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
 	struct gk20a *g = c->g;
-	struct device *d = dev_from_gk20a(g);
-	DEFINE_DMA_ATTRS(attrs);
 
 	gk20a_dbg_fn("");
 
-	gr_gk20a_unmap_channel_patch_ctx(c);
+	if (patch_ctx->mem.gpu_va)
+		gk20a_gmmu_unmap(c->vm, patch_ctx->mem.gpu_va,
+				patch_ctx->mem.size, gk20a_mem_flag_none);
 
-	if (patch_ctx->pages) {
-		dma_set_attr(DMA_ATTR_NO_KERNEL_MAPPING, &attrs);
-		dma_free_attrs(d, patch_ctx->size,
-			patch_ctx->pages, patch_ctx->iova, &attrs);
-		patch_ctx->pages = NULL;
-		patch_ctx->iova = 0;
-	}
+	gk20a_gmmu_free_attr(g, DMA_ATTR_NO_KERNEL_MAPPING, &patch_ctx->mem);
+	patch_ctx->data_count = 0;
 }
 
 void gk20a_free_channel_ctx(struct channel_gk20a *c)
@@ -2757,7 +2708,7 @@ int gk20a_alloc_obj_ctx(struct channel_gk20a *c,
 	}
 
 	/* allocate patch buffer */
-	if (ch_ctx->patch_ctx.pages == NULL) {
+	if (ch_ctx->patch_ctx.mem.sgt == NULL) {
 		err = gr_gk20a_alloc_channel_patch_ctx(g, c);
 		if (err) {
 			gk20a_err(dev_from_gk20a(g),
@@ -2883,7 +2834,7 @@ int gk20a_free_obj_ctx(struct channel_gk20a *c,
 		gk20a_disable_channel(c,
 			!c->has_timedout,
 			timeout);
-		gr_gk20a_unmap_channel_patch_ctx(c);
+		gr_gk20a_free_channel_patch_ctx(c);
 	}
 
 	return 0;
@@ -6081,8 +6032,8 @@ static int gr_gk20a_ctx_patch_smpc(struct gk20a *g,
 		gr_gk20a_ctx_patch_write(g, ch_ctx,
 					 addr, data, true);
 
-		vaddr_lo = u64_lo32(ch_ctx->patch_ctx.gpu_va);
-		vaddr_hi = u64_hi32(ch_ctx->patch_ctx.gpu_va);
+		vaddr_lo = u64_lo32(ch_ctx->patch_ctx.mem.gpu_va);
+		vaddr_hi = u64_hi32(ch_ctx->patch_ctx.mem.gpu_va);
 
 		gk20a_mem_wr32(context +
 			 ctxsw_prog_main_image_patch_count_o(),
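
The net effect in gr_gk20a.c is that both paths now funnel through the shared helpers: gk20a_gmmu_alloc_map_attr allocates and maps the 128-word patch buffer in one call, and teardown is just gk20a_gmmu_unmap plus gk20a_gmmu_free_attr, which is why the sg_table juggling and the err_free/err_free_sgtable unwind labels disappear. A minimal usage sketch of that shape; the stub types and exact parameter types are assumptions mirroring the calls in the diff, not the real nvgpu declarations:

	#include <stddef.h>

	struct gk20a;
	struct vm_gk20a;

	struct mem_desc {			/* stand-in descriptor */
		void *cpu_va;
		unsigned long long gpu_va;
		size_t size;
	};

	enum dma_attr { DMA_ATTR_NO_KERNEL_MAPPING };
	enum gk20a_mem_flag { gk20a_mem_flag_none };

	/* Declarations mirroring the helpers the new code relies on. */
	int gk20a_gmmu_alloc_map_attr(struct vm_gk20a *vm, enum dma_attr attr,
				      size_t size, struct mem_desc *mem);
	void gk20a_gmmu_unmap(struct vm_gk20a *vm, unsigned long long gpu_va,
			      size_t size, enum gk20a_mem_flag flag);
	void gk20a_gmmu_free_attr(struct gk20a *g, enum dma_attr attr,
				  struct mem_desc *mem);

	/* Allocation: one call replaces dma_alloc_attrs + sgtable + gmmu_map. */
	static int patch_buf_alloc(struct vm_gk20a *vm, struct mem_desc *mem)
	{
		return gk20a_gmmu_alloc_map_attr(vm, DMA_ATTR_NO_KERNEL_MAPPING,
						 128 * sizeof(unsigned int), mem);
	}

	/* Teardown: unmap if mapped, then hand the descriptor to the helper,
	 * which also clears the CPU-side fields (see the mm_gk20a.c hunk). */
	static void patch_buf_free(struct gk20a *g, struct vm_gk20a *vm,
				   struct mem_desc *mem)
	{
		if (mem->gpu_va)
			gk20a_gmmu_unmap(vm, mem->gpu_va, mem->size,
					 gk20a_mem_flag_none);
		gk20a_gmmu_free_attr(g, DMA_ATTR_NO_KERNEL_MAPPING, mem);
	}
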
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index fa84337b..bde8afae 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -1616,6 +1616,7 @@ void gk20a_gmmu_free_attr(struct gk20a *g, enum dma_attr attr,
 		}
 
 		mem->cpu_va = NULL;
+		mem->pages = NULL;
 	}
 
 	if (mem->sgt)
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
index 91659537..df9ebec3 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -68,11 +68,7 @@ struct gpfifo_desc {
 };
 
 struct patch_desc {
-	struct page **pages;
-	u64 iova;
-	size_t size;
-	void *cpu_va;
-	u64 gpu_va;
+	struct mem_desc mem;
 	u32 data_count;
 };
 
diff --git a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
index fd8bb81b..8d0bb6cf 100644
--- a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
+++ b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c
@@ -321,18 +321,20 @@ static int vgpu_gr_alloc_channel_patch_ctx(struct gk20a *g,
 
 	gk20a_dbg_fn("");
 
-	patch_ctx->size = 128 * sizeof(u32);
-	patch_ctx->gpu_va = gk20a_vm_alloc_va(ch_vm, patch_ctx->size, 0);
-	if (!patch_ctx->gpu_va)
+	patch_ctx->mem.size = 128 * sizeof(u32);
+	patch_ctx->mem.gpu_va = gk20a_vm_alloc_va(ch_vm,
+						  patch_ctx->mem.size, 0);
+	if (!patch_ctx->mem.gpu_va)
 		return -ENOMEM;
 
 	msg.cmd = TEGRA_VGPU_CMD_CHANNEL_ALLOC_GR_PATCH_CTX;
 	msg.handle = platform->virt_handle;
 	p->handle = c->virt_ctx;
-	p->patch_ctx_va = patch_ctx->gpu_va;
+	p->patch_ctx_va = patch_ctx->mem.gpu_va;
 	err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
 	if (err || msg.ret) {
-		gk20a_vm_free_va(ch_vm, patch_ctx->gpu_va, patch_ctx->size, 0);
+		gk20a_vm_free_va(ch_vm, patch_ctx->mem.gpu_va,
+				 patch_ctx->mem.size, 0);
 		err = -ENOMEM;
 	}
 
@@ -347,7 +349,7 @@ static void vgpu_gr_free_channel_patch_ctx(struct channel_gk20a *c)
 
 	gk20a_dbg_fn("");
 
-	if (patch_ctx->gpu_va) {
+	if (patch_ctx->mem.gpu_va) {
 		struct tegra_vgpu_cmd_msg msg;
 		struct tegra_vgpu_gr_ctx_params *p = &msg.params.gr_ctx;
 		int err;
@@ -358,8 +360,9 @@ static void vgpu_gr_free_channel_patch_ctx(struct channel_gk20a *c)
 		err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg));
 		WARN_ON(err || msg.ret);
 
-		gk20a_vm_free_va(ch_vm, patch_ctx->gpu_va, patch_ctx->size, 0);
-		patch_ctx->gpu_va = 0;
+		gk20a_vm_free_va(ch_vm, patch_ctx->mem.gpu_va,
+				 patch_ctx->mem.size, 0);
+		patch_ctx->mem.gpu_va = 0;
 	}
 }
 
@@ -438,7 +441,7 @@ static int vgpu_gr_alloc_obj_ctx(struct channel_gk20a *c,
 	}
 
 	/* allocate patch buffer */
-	if (ch_ctx->patch_ctx.pages == NULL) {
+	if (ch_ctx->patch_ctx.mem.pages == NULL) {
 		err = vgpu_gr_alloc_channel_patch_ctx(g, c);
 		if (err) {
 			gk20a_err(dev_from_gk20a(g),