10 files changed, 87 insertions, 81 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/cde_gk20a.c b/drivers/gpu/nvgpu/gk20a/cde_gk20a.c
index 084f1793..730ffe5c 100644
--- a/drivers/gpu/nvgpu/gk20a/cde_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/cde_gk20a.c
@@ -1230,7 +1230,7 @@ static int gk20a_cde_load(struct gk20a_cde_ctx *cde_ctx)
        }
        /* bind the channel to the vm */
-        err = __gk20a_vm_bind_channel(&g->mm.cde.vm, ch);
+        err = __gk20a_vm_bind_channel(g->mm.cde.vm, ch);
        if (err) {
                nvgpu_warn(g, "cde: could not bind vm");
                goto err_commit_va;
diff --git a/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c b/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c
index c905bedb..8e600c18 100644
--- a/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c
@@ -451,7 +451,7 @@ u32 gk20a_ce_create_context_with_cb(struct gk20a *g,
        ce_ctx->submitted_seq_number = 0;
        ce_ctx->completed_seq_number = 0;
-        ce_ctx->vm = &g->mm.ce.vm;
+        ce_ctx->vm = g->mm.ce.vm;
        /* always kernel client needs privileged channel */
        ce_ctx->ch = gk20a_open_new_channel_with_cb(g, gk20a_ce_finished_ctx_cb,
@@ -465,7 +465,7 @@ u32 gk20a_ce_create_context_with_cb(struct gk20a *g,
        ce_ctx->ch->wdt_enabled = false;
        /* bind the channel to the vm */
-        err = __gk20a_vm_bind_channel(&g->mm.ce.vm, ce_ctx->ch);
+        err = __gk20a_vm_bind_channel(g->mm.ce.vm, ce_ctx->ch);
        if (err) {
                nvgpu_err(g, "ce: could not bind vm");
                goto end;
diff --git a/drivers/gpu/nvgpu/gk20a/css_gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/css_gr_gk20a.c
index f5176e98..452bcd11 100644
--- a/drivers/gpu/nvgpu/gk20a/css_gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/css_gr_gk20a.c
@@ -146,7 +146,7 @@ static int css_hw_enable_snapshot(struct channel_gk20a *ch,
        if (snapshot_size < CSS_MIN_HW_SNAPSHOT_SIZE)
                snapshot_size = CSS_MIN_HW_SNAPSHOT_SIZE;
-        ret = nvgpu_dma_alloc_map_sys(&g->mm.pmu.vm, snapshot_size,
+        ret = nvgpu_dma_alloc_map_sys(g->mm.pmu.vm, snapshot_size,
                                                        &data->hw_memdesc);
        if (ret)
                return ret;
@@ -195,7 +195,7 @@ static int css_hw_enable_snapshot(struct channel_gk20a *ch,
 failed_allocation:
        if (data->hw_memdesc.size) {
-                nvgpu_dma_unmap_free(&g->mm.pmu.vm, &data->hw_memdesc);
+                nvgpu_dma_unmap_free(g->mm.pmu.vm, &data->hw_memdesc);
                memset(&data->hw_memdesc, 0, sizeof(data->hw_memdesc));
        }
        data->hw_snapshot = NULL;
@@ -223,7 +223,7 @@ static void css_hw_disable_snapshot(struct gr_gk20a *gr)
                        perf_pmasys_mem_block_valid_false_f() |
                        perf_pmasys_mem_block_target_f(0));
-        nvgpu_dma_unmap_free(&g->mm.pmu.vm, &data->hw_memdesc);
+        nvgpu_dma_unmap_free(g->mm.pmu.vm, &data->hw_memdesc);
        memset(&data->hw_memdesc, 0, sizeof(data->hw_memdesc));
        data->hw_snapshot = NULL;
diff --git a/drivers/gpu/nvgpu/gk20a/dbg_gpu_gk20a.c b/drivers/gpu/nvgpu/gk20a/dbg_gpu_gk20a.c
index 09268b6b..4bfa041e 100644
--- a/drivers/gpu/nvgpu/gk20a/dbg_gpu_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/dbg_gpu_gk20a.c
@@ -1838,7 +1838,6 @@ static int gk20a_perfbuf_map(struct dbg_session_gk20a *dbg_s,
 {
        struct gk20a *g = dbg_s->g;
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->perfbuf.vm;
        int err;
        u32 virt_size;
        u32 virt_addr_lo;
@@ -1853,23 +1852,23 @@ static int gk20a_perfbuf_map(struct dbg_session_gk20a *dbg_s,
                return -EBUSY;
        }
-        err = nvgpu_init_vm(mm, vm, big_page_size,
+        mm->perfbuf.vm = nvgpu_vm_init(g, big_page_size,
                        big_page_size << 10,
                        NV_MM_DEFAULT_KERNEL_SIZE,
                        NV_MM_DEFAULT_KERNEL_SIZE + NV_MM_DEFAULT_USER_SIZE,
                        false, false, "perfbuf");
-        if (err) {
+        if (!mm->perfbuf.vm) {
                nvgpu_mutex_release(&g->dbg_sessions_lock);
-                return err;
+                return -ENOMEM;
        }
        err = gk20a_alloc_inst_block(g, &mm->perfbuf.inst_block);
        if (err)
                goto err_remove_vm;
-        g->ops.mm.init_inst_block(&mm->perfbuf.inst_block, vm, 0);
+        g->ops.mm.init_inst_block(&mm->perfbuf.inst_block, mm->perfbuf.vm, 0);
-        err = nvgpu_vm_map_buffer(vm,
+        err = nvgpu_vm_map_buffer(mm->perfbuf.vm,
                        args->dmabuf_fd,
                        &args->offset,
                        0,
@@ -1922,9 +1921,10 @@ static int gk20a_perfbuf_map(struct dbg_session_gk20a *dbg_s,
        return 0;
 err_unmap:
-        nvgpu_vm_unmap_buffer(vm, args->offset, NULL);
+        nvgpu_vm_unmap_buffer(mm->perfbuf.vm, args->offset, NULL);
 err_remove_vm:
-        nvgpu_vm_remove_inst(vm, &mm->perfbuf.inst_block);
+        gk20a_free_inst_block(g, &mm->perfbuf.inst_block);
+        nvgpu_vm_put(mm->perfbuf.vm);
        nvgpu_mutex_release(&g->dbg_sessions_lock);
        return err;
 }
@@ -1956,13 +1956,14 @@ static int gk20a_perfbuf_disable_locked(struct gk20a *g)
 static int gk20a_perfbuf_release_locked(struct gk20a *g, u64 offset)
 {
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->perfbuf.vm;
+        struct vm_gk20a *vm = mm->perfbuf.vm;
        int err;
        err = gk20a_perfbuf_disable_locked(g);
        nvgpu_vm_unmap_buffer(vm, offset, NULL);
-        nvgpu_vm_remove_inst(vm, &mm->perfbuf.inst_block);
+        gk20a_free_inst_block(g, &mm->perfbuf.inst_block);
+        nvgpu_vm_put(vm);
        g->perfbuf.owner = NULL;
        g->perfbuf.offset = 0;
diff --git a/drivers/gpu/nvgpu/gk20a/fifo_gk20a.c b/drivers/gpu/nvgpu/gk20a/fifo_gk20a.c
index 63896228..7eb28f2f 100644
--- a/drivers/gpu/nvgpu/gk20a/fifo_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/fifo_gk20a.c
@@ -541,7 +541,7 @@ static void gk20a_remove_fifo_support(struct fifo_gk20a *f)
        nvgpu_vfree(g, f->channel);
        nvgpu_vfree(g, f->tsg);
        if (g->ops.mm.is_bar1_supported(g))
-                nvgpu_dma_unmap_free(&g->mm.bar1.vm, &f->userd);
+                nvgpu_dma_unmap_free(g->mm.bar1.vm, &f->userd);
        else
                nvgpu_dma_free(g, &f->userd);
@@ -923,7 +923,7 @@ static int gk20a_init_fifo_setup_sw(struct gk20a *g)
        nvgpu_mutex_init(&f->free_chs_mutex);
        if (g->ops.mm.is_bar1_supported(g))
-                err = nvgpu_dma_alloc_map_sys(&g->mm.bar1.vm,
+                err = nvgpu_dma_alloc_map_sys(g->mm.bar1.vm,
                                   f->userd_entry_size * f->num_channels,
                                   &f->userd);
@@ -963,7 +963,7 @@ static int gk20a_init_fifo_setup_sw(struct gk20a *g)
 clean_up:
        gk20a_dbg_fn("fail");
        if (g->ops.mm.is_bar1_supported(g))
-                nvgpu_dma_unmap_free(&g->mm.bar1.vm, &f->userd);
+                nvgpu_dma_unmap_free(g->mm.bar1.vm, &f->userd);
        else
                nvgpu_dma_free(g, &f->userd);
diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.c b/drivers/gpu/nvgpu/gk20a/gk20a.c
index 31b0a771..e4d454fe 100644
--- a/drivers/gpu/nvgpu/gk20a/gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gk20a.c
@@ -436,10 +436,10 @@ int gk20a_init_gpu_characteristics(struct gk20a *g)
        gpu->bus_type = NVGPU_GPU_BUS_TYPE_AXI; /* always AXI for now */
-        gpu->big_page_size = g->mm.pmu.vm.big_page_size;
        gpu->compression_page_size = g->ops.fb.compression_page_size(g);
+        gpu->big_page_size = platform->default_big_page_size;
        gpu->pde_coverage_bit_count =
-                gk20a_mm_pde_coverage_bit_count(&g->mm.pmu.vm);
+                g->ops.mm.get_mmu_levels(g, gpu->big_page_size)[0].lo_bit[0];
        if (g->mm.disable_bigpage) {
                gpu->big_page_size = 0;
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index f8e05818..b2ae77c3 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -2191,7 +2191,7 @@ static void gr_gk20a_start_falcon_ucode(struct gk20a *g)
 static int gr_gk20a_init_ctxsw_ucode_vaspace(struct gk20a *g)
 {
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        struct gk20a_ctxsw_ucode_info *ucode_info = &g->ctxsw_ucode_info;
        int err;
@@ -2265,7 +2265,7 @@ static int gr_gk20a_copy_ctxsw_ucode_segments(
 int gr_gk20a_init_ctxsw_ucode(struct gk20a *g)
 {
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        struct gk20a_ctxsw_bootloader_desc *fecs_boot_desc;
        struct gk20a_ctxsw_bootloader_desc *gpccs_boot_desc;
        struct nvgpu_firmware *fecs_fw;
@@ -5195,7 +5195,7 @@ static int gk20a_init_gr_bind_fecs_elpg(struct gk20a *g)
 {
        struct nvgpu_pmu *pmu = &g->pmu;
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        int err = 0;
        u32 size;
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index 87e6f30c..a1873a30 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -465,8 +465,7 @@ static void gk20a_remove_mm_ce_support(struct mm_gk20a *mm)
        mm->vidmem.ce_ctx_id = (u32)~0;
-        __nvgpu_vm_remove(&mm->ce.vm);
+        nvgpu_vm_put(mm->ce.vm);
 }
 static void gk20a_remove_mm_support(struct mm_gk20a *mm)
@@ -476,12 +475,15 @@ static void gk20a_remove_mm_support(struct mm_gk20a *mm)
        if (g->ops.mm.remove_bar2_vm)
                g->ops.mm.remove_bar2_vm(g);
-        if (g->ops.mm.is_bar1_supported(g))
+        if (g->ops.mm.is_bar1_supported(g)) {
-                nvgpu_vm_remove_inst(&mm->bar1.vm, &mm->bar1.inst_block);
+                gk20a_free_inst_block(g, &mm->bar1.inst_block);
+                nvgpu_vm_put(mm->bar1.vm);
+        }
-        nvgpu_vm_remove_inst(&mm->pmu.vm, &mm->pmu.inst_block);
+        gk20a_free_inst_block(g, &mm->pmu.inst_block);
-        gk20a_free_inst_block(gk20a_from_mm(mm), &mm->hwpm.inst_block);
+        gk20a_free_inst_block(g, &mm->hwpm.inst_block);
-        __nvgpu_vm_remove(&mm->cde.vm);
+        nvgpu_vm_put(mm->pmu.vm);
+        nvgpu_vm_put(mm->cde.vm);
        gk20a_semaphore_sea_destroy(g);
        gk20a_vidmem_destroy(g);
@@ -2641,30 +2643,31 @@ u64 gk20a_mm_inst_block_addr(struct gk20a *g, struct nvgpu_mem *inst_block)
 static int gk20a_init_bar1_vm(struct mm_gk20a *mm)
 {
        int err;
-        struct vm_gk20a *vm = &mm->bar1.vm;
        struct gk20a *g = gk20a_from_mm(mm);
        struct nvgpu_mem *inst_block = &mm->bar1.inst_block;
        u32 big_page_size = gk20a_get_platform(g->dev)->default_big_page_size;
        mm->bar1.aperture_size = bar1_aperture_size_mb_gk20a() << 20;
        gk20a_dbg_info("bar1 vm size = 0x%x", mm->bar1.aperture_size);
-        nvgpu_init_vm(mm, vm,
+        mm->bar1.vm = nvgpu_vm_init(g,
-                      big_page_size,
+                                    big_page_size,
-                      SZ_4K,                            /* Low hole */
+                                    SZ_4K, /* Low hole */
-                      mm->bar1.aperture_size - SZ_4K,   /* Kernel reserved. */
+                                    mm->bar1.aperture_size - SZ_4K, /* Kernel reserved. */
-                      mm->bar1.aperture_size,
+                                    mm->bar1.aperture_size,
-                      true, false,
+                                    true, false,
-                      "bar1");
+                                    "bar1");
+        if (!mm->bar1.vm)
+                return -ENOMEM;
        err = gk20a_alloc_inst_block(g, inst_block);
        if (err)
-                goto clean_up_va;
+                goto clean_up_vm;
-        g->ops.mm.init_inst_block(inst_block, vm, big_page_size);
+        g->ops.mm.init_inst_block(inst_block, mm->bar1.vm, big_page_size);
        return 0;
-clean_up_va:
+clean_up_vm:
-        nvgpu_deinit_vm(vm);
+        nvgpu_vm_put(mm->bar1.vm);
        return err;
 }
@@ -2672,7 +2675,6 @@ clean_up_va:
 static int gk20a_init_system_vm(struct mm_gk20a *mm)
 {
        int err;
-        struct vm_gk20a *vm = &mm->pmu.vm;
        struct gk20a *g = gk20a_from_mm(mm);
        struct nvgpu_mem *inst_block = &mm->pmu.inst_block;
        u32 big_page_size = gk20a_get_platform(g->dev)->default_big_page_size;
@@ -2687,65 +2689,70 @@ static int gk20a_init_system_vm(struct mm_gk20a *mm)
        mm->pmu.aperture_size = GK20A_PMU_VA_SIZE;
        gk20a_dbg_info("pmu vm size = 0x%x", mm->pmu.aperture_size);
-        nvgpu_init_vm(mm, vm, big_page_size,
+        mm->pmu.vm = nvgpu_vm_init(g, big_page_size,
-                      low_hole,
+                                   low_hole,
-                      aperture_size - low_hole,
+                                   aperture_size - low_hole,
-                      aperture_size,
+                                   aperture_size,
-                      true,
+                                   true,
-                      false,
+                                   false,
-                      "system");
+                                   "system");
+        if (!mm->pmu.vm)
+                return -ENOMEM;
        err = gk20a_alloc_inst_block(g, inst_block);
        if (err)
-                goto clean_up_va;
+                goto clean_up_vm;
-        g->ops.mm.init_inst_block(inst_block, vm, big_page_size);
+        g->ops.mm.init_inst_block(inst_block, mm->pmu.vm, big_page_size);
        return 0;
-clean_up_va:
+clean_up_vm:
-        nvgpu_deinit_vm(vm);
+        nvgpu_vm_put(mm->pmu.vm);
        return err;
 }
 static int gk20a_init_hwpm(struct mm_gk20a *mm)
 {
        int err;
-        struct vm_gk20a *vm = &mm->pmu.vm;
        struct gk20a *g = gk20a_from_mm(mm);
        struct nvgpu_mem *inst_block = &mm->hwpm.inst_block;
        err = gk20a_alloc_inst_block(g, inst_block);
        if (err)
                return err;
-        g->ops.mm.init_inst_block(inst_block, vm, 0);
+        g->ops.mm.init_inst_block(inst_block, mm->pmu.vm, 0);
        return 0;
 }
 static int gk20a_init_cde_vm(struct mm_gk20a *mm)
 {
-        struct vm_gk20a *vm = &mm->cde.vm;
        struct gk20a *g = gk20a_from_mm(mm);
        u32 big_page_size = gk20a_get_platform(g->dev)->default_big_page_size;
-        return nvgpu_init_vm(mm, vm, big_page_size,
+        mm->cde.vm = nvgpu_vm_init(g, big_page_size,
-                        big_page_size << 10,
+                                   big_page_size << 10,
-                        NV_MM_DEFAULT_KERNEL_SIZE,
+                                   NV_MM_DEFAULT_KERNEL_SIZE,
-                        NV_MM_DEFAULT_KERNEL_SIZE + NV_MM_DEFAULT_USER_SIZE,
+                                   NV_MM_DEFAULT_KERNEL_SIZE + NV_MM_DEFAULT_USER_SIZE,
-                        false, false, "cde");
+                                   false, false, "cde");
+        if (!mm->cde.vm)
+                return -ENOMEM;
+        return 0;
 }
 static int gk20a_init_ce_vm(struct mm_gk20a *mm)
 {
-        struct vm_gk20a *vm = &mm->ce.vm;
        struct gk20a *g = gk20a_from_mm(mm);
        u32 big_page_size = gk20a_get_platform(g->dev)->default_big_page_size;
-        return nvgpu_init_vm(mm, vm, big_page_size,
+        mm->ce.vm = nvgpu_vm_init(g, big_page_size,
-                        big_page_size << 10,
+                                  big_page_size << 10,
-                        NV_MM_DEFAULT_KERNEL_SIZE,
+                                  NV_MM_DEFAULT_KERNEL_SIZE,
-                        NV_MM_DEFAULT_KERNEL_SIZE + NV_MM_DEFAULT_USER_SIZE,
+                                  NV_MM_DEFAULT_KERNEL_SIZE + NV_MM_DEFAULT_USER_SIZE,
-                        false, false, "ce");
+                                  false, false, "ce");
+        if (!mm->ce.vm)
+                return -ENOMEM;
+        return 0;
 }
 void gk20a_mm_init_pdb(struct gk20a *g, struct nvgpu_mem *inst_block,
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
index 16c35d34..7e2ba051 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -78,8 +78,6 @@ struct pm_ctx_desc {
        u32 pm_mode;
 };
-struct gk20a;
 struct compbit_store_desc {
        struct nvgpu_mem mem;
@@ -191,19 +189,19 @@ struct mm_gk20a {
        struct {
                u32 aperture_size;
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
                struct nvgpu_mem inst_block;
        } bar1;
        struct {
                u32 aperture_size;
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
                struct nvgpu_mem inst_block;
        } bar2;
        struct {
                u32 aperture_size;
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
                struct nvgpu_mem inst_block;
        } pmu;
@@ -213,16 +211,16 @@ struct mm_gk20a {
        } hwpm;
        struct {
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
                struct nvgpu_mem inst_block;
        } perfbuf;
        struct {
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
        } cde;
        struct {
-                struct vm_gk20a vm;
+                struct vm_gk20a *vm;
        } ce;
        struct nvgpu_mutex l2_op_lock;
diff --git a/drivers/gpu/nvgpu/gk20a/pmu_gk20a.c b/drivers/gpu/nvgpu/gk20a/pmu_gk20a.c
index e74a5264..f296b57c 100644
--- a/drivers/gpu/nvgpu/gk20a/pmu_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/pmu_gk20a.c
@@ -3132,7 +3132,7 @@ static int gk20a_prepare_ucode(struct gk20a *g)
        struct nvgpu_pmu *pmu = &g->pmu;
        int err = 0;
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        if (pmu->fw)
                return gk20a_init_pmu(pmu);
@@ -3170,7 +3170,7 @@ static int gk20a_init_pmu_setup_sw(struct gk20a *g)
 {
        struct nvgpu_pmu *pmu = &g->pmu;
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        unsigned int i;
        int err = 0;
        u8 *ptr;
@@ -4793,7 +4793,7 @@ int gk20a_pmu_vidmem_surface_alloc(struct gk20a *g, struct nvgpu_mem *mem,
                u32 size)
 {
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        int err;
        err = nvgpu_dma_alloc_map_vid(vm, size, mem);
@@ -4809,7 +4809,7 @@ int gk20a_pmu_sysmem_surface_alloc(struct gk20a *g, struct nvgpu_mem *mem,
                u32 size)
 {
        struct mm_gk20a *mm = &g->mm;
-        struct vm_gk20a *vm = &mm->pmu.vm;
+        struct vm_gk20a *vm = mm->pmu.vm;
        int err;
        err = nvgpu_dma_alloc_map_sys(vm, size, mem);