path: root/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
author		Konsta Holtta <kholtta@nvidia.com>	2018-06-25 08:47:15 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2018-06-28 14:13:35 -0400
commit		dd146d42fc910128b0e2987d12b83430bf97bae0 (patch)
tree		23d3f808eb6ea65dd8ab90398a22ff52fce09736 /drivers/gpu/nvgpu/gk20a/gr_gk20a.c
parent		2dda362e6395a6d486ba3d1a75e707933690023e (diff)
gpu: nvgpu: don't mem_{begin,end}() for gr
Now that GR buffers always have a kernel mapping, remove the unnecessary
calls to nvgpu_mem_begin() and nvgpu_mem_end() on these buffers:

- global ctx buffer mem in gr
- gr ctx mem in a tsg
- patch ctx mem in a gr ctx
- pm ctx mem in a gr ctx
- ctx_header mem in a channel (subctx header)

Change-Id: Id2a8ad108aef8db8b16dce5bae8003bbcd3b23e4
Signed-off-by: Konsta Holtta <kholtta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1760599
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Alex Waterman <alexw@nvidia.com>
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
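For context, the accessors involved are the ones visible in the hunks below:
nvgpu_mem_begin() maps a buffer for CPU access (and can fail), nvgpu_mem_rd()
and nvgpu_mem_wr() access the buffer at a given offset, and nvgpu_mem_end()
drops the mapping. The following is a minimal before/after sketch of the
pattern being removed, modeled on gr_gk20a_get_ctx_id() from the first hunk;
the helper names here are illustrative only and not part of the patch.

/*
 * Illustrative sketch only; helper names are hypothetical. The real
 * change is shown verbatim in the diff below.
 */

/* Before: bracket each CPU access with a temporary kernel mapping. */
static int read_ctx_id_old(struct gk20a *g, struct nvgpu_mem *mem, u32 *ctx_id)
{
	if (nvgpu_mem_begin(g, mem))	/* map for CPU access; may fail */
		return -ENOMEM;

	*ctx_id = nvgpu_mem_rd(g, mem,
			ctxsw_prog_main_image_context_id_o());

	nvgpu_mem_end(g, mem);		/* drop the temporary mapping */
	return 0;
}

/*
 * After: the GR buffer keeps a permanent kernel mapping, so it is
 * accessed directly and the -ENOMEM/goto error paths disappear.
 */
static int read_ctx_id_new(struct gk20a *g, struct nvgpu_mem *mem, u32 *ctx_id)
{
	*ctx_id = nvgpu_mem_rd(g, mem,
			ctxsw_prog_main_image_context_id_o());
	return 0;
}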
Diffstat (limited to 'drivers/gpu/nvgpu/gk20a/gr_gk20a.c')
-rw-r--r--	drivers/gpu/nvgpu/gk20a/gr_gk20a.c	119
1 file changed, 4 insertions, 115 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 28ccb896..b218397a 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -111,15 +111,10 @@ int gr_gk20a_get_ctx_id(struct gk20a *g,
 	   Flush and invalidate before cpu update. */
 	g->ops.mm.l2_flush(g, true);
 
-	if (nvgpu_mem_begin(g, mem))
-		return -ENOMEM;
-
 	*ctx_id = nvgpu_mem_rd(g, mem,
 			ctxsw_prog_main_image_context_id_o());
 	nvgpu_log(g, gpu_dbg_fn | gpu_dbg_intr, "ctx_id: 0x%x", *ctx_id);
 
-	nvgpu_mem_end(g, mem);
-
 	return 0;
 }
 
@@ -696,12 +691,6 @@ int gr_gk20a_ctx_patch_write_begin(struct gk20a *g,
 			struct nvgpu_gr_ctx *gr_ctx,
 			bool update_patch_count)
 {
-	int err = 0;
-
-	err = nvgpu_mem_begin(g, &gr_ctx->patch_ctx.mem);
-	if (err)
-		return err;
-
 	if (update_patch_count) {
 		/* reset patch count if ucode has already processed it */
 		gr_ctx->patch_ctx.data_count = nvgpu_mem_rd(g,
@@ -717,8 +706,6 @@ void gr_gk20a_ctx_patch_write_end(struct gk20a *g,
 			struct nvgpu_gr_ctx *gr_ctx,
 			bool update_patch_count)
 {
-	nvgpu_mem_end(g, &gr_ctx->patch_ctx.mem);
-
 	/* Write context count to context image if it is mapped */
 	if (update_patch_count) {
 		nvgpu_mem_wr(g, &gr_ctx->mem,
@@ -832,31 +819,22 @@ static int gr_gk20a_ctx_zcull_setup(struct gk20a *g, struct channel_gk20a *c)
 	gr_ctx = &tsg->gr_ctx;
 	mem = &gr_ctx->mem;
 
-	if (nvgpu_mem_begin(g, mem))
-		return -ENOMEM;
-
-	if (nvgpu_mem_begin(g, ctxheader)) {
-		ret = -ENOMEM;
-		goto clean_up_mem;
-	}
-
 	if (gr_ctx->zcull_ctx.gpu_va == 0 &&
 	    gr_ctx->zcull_ctx.ctx_sw_mode ==
 		ctxsw_prog_main_image_zcull_mode_separate_buffer_v()) {
-		ret = -EINVAL;
-		goto clean_up;
+		return -EINVAL;
 	}
 
 	ret = gk20a_disable_channel_tsg(g, c);
 	if (ret) {
 		nvgpu_err(g, "failed to disable channel/TSG");
-		goto clean_up;
+		return ret;
 	}
 	ret = gk20a_fifo_preempt(g, c);
 	if (ret) {
 		gk20a_enable_channel_tsg(g, c);
 		nvgpu_err(g, "failed to preempt channel/TSG");
-		goto clean_up;
+		return ret;
 	}
 
 	nvgpu_mem_wr(g, mem,
@@ -871,11 +849,6 @@ static int gr_gk20a_ctx_zcull_setup(struct gk20a *g, struct channel_gk20a *c)
 
 	gk20a_enable_channel_tsg(g, c);
 
-clean_up:
-	nvgpu_mem_end(g, ctxheader);
-clean_up_mem:
-	nvgpu_mem_end(g, mem);
-
 	return ret;
 }
 
@@ -1597,12 +1570,6 @@ restore_fe_go_idle:
 			goto restore_fe_go_idle;
 	}
 
-	if (nvgpu_mem_begin(g, gold_mem))
-		goto clean_up;
-
-	if (nvgpu_mem_begin(g, gr_mem))
-		goto clean_up;
-
 	ctx_header_words = roundup(ctx_header_bytes, sizeof(u32));
 	ctx_header_words >>= 2;
 
@@ -1655,9 +1622,6 @@ clean_up:
 	else
 		nvgpu_log_fn(g, "done");
 
-	nvgpu_mem_end(g, gold_mem);
-	nvgpu_mem_end(g, gr_mem);
-
 	nvgpu_mutex_release(&gr->ctx_mutex);
 	return err;
 }
@@ -1701,11 +1665,6 @@ int gr_gk20a_update_smpc_ctxsw_mode(struct gk20a *g,
 	   Flush and invalidate before cpu update. */
 	g->ops.mm.l2_flush(g, true);
 
-	if (nvgpu_mem_begin(g, mem)) {
-		ret = -ENOMEM;
-		goto out;
-	}
-
 	data = nvgpu_mem_rd(g, mem,
 			ctxsw_prog_main_image_pm_o());
 
@@ -1717,7 +1676,6 @@ int gr_gk20a_update_smpc_ctxsw_mode(struct gk20a *g,
 	nvgpu_mem_wr(g, mem,
 		ctxsw_prog_main_image_pm_o(), data);
 
-	nvgpu_mem_end(g, mem);
 out:
 	gk20a_enable_channel_tsg(g, c);
 	return ret;
@@ -1807,24 +1765,7 @@ int gr_gk20a_update_hwpm_ctxsw_mode(struct gk20a *g,
 		}
 
 		/* Now clear the buffer */
-		if (nvgpu_mem_begin(g, &pm_ctx->mem)) {
-			ret = -ENOMEM;
-			goto cleanup_pm_buf;
-		}
-
 		nvgpu_memset(g, &pm_ctx->mem, 0, 0, pm_ctx->mem.size);
-
-		nvgpu_mem_end(g, &pm_ctx->mem);
-	}
-
-	if (nvgpu_mem_begin(g, gr_mem)) {
-		ret = -ENOMEM;
-		goto cleanup_pm_buf;
-	}
-
-	if (nvgpu_mem_begin(g, ctxheader)) {
-		ret = -ENOMEM;
-		goto clean_up_mem;
 	}
 
 	data = nvgpu_mem_rd(g, gr_mem, ctxsw_prog_main_image_pm_o());
@@ -1848,22 +1789,10 @@ int gr_gk20a_update_hwpm_ctxsw_mode(struct gk20a *g,
 	else
 		g->ops.gr.write_pm_ptr(g, gr_mem, virt_addr);
 
-	nvgpu_mem_end(g, ctxheader);
-	nvgpu_mem_end(g, gr_mem);
-
 	/* enable channel */
 	gk20a_enable_channel_tsg(g, c);
 
 	return 0;
-clean_up_mem:
-	nvgpu_mem_end(g, gr_mem);
-cleanup_pm_buf:
-	nvgpu_gmmu_unmap(c->vm, &pm_ctx->mem, pm_ctx->mem.gpu_va);
-	nvgpu_dma_free(g, &pm_ctx->mem);
-	memset(&pm_ctx->mem, 0, sizeof(struct nvgpu_mem));
-
-	gk20a_enable_channel_tsg(g, c);
-	return ret;
 }
 
 void gk20a_gr_init_ctxsw_hdr_data(struct gk20a *g,
@@ -1904,9 +1833,6 @@ int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
 	   Flush and invalidate before cpu update. */
 	g->ops.mm.l2_flush(g, true);
 
-	if (nvgpu_mem_begin(g, mem))
-		return -ENOMEM;
-
 	nvgpu_mem_wr_n(g, mem, 0,
 		gr->ctx_vars.local_golden_image,
 		gr->ctx_vars.golden_image_size);
@@ -1973,7 +1899,6 @@ int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
 		if (gr_ctx->pm_ctx.mem.gpu_va == 0) {
 			nvgpu_err(g,
 				"context switched pm with no pm buffer!");
-			nvgpu_mem_end(g, mem);
 			return -EFAULT;
 		}
 
@@ -1989,8 +1914,6 @@ int gr_gk20a_load_golden_ctx_image(struct gk20a *g,
 
 	g->ops.gr.write_pm_ptr(g, mem, virt_addr);
 
-	nvgpu_mem_end(g, mem);
-
 	return ret;
 }
 
@@ -4840,12 +4763,6 @@ static int gr_gk20a_init_access_map(struct gk20a *g)
 	u32 *whitelist = NULL;
 	int w, num_entries = 0;
 
-	if (nvgpu_mem_begin(g, mem)) {
-		nvgpu_err(g,
-			"failed to map priv access map memory");
-		return -ENOMEM;
-	}
-
 	nvgpu_memset(g, mem, 0, 0, PAGE_SIZE * nr_pages);
 
 	g->ops.gr.get_access_map(g, &whitelist, &num_entries);
@@ -4864,7 +4781,6 @@ static int gr_gk20a_init_access_map(struct gk20a *g)
 		nvgpu_mem_wr32(g, mem, map_byte / sizeof(u32), x);
 	}
 
-	nvgpu_mem_end(g, mem);
 	return 0;
 }
 
@@ -6758,22 +6674,12 @@ static int gr_gk20a_ctx_patch_smpc(struct gk20a *g,
 			ctxsw_prog_main_image_patch_count_o(),
 			gr_ctx->patch_ctx.data_count);
 		if (ctxheader->gpu_va) {
-			/*
-			 * Main context can be gr_ctx or pm_ctx.
-			 * CPU access for relevant ctx is taken
-			 * care of in the calling function
-			 * __gr_gk20a_exec_ctx_ops. Need to take
-			 * care of cpu access to ctxheader here.
-			 */
-			if (nvgpu_mem_begin(g, ctxheader))
-				return -ENOMEM;
 			nvgpu_mem_wr(g, ctxheader,
 				ctxsw_prog_main_image_patch_adr_lo_o(),
 				vaddr_lo);
 			nvgpu_mem_wr(g, ctxheader,
 				ctxsw_prog_main_image_patch_adr_hi_o(),
 				vaddr_hi);
-			nvgpu_mem_end(g, ctxheader);
 		} else {
 			nvgpu_mem_wr(g, mem,
 				ctxsw_prog_main_image_patch_adr_lo_o(),
@@ -8038,17 +7944,8 @@ int __gr_gk20a_exec_ctx_ops(struct channel_gk20a *ch,
 				ctx_ops[i].type == REGOP(TYPE_GR_CTX_QUAD),
 				ctx_ops[i].quad);
 			if (!err) {
-				if (!gr_ctx_ready) {
-					/* would have been a variant of
-					 * gr_gk20a_apply_instmem_overrides,
-					 * recoded in-place instead.
-					 */
-					if (nvgpu_mem_begin(g, &gr_ctx->mem)) {
-						err = -ENOMEM;
-						goto cleanup;
-					}
+				if (!gr_ctx_ready)
 					gr_ctx_ready = true;
-				}
 				current_mem = &gr_ctx->mem;
 			} else {
 				err = gr_gk20a_get_pm_ctx_buffer_offsets(g,
@@ -8072,10 +7969,6 @@ int __gr_gk20a_exec_ctx_ops(struct channel_gk20a *ch,
 					err = -EINVAL;
 					goto cleanup;
 				}
-				if (nvgpu_mem_begin(g, &gr_ctx->pm_ctx.mem)) {
-					err = -ENOMEM;
-					goto cleanup;
-				}
 				pm_ctx_ready = true;
 			}
 			current_mem = &gr_ctx->pm_ctx.mem;
@@ -8148,10 +8041,6 @@ int __gr_gk20a_exec_ctx_ops(struct channel_gk20a *ch,
 
 	if (gr_ctx->patch_ctx.mem.cpu_va)
 		gr_gk20a_ctx_patch_write_end(g, gr_ctx, gr_ctx_ready);
-	if (gr_ctx_ready)
-		nvgpu_mem_end(g, &gr_ctx->mem);
-	if (pm_ctx_ready)
-		nvgpu_mem_end(g, &gr_ctx->pm_ctx.mem);
 
 	return err;
 }