3 files changed, 24 insertions, 3 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.h b/drivers/gpu/nvgpu/gk20a/gk20a.h
index 80d85d65..d7fdffb0 100644
--- a/drivers/gpu/nvgpu/gk20a/gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/gk20a.h
@@ -172,6 +172,7 @@ struct gpu_ops {
                u32 (*get_num_pce)(struct gk20a *g);
        } ce2;
        struct {
+                u32 (*get_patch_slots)(struct gk20a *g);
                int (*init_fs_state)(struct gk20a *g);
                int (*init_preemption_state)(struct gk20a *g);
                void (*access_smpc_reg)(struct gk20a *g, u32 quad, u32 offset);
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 71fe44a3..3c3ddc80 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -714,7 +714,8 @@ void gr_gk20a_ctx_patch_write(struct gk20a *g,
        if (patch) {
                u32 patch_slot = ch_ctx->patch_ctx.data_count *
                                PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY;
-                if (patch_slot > (PATCH_CTX_SLOTS_MAX -
+                if (patch_slot > (PATCH_CTX_ENTRIES_FROM_SIZE(
+                                        ch_ctx->patch_ctx.mem.size) -
                                PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY)) {
                        nvgpu_err(g, "failed to access patch_slot %d",
                                patch_slot);
@@ -2813,17 +2814,29 @@ static void gr_gk20a_free_channel_gr_ctx(struct channel_gk20a *c)
        c->ch_ctx.gr_ctx = NULL;
 }
+/*
+ * Report the size of the per-channel patch context buffer as a count of
+ * patch entries. Always returns PATCH_CTX_SLOTS_PER_PAGE; the "g" argument
+ * is not used here.
+ *
+ * NOTE(review): presumably installed as the gpu_ops gr.get_patch_slots hook
+ * so that chips can override the size -- confirm against the HAL init code.
+ */
+u32 gr_gk20a_get_patch_slots(struct gk20a *g)
+{
+        return PATCH_CTX_SLOTS_PER_PAGE;
+}
 static int gr_gk20a_alloc_channel_patch_ctx(struct gk20a *g,
                                struct channel_gk20a *c)
 {
        struct patch_desc *patch_ctx = &c->ch_ctx.patch_ctx;
        struct vm_gk20a *ch_vm = c->vm;
+        u32 alloc_size;
        int err = 0;
        gk20a_dbg_fn("");
+        alloc_size = g->ops.gr.get_patch_slots(g) *
+                PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY;
+        nvgpu_log(g, gpu_dbg_info, "patch buffer size in entries: %d",
+                alloc_size);
        err = nvgpu_dma_alloc_map_flags_sys(ch_vm, NVGPU_DMA_NO_KERNEL_MAPPING,
-                        PATCH_CTX_SLOTS_MAX * sizeof(u32), &patch_ctx->mem);
+                        alloc_size * sizeof(u32), &patch_ctx->mem);
        if (err)
                return err;
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
index 0a685d01..db1a9514 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
@@ -52,8 +52,14 @@
 #define GK20A_TIMEOUT_FPGA              100000 /* 100 sec */
-#define PATCH_CTX_SLOTS_MAX                     128
+/*
+ * Allocate a minimum of one page of patch space. With 4KB pages this is
+ * 512 entries, each an address and data pair.
+ */
 #define PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY      2
+/*
+ * Number of patch entries that fit in one page. Despite the "SLOTS" in the
+ * name, the divisor is the byte size of a whole entry
+ * (PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY u32 slots), so this counts entries.
+ */
+#define PATCH_CTX_SLOTS_PER_PAGE \
+        (PAGE_SIZE/(PATCH_CTX_SLOTS_REQUIRED_PER_ENTRY * sizeof(u32)))
+/*
+ * Number of u32 slots in a patch buffer of "size" bytes. The argument is
+ * parenthesized so that a compound expression (e.g. "a + b") is divided as
+ * a whole rather than only its last operand.
+ */
+#define PATCH_CTX_ENTRIES_FROM_SIZE(size) ((size)/sizeof(u32))
 struct channel_gk20a;
 struct nvgpu_warpstate;
@@ -756,5 +762,6 @@ void gk20a_gr_get_ovr_perf_regs(struct gk20a *g, u32 *num_ovr_perf_regs,
                                               u32 **ovr_perf_regs);
 void gk20a_gr_init_ctxsw_hdr_data(struct gk20a *g,
                                        struct nvgpu_mem *mem);
+u32 gr_gk20a_get_patch_slots(struct gk20a *g);
 #endif /*__GR_GK20A_H__*/