7 files changed, 4 insertions, 355 deletions
diff --git a/drivers/gpu/nvgpu/common/linux/ioctl_as.c b/drivers/gpu/nvgpu/common/linux/ioctl_as.c
index 273024bd..6fd0a3d2 100644
--- a/drivers/gpu/nvgpu/common/linux/ioctl_as.c
+++ b/drivers/gpu/nvgpu/common/linux/ioctl_as.c
@@ -227,31 +227,6 @@ static int gk20a_as_ioctl_get_va_regions(
        return 0;
 }
-static int gk20a_as_ioctl_get_buffer_compbits_info(
-                struct gk20a_as_share *as_share,
-                struct nvgpu_as_get_buffer_compbits_info_args *args)
-{
-        gk20a_dbg_fn("");
-        return nvgpu_vm_get_compbits_info(as_share->vm,
-                                          args->mapping_gva,
-                                          &args->compbits_win_size,
-                                          &args->compbits_win_ctagline,
-                                          &args->mapping_ctagline,
-                                          &args->flags);
-}
-static int gk20a_as_ioctl_map_buffer_compbits(
-                struct gk20a_as_share *as_share,
-                struct nvgpu_as_map_buffer_compbits_args *args)
-{
-        gk20a_dbg_fn("");
-        return nvgpu_vm_map_compbits(as_share->vm,
-                                     args->mapping_gva,
-                                     &args->compbits_win_gva,
-                                     &args->mapping_iova,
-                                     args->flags);
-}
 int gk20a_as_dev_open(struct inode *inode, struct file *filp)
 {
        struct nvgpu_os_linux *l;
@@ -364,14 +339,6 @@ long gk20a_as_dev_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
                err = gk20a_as_ioctl_get_va_regions(as_share,
                                (struct nvgpu_as_get_va_regions_args *)buf);
                break;
-        case NVGPU_AS_IOCTL_GET_BUFFER_COMPBITS_INFO:
-                err = gk20a_as_ioctl_get_buffer_compbits_info(as_share,
-                                (struct nvgpu_as_get_buffer_compbits_info_args *)buf);
-                break;
-        case NVGPU_AS_IOCTL_MAP_BUFFER_COMPBITS:
-                err = gk20a_as_ioctl_map_buffer_compbits(as_share,
-                                (struct nvgpu_as_map_buffer_compbits_args *)buf);
-                break;
        case NVGPU_AS_IOCTL_MAP_BUFFER_BATCH:
                err = gk20a_as_ioctl_map_buffer_batch(as_share,
                                (struct nvgpu_as_map_buffer_batch_args *)buf);
diff --git a/drivers/gpu/nvgpu/common/linux/vm.c b/drivers/gpu/nvgpu/common/linux/vm.c
index c84f531d..0ace5abe 100644
--- a/drivers/gpu/nvgpu/common/linux/vm.c
+++ b/drivers/gpu/nvgpu/common/linux/vm.c
@@ -199,8 +199,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
        struct gk20a_comptags comptags;
        bool clear_ctags = false;
        struct scatterlist *sgl;
-        u64 ctag_map_win_size = 0;
-        u32 ctag_map_win_ctagline = 0;
        struct nvgpu_vm_area *vm_area = NULL;
        u32 ctag_offset;
        enum nvgpu_aperture aperture;
@@ -298,15 +296,10 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
                                     g->ops.fb.compression_page_size(g));
        if (bfr.ctag_lines && !comptags.lines) {
-                const bool user_mappable =
-                        !!(flags & NVGPU_AS_MAP_BUFFER_FLAGS_MAPPABLE_COMPBITS);
                /* allocate compression resources if needed */
                err = gk20a_alloc_comptags(g, dev, dmabuf,
                                           ctag_allocator,
-                                           bfr.ctag_lines, user_mappable,
+                                           bfr.ctag_lines);
-                                           &ctag_map_win_size,
-                                           &ctag_map_win_ctagline);
                if (err) {
                        /* ok to fall back here if we ran out */
                        /* TBD: we can partially alloc ctags as well... */
@@ -370,9 +363,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
        mapped_buffer->ctag_offset = bfr.ctag_offset;
        mapped_buffer->ctag_lines  = bfr.ctag_lines;
        mapped_buffer->ctag_allocated_lines = bfr.ctag_allocated_lines;
-        mapped_buffer->ctags_mappable = bfr.ctag_user_mappable;
-        mapped_buffer->ctag_map_win_size = ctag_map_win_size;
-        mapped_buffer->ctag_map_win_ctagline = ctag_map_win_ctagline;
        mapped_buffer->vm          = vm;
        mapped_buffer->flags       = flags;
        mapped_buffer->kind        = kind;
diff --git a/drivers/gpu/nvgpu/common/linux/vm_priv.h b/drivers/gpu/nvgpu/common/linux/vm_priv.h
index 14852264..4f6b10bb 100644
--- a/drivers/gpu/nvgpu/common/linux/vm_priv.h
+++ b/drivers/gpu/nvgpu/common/linux/vm_priv.h
@@ -49,12 +49,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
                 u64 mapping_size,
                 struct vm_gk20a_mapping_batch *mapping_batch);
-int nvgpu_vm_map_compbits(struct vm_gk20a *vm,
-                          u64 mapping_gva,
-                          u64 *compbits_win_gva,
-                          u64 *mapping_iova,
-                          u32 flags);
 /* Note: batch may be NULL if map op is not part of a batch */
 int nvgpu_vm_map_buffer(struct vm_gk20a *vm,
                        int dmabuf_fd,
@@ -86,8 +80,6 @@ int gk20a_alloc_comptags(struct gk20a *g,
                         struct device *dev,
                         struct dma_buf *dmabuf,
                         struct gk20a_comptag_allocator *allocator,
-                         u32 lines, bool user_mappable,
+                         u32 lines);
-                         u64 *ctag_map_win_size,
-                         u32 *ctag_map_win_ctagline);
 #endif
diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.c b/drivers/gpu/nvgpu/gk20a/gk20a.c
index 639ec4b5..0cd314d6 100644
--- a/drivers/gpu/nvgpu/gk20a/gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gk20a.c
@@ -444,7 +444,6 @@ int gk20a_init_gpu_characteristics(struct gk20a *g)
        gpu->flags |= NVGPU_GPU_FLAGS_SUPPORT_USERSPACE_MANAGED_AS;
        gpu->flags |= NVGPU_GPU_FLAGS_SUPPORT_TSG;
-        gpu->flags |= NVGPU_GPU_FLAGS_SUPPORT_MAP_COMPBITS;
        if (g->ops.clk_arb.get_arbiter_clk_domains)
                gpu->flags |= NVGPU_GPU_FLAGS_SUPPORT_CLOCK_CONTROLS;
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index 3030c170..2d69a2aa 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -296,19 +296,11 @@ int gk20a_alloc_comptags(struct gk20a *g,
                         struct device *dev,
                         struct dma_buf *dmabuf,
                         struct gk20a_comptag_allocator *allocator,
-                         u32 lines, bool user_mappable,
+                         u32 lines)
-                         u64 *ctag_map_win_size,
-                         u32 *ctag_map_win_ctagline)
 {
        struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
        u32 ctaglines_allocsize;
-        u32 ctagline_align;
        u32 offset;
-        u32 alignment_lines;
-        const u32 aggregate_cacheline_sz =
-                g->gr.cacheline_size * g->gr.slices_per_ltc *
-                g->ltc_count;
-        const u32 small_pgsz = 4096;
        int err;
        if (!priv)
@@ -317,42 +309,7 @@ int gk20a_alloc_comptags(struct gk20a *g,
        if (!lines)
                return -EINVAL;
-        if (!user_mappable) {
+        ctaglines_allocsize = lines;
-                ctaglines_allocsize = lines;
-                ctagline_align = 1;
-        } else {
-                /*
-                 * For security, align the allocation on a page, and reserve
-                 * whole pages. Unfortunately, we cannot ask the allocator to
-                 * align here, since compbits per cacheline is not always a
-                 * power of two. So, we just have to allocate enough extra that
-                 * we're guaranteed to find a ctagline inside the allocation so
-                 * that: 1) it is the first ctagline in a cacheline that starts
-                 * at a page boundary, and 2) we can add enough overallocation
-                 * that the ctaglines of the succeeding allocation are on
-                 * different page than ours.
-                 */
-                ctagline_align =
-                        (lcm(aggregate_cacheline_sz, small_pgsz) /
-                         aggregate_cacheline_sz) *
-                        g->gr.comptags_per_cacheline;
-                ctaglines_allocsize =
-                        /* for alignment */
-                        ctagline_align +
-                        /* lines rounded up to cachelines */
-                        DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline) *
-                        g->gr.comptags_per_cacheline +
-                        /* trail-padding */
-                        DIV_ROUND_UP(aggregate_cacheline_sz, small_pgsz) *
-                        g->gr.comptags_per_cacheline;
-                if (ctaglines_allocsize < lines)
-                        return -EINVAL; /* integer overflow */
-        }
        /* store the allocator so we can use it when we free the ctags */
        priv->comptag_allocator = allocator;
@@ -361,53 +318,9 @@ int gk20a_alloc_comptags(struct gk20a *g,
        if (err)
                return err;
-        /*
-         * offset needs to be at the start of a page/cacheline boundary;
-         * prune the preceding ctaglines that were allocated for alignment.
-         */
-        alignment_lines =
-                DIV_ROUND_UP(offset, ctagline_align) * ctagline_align - offset;
-        if (alignment_lines) {
-                gk20a_comptaglines_free(allocator, offset, alignment_lines);
-                offset += alignment_lines;
-                ctaglines_allocsize -= alignment_lines;
-        }
-        /*
-         * check if we can prune the trailing, too; we just need to reserve
-         * whole pages and ctagcachelines.
-         */
-        if (user_mappable) {
-                u32 needed_cachelines =
-                        DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline);
-                u32 needed_bytes = round_up(needed_cachelines *
-                                            aggregate_cacheline_sz,
-                                            small_pgsz);
-                u32 first_unneeded_cacheline =
-                        DIV_ROUND_UP(needed_bytes, aggregate_cacheline_sz);
-                u32 needed_ctaglines = first_unneeded_cacheline *
-                        g->gr.comptags_per_cacheline;
-                u64 win_size;
-                if (needed_ctaglines < ctaglines_allocsize) {
-                        gk20a_comptaglines_free(allocator,
-                                offset + needed_ctaglines,
-                                ctaglines_allocsize - needed_ctaglines);
-                        ctaglines_allocsize = needed_ctaglines;
-                }
-                *ctag_map_win_ctagline = offset;
-                win_size =
-                        DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline) *
-                        aggregate_cacheline_sz;
-                *ctag_map_win_size = round_up(win_size, small_pgsz);
-        }
        priv->comptags.offset = offset;
        priv->comptags.lines = lines;
        priv->comptags.allocated_lines = ctaglines_allocsize;
-        priv->comptags.user_mappable = user_mappable;
        return 0;
 }
@@ -1202,191 +1115,6 @@ int gk20a_vidbuf_access_memory(struct gk20a *g, struct dma_buf *dmabuf,
 #endif
 }
-int nvgpu_vm_get_compbits_info(struct vm_gk20a *vm,
-                               u64 mapping_gva,
-                               u64 *compbits_win_size,
-                               u32 *compbits_win_ctagline,
-                               u32 *mapping_ctagline,
-                               u32 *flags)
-{
-        struct nvgpu_mapped_buf *mapped_buffer;
-        struct gk20a *g = vm->mm->g;
-        nvgpu_mutex_acquire(&vm->update_gmmu_lock);
-        mapped_buffer = __nvgpu_vm_find_mapped_buf(vm, mapping_gva);
-        if (!mapped_buffer || !mapped_buffer->user_mapped)
-        {
-                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                nvgpu_err(g, "%s: bad offset 0x%llx", __func__, mapping_gva);
-                return -EFAULT;
-        }
-        *compbits_win_size = 0;
-        *compbits_win_ctagline = 0;
-        *mapping_ctagline = 0;
-        *flags = 0;
-        if (mapped_buffer->ctag_offset)
-                *flags |= NVGPU_AS_GET_BUFFER_COMPBITS_INFO_FLAGS_HAS_COMPBITS;
-        if (mapped_buffer->ctags_mappable)
-        {
-                *flags |= NVGPU_AS_GET_BUFFER_COMPBITS_INFO_FLAGS_MAPPABLE;
-                *compbits_win_size = mapped_buffer->ctag_map_win_size;
-                *compbits_win_ctagline = mapped_buffer->ctag_map_win_ctagline;
-                *mapping_ctagline = mapped_buffer->ctag_offset;
-        }
-        nvgpu_mutex_release(&vm->update_gmmu_lock);
-        return 0;
-}
-int nvgpu_vm_map_compbits(struct vm_gk20a *vm,
-                          u64 mapping_gva,
-                          u64 *compbits_win_gva,
-                          u64 *mapping_iova,
-                          u32 flags)
-{
-        struct nvgpu_mapped_buf *mapped_buffer;
-        struct gk20a *g = gk20a_from_vm(vm);
-        const bool fixed_mapping =
-                (flags & NVGPU_AS_MAP_BUFFER_COMPBITS_FLAGS_FIXED_OFFSET) != 0;
-        if (vm->userspace_managed && !fixed_mapping) {
-                nvgpu_err(g,
-                          "%s: non-fixed-offset mapping is not available on userspace managed address spaces",
-                          __func__);
-                return -EFAULT;
-        }
-        if (fixed_mapping && !vm->userspace_managed) {
-                nvgpu_err(g,
-                          "%s: fixed-offset mapping is available only on userspace managed address spaces",
-                          __func__);
-                return -EFAULT;
-        }
-        nvgpu_mutex_acquire(&vm->update_gmmu_lock);
-        mapped_buffer = __nvgpu_vm_find_mapped_buf(vm, mapping_gva);
-        if (!mapped_buffer || !mapped_buffer->user_mapped) {
-                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                nvgpu_err(g, "%s: bad offset 0x%llx", __func__, mapping_gva);
-                return -EFAULT;
-        }
-        if (!mapped_buffer->ctags_mappable) {
-                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                nvgpu_err(g, "%s: comptags not mappable, offset 0x%llx",
-                          __func__, mapping_gva);
-                return -EFAULT;
-        }
-        if (!mapped_buffer->ctag_map_win_addr) {
-                const u32 small_pgsz_index = 0; /* small pages, 4K */
-                const u32 aggregate_cacheline_sz =
-                        g->gr.cacheline_size * g->gr.slices_per_ltc *
-                        g->ltc_count;
-                /* first aggregate cacheline to map */
-                u32 cacheline_start; /* inclusive */
-                /* offset of the start cacheline (will be page aligned) */
-                u64 cacheline_offset_start;
-                if (!mapped_buffer->ctag_map_win_size) {
-                        nvgpu_mutex_release(&vm->update_gmmu_lock);
-                        nvgpu_err(g,
-                                  "%s: mapping 0x%llx does not have "
-                                  "mappable comptags",
-                                  __func__, mapping_gva);
-                        return -EFAULT;
-                }
-                cacheline_start = mapped_buffer->ctag_offset /
-                        g->gr.comptags_per_cacheline;
-                cacheline_offset_start =
-                        (u64)cacheline_start * aggregate_cacheline_sz;
-                if (fixed_mapping) {
-                        struct buffer_attrs bfr;
-                        int err;
-                        struct nvgpu_vm_area *vm_area = NULL;
-                        memset(&bfr, 0, sizeof(bfr));
-                        bfr.pgsz_idx = small_pgsz_index;
-                        err = nvgpu_vm_area_validate_buffer(
-                                vm, *compbits_win_gva, mapped_buffer->ctag_map_win_size,
-                                bfr.pgsz_idx, &vm_area);
-                        if (err) {
-                                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                                return err;
-                        }
-                        if (vm_area) {
-                                /* this would create a dangling GPU VA
-                                 * pointer if the space is freed
-                                 * before before the buffer is
-                                 * unmapped */
-                                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                                nvgpu_err(g,
-                                          "%s: comptags cannot be mapped into allocated space",
-                                          __func__);
-                                return -EINVAL;
-                        }
-                }
-                mapped_buffer->ctag_map_win_addr =
-                        g->ops.mm.gmmu_map(
-                                vm,
-                                !fixed_mapping ? 0 : *compbits_win_gva, /* va */
-                                g->gr.compbit_store.mem.priv.sgt,
-                                cacheline_offset_start, /* sg offset */
-                                mapped_buffer->ctag_map_win_size, /* size */
-                                small_pgsz_index,
-                                0, /* kind */
-                                0, /* ctag_offset */
-                                NVGPU_MAP_BUFFER_FLAGS_CACHEABLE_TRUE,
-                                gk20a_mem_flag_read_only,
-                                false, /* clear_ctags */
-                                false, /* sparse */
-                                false, /* priv */
-                                NULL,  /* mapping_batch handle */
-                                g->gr.compbit_store.mem.aperture);
-                if (!mapped_buffer->ctag_map_win_addr) {
-                        nvgpu_mutex_release(&vm->update_gmmu_lock);
-                        nvgpu_err(g,
-                                  "%s: failed to map comptags for mapping 0x%llx",
-                                  __func__, mapping_gva);
-                        return -ENOMEM;
-                }
-        } else if (fixed_mapping && *compbits_win_gva &&
-                   mapped_buffer->ctag_map_win_addr != *compbits_win_gva) {
-                nvgpu_mutex_release(&vm->update_gmmu_lock);
-                nvgpu_err(g,
-                          "%s: re-requesting comptags map into mismatching address. buffer offset 0x"
-                          "%llx, existing comptag map at 0x%llx, requested remap 0x%llx",
-                          __func__, mapping_gva,
-                          mapped_buffer->ctag_map_win_addr, *compbits_win_gva);
-                return -EINVAL;
-        }
-        *mapping_iova = nvgpu_mem_get_addr_sgl(g, mapped_buffer->sgt->sgl);
-        *compbits_win_gva = mapped_buffer->ctag_map_win_addr;
-        nvgpu_mutex_release(&vm->update_gmmu_lock);
-        return 0;
-}
 #if defined(CONFIG_GK20A_VIDMEM)
 static int gk20a_gmmu_clear_vidmem_mem(struct gk20a *g, struct nvgpu_mem *mem)
 {
@@ -1688,19 +1416,6 @@ void nvgpu_vm_unmap_locked(struct nvgpu_mapped_buf *mapped_buffer,
        struct vm_gk20a *vm = mapped_buffer->vm;
        struct gk20a *g = vm->mm->g;
-        if (mapped_buffer->ctag_map_win_addr) {
-                /* unmap compbits */
-                g->ops.mm.gmmu_unmap(vm,
-                                     mapped_buffer->ctag_map_win_addr,
-                                     mapped_buffer->ctag_map_win_size,
-                                     0,       /* page size 4k */
-                                     true,    /* va allocated */
-                                     gk20a_mem_flag_none,
-                                     false,   /* not sparse */
-                                     batch);  /* batch handle */
-        }
        g->ops.mm.gmmu_unmap(vm,
                mapped_buffer->addr,
                mapped_buffer->size,
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
index 82a4ee85..c77bebf8 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -389,13 +389,6 @@ struct sg_table *gk20a_mm_pin(struct device *dev, struct dma_buf *dmabuf);
 void gk20a_mm_unpin(struct device *dev, struct dma_buf *dmabuf,
                    struct sg_table *sgt);
-int nvgpu_vm_get_compbits_info(struct vm_gk20a *vm,
-                               u64 mapping_gva,
-                               u64 *compbits_win_size,
-                               u32 *compbits_win_ctagline,
-                               u32 *mapping_ctagline,
-                               u32 *flags);
 /* vm-as interface */
 struct nvgpu_as_alloc_space_args;
 struct nvgpu_as_free_space_args;
diff --git a/drivers/gpu/nvgpu/include/nvgpu/vm.h b/drivers/gpu/nvgpu/include/nvgpu/vm.h
index b5c64c99..604f4335 100644
--- a/drivers/gpu/nvgpu/include/nvgpu/vm.h
+++ b/drivers/gpu/nvgpu/include/nvgpu/vm.h
@@ -96,13 +96,6 @@ struct nvgpu_mapped_buf {
        u32 ctag_lines;
        u32 ctag_allocated_lines;
-        /* For comptag mapping, these are the mapping window parameters */
-        bool ctags_mappable;
-        u64 ctag_map_win_addr; /* non-zero if mapped */
-        u64 ctag_map_win_size; /* non-zero if ctags_mappable */
-        u32 ctag_map_win_ctagline; /* ctagline at win start, set if
-                                    * ctags_mappable */
        u32 flags;
        u32 kind;
        bool va_allocated;

diff --git a/drivers/gpu/nvgpu/common/linux/ioctl_as.c b/drivers/gpu/nvgpu/common/linux/ioctl_as.c index 273024bd..6fd0a3d2 100644 --- a/drivers/gpu/nvgpu/common/linux/ioctl_as.c +++ b/drivers/gpu/nvgpu/common/linux/ioctl_as.c
@@ -227,31 +227,6 @@ static int gk20a_as_ioctl_get_va_regions(
227	return 0;	227	return 0;
228	}	228	}
229		229
230	static int gk20a_as_ioctl_get_buffer_compbits_info(
231	struct gk20a_as_share *as_share,
232	struct nvgpu_as_get_buffer_compbits_info_args *args)
233	{
234	gk20a_dbg_fn("");
235	return nvgpu_vm_get_compbits_info(as_share->vm,
236	args->mapping_gva,
237	&args->compbits_win_size,
238	&args->compbits_win_ctagline,
239	&args->mapping_ctagline,
240	&args->flags);
241	}
242
243	static int gk20a_as_ioctl_map_buffer_compbits(
244	struct gk20a_as_share *as_share,
245	struct nvgpu_as_map_buffer_compbits_args *args)
246	{
247	gk20a_dbg_fn("");
248	return nvgpu_vm_map_compbits(as_share->vm,
249	args->mapping_gva,
250	&args->compbits_win_gva,
251	&args->mapping_iova,
252	args->flags);
253	}
254
255	int gk20a_as_dev_open(struct inode inode, struct file filp)	230	int gk20a_as_dev_open(struct inode inode, struct file filp)
256	{	231	{
257	struct nvgpu_os_linux *l;	232	struct nvgpu_os_linux *l;
@@ -364,14 +339,6 @@ long gk20a_as_dev_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
364	err = gk20a_as_ioctl_get_va_regions(as_share,	339	err = gk20a_as_ioctl_get_va_regions(as_share,
365	(struct nvgpu_as_get_va_regions_args *)buf);	340	(struct nvgpu_as_get_va_regions_args *)buf);
366	break;	341	break;
367	case NVGPU_AS_IOCTL_GET_BUFFER_COMPBITS_INFO:
368	err = gk20a_as_ioctl_get_buffer_compbits_info(as_share,
369	(struct nvgpu_as_get_buffer_compbits_info_args *)buf);
370	break;
371	case NVGPU_AS_IOCTL_MAP_BUFFER_COMPBITS:
372	err = gk20a_as_ioctl_map_buffer_compbits(as_share,
373	(struct nvgpu_as_map_buffer_compbits_args *)buf);
374	break;
375	case NVGPU_AS_IOCTL_MAP_BUFFER_BATCH:	342	case NVGPU_AS_IOCTL_MAP_BUFFER_BATCH:
376	err = gk20a_as_ioctl_map_buffer_batch(as_share,	343	err = gk20a_as_ioctl_map_buffer_batch(as_share,
377	(struct nvgpu_as_map_buffer_batch_args *)buf);	344	(struct nvgpu_as_map_buffer_batch_args *)buf);


diff --git a/drivers/gpu/nvgpu/common/linux/vm.c b/drivers/gpu/nvgpu/common/linux/vm.c index c84f531d..0ace5abe 100644 --- a/drivers/gpu/nvgpu/common/linux/vm.c +++ b/drivers/gpu/nvgpu/common/linux/vm.c
@@ -199,8 +199,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
199	struct gk20a_comptags comptags;	199	struct gk20a_comptags comptags;
200	bool clear_ctags = false;	200	bool clear_ctags = false;
201	struct scatterlist *sgl;	201	struct scatterlist *sgl;
202	u64 ctag_map_win_size = 0;
203	u32 ctag_map_win_ctagline = 0;
204	struct nvgpu_vm_area *vm_area = NULL;	202	struct nvgpu_vm_area *vm_area = NULL;
205	u32 ctag_offset;	203	u32 ctag_offset;
206	enum nvgpu_aperture aperture;	204	enum nvgpu_aperture aperture;
@@ -298,15 +296,10 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
298	g->ops.fb.compression_page_size(g));	296	g->ops.fb.compression_page_size(g));
299		297
300	if (bfr.ctag_lines && !comptags.lines) {	298	if (bfr.ctag_lines && !comptags.lines) {
301	const bool user_mappable =
302	!!(flags & NVGPU_AS_MAP_BUFFER_FLAGS_MAPPABLE_COMPBITS);
303
304	/* allocate compression resources if needed */	299	/* allocate compression resources if needed */
305	err = gk20a_alloc_comptags(g, dev, dmabuf,	300	err = gk20a_alloc_comptags(g, dev, dmabuf,
306	ctag_allocator,	301	ctag_allocator,
307	bfr.ctag_lines, user_mappable,	302	bfr.ctag_lines);
308	&ctag_map_win_size,
309	&ctag_map_win_ctagline);
310	if (err) {	303	if (err) {
311	/* ok to fall back here if we ran out */	304	/* ok to fall back here if we ran out */
312	/* TBD: we can partially alloc ctags as well... */	305	/* TBD: we can partially alloc ctags as well... */
@@ -370,9 +363,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
370	mapped_buffer->ctag_offset = bfr.ctag_offset;	363	mapped_buffer->ctag_offset = bfr.ctag_offset;
371	mapped_buffer->ctag_lines = bfr.ctag_lines;	364	mapped_buffer->ctag_lines = bfr.ctag_lines;
372	mapped_buffer->ctag_allocated_lines = bfr.ctag_allocated_lines;	365	mapped_buffer->ctag_allocated_lines = bfr.ctag_allocated_lines;
373	mapped_buffer->ctags_mappable = bfr.ctag_user_mappable;
374	mapped_buffer->ctag_map_win_size = ctag_map_win_size;
375	mapped_buffer->ctag_map_win_ctagline = ctag_map_win_ctagline;
376	mapped_buffer->vm = vm;	366	mapped_buffer->vm = vm;
377	mapped_buffer->flags = flags;	367	mapped_buffer->flags = flags;
378	mapped_buffer->kind = kind;	368	mapped_buffer->kind = kind;


diff --git a/drivers/gpu/nvgpu/common/linux/vm_priv.h b/drivers/gpu/nvgpu/common/linux/vm_priv.h index 14852264..4f6b10bb 100644 --- a/drivers/gpu/nvgpu/common/linux/vm_priv.h +++ b/drivers/gpu/nvgpu/common/linux/vm_priv.h
@@ -49,12 +49,6 @@ u64 nvgpu_vm_map(struct vm_gk20a *vm,
49	u64 mapping_size,	49	u64 mapping_size,
50	struct vm_gk20a_mapping_batch *mapping_batch);	50	struct vm_gk20a_mapping_batch *mapping_batch);
51		51
52	int nvgpu_vm_map_compbits(struct vm_gk20a *vm,
53	u64 mapping_gva,
54	u64 *compbits_win_gva,
55	u64 *mapping_iova,
56	u32 flags);
57
58	/* Note: batch may be NULL if map op is not part of a batch */	52	/* Note: batch may be NULL if map op is not part of a batch */
59	int nvgpu_vm_map_buffer(struct vm_gk20a *vm,	53	int nvgpu_vm_map_buffer(struct vm_gk20a *vm,
60	int dmabuf_fd,	54	int dmabuf_fd,
@@ -86,8 +80,6 @@ int gk20a_alloc_comptags(struct gk20a *g,
86	struct device *dev,	80	struct device *dev,
87	struct dma_buf *dmabuf,	81	struct dma_buf *dmabuf,
88	struct gk20a_comptag_allocator *allocator,	82	struct gk20a_comptag_allocator *allocator,
89	u32 lines, bool user_mappable,	83	u32 lines);
90	u64 *ctag_map_win_size,
91	u32 *ctag_map_win_ctagline);
92		84
93	#endif	85	#endif


diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.c b/drivers/gpu/nvgpu/gk20a/gk20a.c index 639ec4b5..0cd314d6 100644 --- a/drivers/gpu/nvgpu/gk20a/gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/gk20a.c
@@ -444,7 +444,6 @@ int gk20a_init_gpu_characteristics(struct gk20a *g)
444		444
445	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_USERSPACE_MANAGED_AS;	445	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_USERSPACE_MANAGED_AS;
446	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_TSG;	446	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_TSG;
447	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_MAP_COMPBITS;
448		447
449	if (g->ops.clk_arb.get_arbiter_clk_domains)	448	if (g->ops.clk_arb.get_arbiter_clk_domains)
450	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_CLOCK_CONTROLS;	449	gpu->flags \|= NVGPU_GPU_FLAGS_SUPPORT_CLOCK_CONTROLS;


diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c index 3030c170..2d69a2aa 100644 --- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -296,19 +296,11 @@ int gk20a_alloc_comptags(struct gk20a *g,
296	struct device *dev,	296	struct device *dev,
297	struct dma_buf *dmabuf,	297	struct dma_buf *dmabuf,
298	struct gk20a_comptag_allocator *allocator,	298	struct gk20a_comptag_allocator *allocator,
299	u32 lines, bool user_mappable,	299	u32 lines)
300	u64 *ctag_map_win_size,
301	u32 *ctag_map_win_ctagline)
302	{	300	{
303	struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);	301	struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
304	u32 ctaglines_allocsize;	302	u32 ctaglines_allocsize;
305	u32 ctagline_align;
306	u32 offset;	303	u32 offset;
307	u32 alignment_lines;
308	const u32 aggregate_cacheline_sz =
309	g->gr.cacheline_size * g->gr.slices_per_ltc *
310	g->ltc_count;
311	const u32 small_pgsz = 4096;
312	int err;	304	int err;
313		305
314	if (!priv)	306	if (!priv)
@@ -317,42 +309,7 @@ int gk20a_alloc_comptags(struct gk20a *g,
317	if (!lines)	309	if (!lines)
318	return -EINVAL;	310	return -EINVAL;
319		311
320	if (!user_mappable) {	312	ctaglines_allocsize = lines;
321	ctaglines_allocsize = lines;
322	ctagline_align = 1;
323	} else {
324	/*
325	* For security, align the allocation on a page, and reserve
326	* whole pages. Unfortunately, we cannot ask the allocator to
327	* align here, since compbits per cacheline is not always a
328	* power of two. So, we just have to allocate enough extra that
329	* we're guaranteed to find a ctagline inside the allocation so
330	* that: 1) it is the first ctagline in a cacheline that starts
331	* at a page boundary, and 2) we can add enough overallocation
332	* that the ctaglines of the succeeding allocation are on
333	* different page than ours.
334	*/
335
336	ctagline_align =
337	(lcm(aggregate_cacheline_sz, small_pgsz) /
338	aggregate_cacheline_sz) *
339	g->gr.comptags_per_cacheline;
340
341	ctaglines_allocsize =
342	/* for alignment */
343	ctagline_align +
344
345	/* lines rounded up to cachelines */
346	DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline) *
347	g->gr.comptags_per_cacheline +
348
349	/* trail-padding */
350	DIV_ROUND_UP(aggregate_cacheline_sz, small_pgsz) *
351	g->gr.comptags_per_cacheline;
352
353	if (ctaglines_allocsize < lines)
354	return -EINVAL; /* integer overflow */
355	}
356		313
357	/* store the allocator so we can use it when we free the ctags */	314	/* store the allocator so we can use it when we free the ctags */
358	priv->comptag_allocator = allocator;	315	priv->comptag_allocator = allocator;
@@ -361,53 +318,9 @@ int gk20a_alloc_comptags(struct gk20a *g,
361	if (err)	318	if (err)
362	return err;	319	return err;
363		320
364	/*
365	* offset needs to be at the start of a page/cacheline boundary;
366	* prune the preceding ctaglines that were allocated for alignment.
367	*/
368	alignment_lines =
369	DIV_ROUND_UP(offset, ctagline_align) * ctagline_align - offset;
370	if (alignment_lines) {
371	gk20a_comptaglines_free(allocator, offset, alignment_lines);
372	offset += alignment_lines;
373	ctaglines_allocsize -= alignment_lines;
374	}
375
376	/*
377	* check if we can prune the trailing, too; we just need to reserve
378	* whole pages and ctagcachelines.
379	*/
380	if (user_mappable) {
381	u32 needed_cachelines =
382	DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline);
383	u32 needed_bytes = round_up(needed_cachelines *
384	aggregate_cacheline_sz,
385	small_pgsz);
386	u32 first_unneeded_cacheline =
387	DIV_ROUND_UP(needed_bytes, aggregate_cacheline_sz);
388	u32 needed_ctaglines = first_unneeded_cacheline *
389	g->gr.comptags_per_cacheline;
390	u64 win_size;
391
392	if (needed_ctaglines < ctaglines_allocsize) {
393	gk20a_comptaglines_free(allocator,
394	offset + needed_ctaglines,
395	ctaglines_allocsize - needed_ctaglines);
396	ctaglines_allocsize = needed_ctaglines;
397	}
398
399	*ctag_map_win_ctagline = offset;
400	win_size =
401	DIV_ROUND_UP(lines, g->gr.comptags_per_cacheline) *
402	aggregate_cacheline_sz;
403
404	*ctag_map_win_size = round_up(win_size, small_pgsz);
405	}
406
407	priv->comptags.offset = offset;	321	priv->comptags.offset = offset;
408	priv->comptags.lines = lines;	322	priv->comptags.lines = lines;
409	priv->comptags.allocated_lines = ctaglines_allocsize;	323	priv->comptags.allocated_lines = ctaglines_allocsize;
410	priv->comptags.user_mappable = user_mappable;
411		324
412	return 0;	325	return 0;
413	}	326	}
@@ -1202,191 +1115,6 @@ int gk20a_vidbuf_access_memory(struct gk20a g, struct dma_buf dmabuf,
1202	#endif	1115	#endif
1203	}	1116	}
1204		1117
1205	int nvgpu_vm_get_compbits_info(struct vm_gk20a *vm,
1206	u64 mapping_gva,
1207	u64 *compbits_win_size,
1208	u32 *compbits_win_ctagline,
1209	u32 *mapping_ctagline,
1210	u32 *flags)
1211	{
1212	struct nvgpu_mapped_buf *mapped_buffer;
1213	struct gk20a *g = vm->mm->g;
1214
1215	nvgpu_mutex_acquire(&vm->update_gmmu_lock);
1216
1217	mapped_buffer = __nvgpu_vm_find_mapped_buf(vm, mapping_gva);
1218
1219	if (!mapped_buffer \|\| !mapped_buffer->user_mapped)
1220	{
1221	nvgpu_mutex_release(&vm->update_gmmu_lock);
1222	nvgpu_err(g, "%s: bad offset 0x%llx", __func__, mapping_gva);
1223	return -EFAULT;
1224	}
1225
1226	*compbits_win_size = 0;
1227	*compbits_win_ctagline = 0;
1228	*mapping_ctagline = 0;
1229	*flags = 0;
1230
1231	if (mapped_buffer->ctag_offset)
1232	*flags \|= NVGPU_AS_GET_BUFFER_COMPBITS_INFO_FLAGS_HAS_COMPBITS;
1233
1234	if (mapped_buffer->ctags_mappable)
1235	{
1236	*flags \|= NVGPU_AS_GET_BUFFER_COMPBITS_INFO_FLAGS_MAPPABLE;
1237	*compbits_win_size = mapped_buffer->ctag_map_win_size;
1238	*compbits_win_ctagline = mapped_buffer->ctag_map_win_ctagline;
1239	*mapping_ctagline = mapped_buffer->ctag_offset;
1240	}
1241
1242	nvgpu_mutex_release(&vm->update_gmmu_lock);
1243	return 0;
1244	}
1245
1246
1247	int nvgpu_vm_map_compbits(struct vm_gk20a *vm,
1248	u64 mapping_gva,
1249	u64 *compbits_win_gva,
1250	u64 *mapping_iova,
1251	u32 flags)
1252	{
1253	struct nvgpu_mapped_buf *mapped_buffer;
1254	struct gk20a *g = gk20a_from_vm(vm);
1255	const bool fixed_mapping =
1256	(flags & NVGPU_AS_MAP_BUFFER_COMPBITS_FLAGS_FIXED_OFFSET) != 0;
1257
1258	if (vm->userspace_managed && !fixed_mapping) {
1259	nvgpu_err(g,
1260	"%s: non-fixed-offset mapping is not available on userspace managed address spaces",
1261	__func__);
1262	return -EFAULT;
1263	}
1264
1265	if (fixed_mapping && !vm->userspace_managed) {
1266	nvgpu_err(g,
1267	"%s: fixed-offset mapping is available only on userspace managed address spaces",
1268	__func__);
1269	return -EFAULT;
1270	}
1271
1272	nvgpu_mutex_acquire(&vm->update_gmmu_lock);
1273
1274	mapped_buffer = __nvgpu_vm_find_mapped_buf(vm, mapping_gva);
1275
1276	if (!mapped_buffer \|\| !mapped_buffer->user_mapped) {
1277	nvgpu_mutex_release(&vm->update_gmmu_lock);
1278	nvgpu_err(g, "%s: bad offset 0x%llx", __func__, mapping_gva);
1279	return -EFAULT;
1280	}
1281
1282	if (!mapped_buffer->ctags_mappable) {
1283	nvgpu_mutex_release(&vm->update_gmmu_lock);
1284	nvgpu_err(g, "%s: comptags not mappable, offset 0x%llx",
1285	__func__, mapping_gva);
1286	return -EFAULT;
1287	}
1288
1289	if (!mapped_buffer->ctag_map_win_addr) {
1290	const u32 small_pgsz_index = 0; /* small pages, 4K */
1291	const u32 aggregate_cacheline_sz =
1292	g->gr.cacheline_size * g->gr.slices_per_ltc *
1293	g->ltc_count;
1294
1295	/* first aggregate cacheline to map */
1296	u32 cacheline_start; /* inclusive */
1297
1298	/* offset of the start cacheline (will be page aligned) */
1299	u64 cacheline_offset_start;
1300
1301	if (!mapped_buffer->ctag_map_win_size) {
1302	nvgpu_mutex_release(&vm->update_gmmu_lock);
1303	nvgpu_err(g,
1304	"%s: mapping 0x%llx does not have "
1305	"mappable comptags",
1306	__func__, mapping_gva);
1307	return -EFAULT;
1308	}
1309
1310	cacheline_start = mapped_buffer->ctag_offset /
1311	g->gr.comptags_per_cacheline;
1312	cacheline_offset_start =
1313	(u64)cacheline_start * aggregate_cacheline_sz;
1314
1315	if (fixed_mapping) {
1316	struct buffer_attrs bfr;
1317	int err;
1318	struct nvgpu_vm_area *vm_area = NULL;
1319
1320	memset(&bfr, 0, sizeof(bfr));
1321
1322	bfr.pgsz_idx = small_pgsz_index;
1323
1324	err = nvgpu_vm_area_validate_buffer(
1325	vm, *compbits_win_gva, mapped_buffer->ctag_map_win_size,
1326	bfr.pgsz_idx, &vm_area);
1327
1328	if (err) {
1329	nvgpu_mutex_release(&vm->update_gmmu_lock);
1330	return err;
1331	}
1332
1333	if (vm_area) {
1334	/* this would create a dangling GPU VA
1335	* pointer if the space is freed
1336	* before before the buffer is
1337	* unmapped */
1338	nvgpu_mutex_release(&vm->update_gmmu_lock);
1339	nvgpu_err(g,
1340	"%s: comptags cannot be mapped into allocated space",
1341	__func__);
1342	return -EINVAL;
1343	}
1344	}
1345
1346	mapped_buffer->ctag_map_win_addr =
1347	g->ops.mm.gmmu_map(
1348	vm,
1349	!fixed_mapping ? 0 : compbits_win_gva, / va */
1350	g->gr.compbit_store.mem.priv.sgt,
1351	cacheline_offset_start, /* sg offset */
1352	mapped_buffer->ctag_map_win_size, /* size */
1353	small_pgsz_index,
1354	0, /* kind */
1355	0, /* ctag_offset */
1356	NVGPU_MAP_BUFFER_FLAGS_CACHEABLE_TRUE,
1357	gk20a_mem_flag_read_only,
1358	false, /* clear_ctags */
1359	false, /* sparse */
1360	false, /* priv */
1361	NULL, /* mapping_batch handle */
1362	g->gr.compbit_store.mem.aperture);
1363
1364	if (!mapped_buffer->ctag_map_win_addr) {
1365	nvgpu_mutex_release(&vm->update_gmmu_lock);
1366	nvgpu_err(g,
1367	"%s: failed to map comptags for mapping 0x%llx",
1368	__func__, mapping_gva);
1369	return -ENOMEM;
1370	}
1371	} else if (fixed_mapping && *compbits_win_gva &&
1372	mapped_buffer->ctag_map_win_addr != *compbits_win_gva) {
1373	nvgpu_mutex_release(&vm->update_gmmu_lock);
1374	nvgpu_err(g,
1375	"%s: re-requesting comptags map into mismatching address. buffer offset 0x"
1376	"%llx, existing comptag map at 0x%llx, requested remap 0x%llx",
1377	__func__, mapping_gva,
1378	mapped_buffer->ctag_map_win_addr, *compbits_win_gva);
1379	return -EINVAL;
1380	}
1381
1382	*mapping_iova = nvgpu_mem_get_addr_sgl(g, mapped_buffer->sgt->sgl);
1383	*compbits_win_gva = mapped_buffer->ctag_map_win_addr;
1384
1385	nvgpu_mutex_release(&vm->update_gmmu_lock);
1386
1387	return 0;
1388	}
1389
1390	#if defined(CONFIG_GK20A_VIDMEM)	1118	#if defined(CONFIG_GK20A_VIDMEM)
1391	static int gk20a_gmmu_clear_vidmem_mem(struct gk20a g, struct nvgpu_mem mem)	1119	static int gk20a_gmmu_clear_vidmem_mem(struct gk20a g, struct nvgpu_mem mem)
1392	{	1120	{
@@ -1688,19 +1416,6 @@ void nvgpu_vm_unmap_locked(struct nvgpu_mapped_buf *mapped_buffer,
1688	struct vm_gk20a *vm = mapped_buffer->vm;	1416	struct vm_gk20a *vm = mapped_buffer->vm;
1689	struct gk20a *g = vm->mm->g;	1417	struct gk20a *g = vm->mm->g;
1690		1418
1691	if (mapped_buffer->ctag_map_win_addr) {
1692	/* unmap compbits */
1693
1694	g->ops.mm.gmmu_unmap(vm,
1695	mapped_buffer->ctag_map_win_addr,
1696	mapped_buffer->ctag_map_win_size,
1697	0, /* page size 4k */
1698	true, /* va allocated */
1699	gk20a_mem_flag_none,
1700	false, /* not sparse */
1701	batch); /* batch handle */
1702	}
1703
1704	g->ops.mm.gmmu_unmap(vm,	1419	g->ops.mm.gmmu_unmap(vm,
1705	mapped_buffer->addr,	1420	mapped_buffer->addr,
1706	mapped_buffer->size,	1421	mapped_buffer->size,


diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h index 82a4ee85..c77bebf8 100644 --- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h +++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -389,13 +389,6 @@ struct sg_table gk20a_mm_pin(struct device dev, struct dma_buf *dmabuf);
389	void gk20a_mm_unpin(struct device dev, struct dma_buf dmabuf,	389	void gk20a_mm_unpin(struct device dev, struct dma_buf dmabuf,
390	struct sg_table *sgt);	390	struct sg_table *sgt);
391		391
392	int nvgpu_vm_get_compbits_info(struct vm_gk20a *vm,
393	u64 mapping_gva,
394	u64 *compbits_win_size,
395	u32 *compbits_win_ctagline,
396	u32 *mapping_ctagline,
397	u32 *flags);
398
399	/* vm-as interface */	392	/* vm-as interface */
400	struct nvgpu_as_alloc_space_args;	393	struct nvgpu_as_alloc_space_args;
401	struct nvgpu_as_free_space_args;	394	struct nvgpu_as_free_space_args;


diff --git a/drivers/gpu/nvgpu/include/nvgpu/vm.h b/drivers/gpu/nvgpu/include/nvgpu/vm.h index b5c64c99..604f4335 100644 --- a/drivers/gpu/nvgpu/include/nvgpu/vm.h +++ b/drivers/gpu/nvgpu/include/nvgpu/vm.h
@@ -96,13 +96,6 @@ struct nvgpu_mapped_buf {
96	u32 ctag_lines;	96	u32 ctag_lines;
97	u32 ctag_allocated_lines;	97	u32 ctag_allocated_lines;
98		98
99	/* For comptag mapping, these are the mapping window parameters */
100	bool ctags_mappable;
101	u64 ctag_map_win_addr; /* non-zero if mapped */
102	u64 ctag_map_win_size; /* non-zero if ctags_mappable */
103	u32 ctag_map_win_ctagline; /* ctagline at win start, set if
104	* ctags_mappable */
105
106	u32 flags;	99	u32 flags;
107	u32 kind;	100	u32 kind;
108	bool va_allocated;	101	bool va_allocated;