gpu: nvgpu: Move dma_buf usage from mm_gk20a.c

Move most of the dma_buf usage present in the mm_gk20a.c code out to Linux specific code and some common/mm code. There are two primary groups of code: 1. dma_buf priv field code (for holding comptag data) 2. Comptag usage that relies on dma_buf pointers For (1) the dma_buf code was simply moved to common/linux/dmabuf.c since most of this code is clearly Linux specific. The comptag code was a bit more complicated since there are two parts to the comptag code. Firstly there's the code that manages the comptag memory. This is essentially a simple allocator. This was moved to common/mm/comptags.c since it can be shared across all chips. The second set of code is moved to common/linux/comptags.c since it is the interface between dma_bufs and the comptag memory. Two other fixes were done as well: - Add struct gk20a to the comptag allocator init so that the proper nvgpu_vzalloc() function could be used. - Add necessary includes to common/linux/vm_priv.h. JIRA NVGPU-30 JIRA NVGPU-138 Change-Id: I96c57f2763e5ebe18a2f2ee4b33e0e1a2597848c Signed-off-by: Alex Waterman <alexw@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/1566628 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
author: Alex Waterman <alexw@nvidia.com> 2017-09-07 18:27:55 -0400
committer: mobile promotions <svcmobile_promotions@nvidia.com> 2017-10-18 19:00:37 -0400
commit: b3446bc0b6fca6cb992667f80a95f8503b6a652a (patch)
tree: 9882c36bfaef83da9d0a6eefec5e8c3564b93cea /drivers/gpu/nvgpu/gk20a
parent: bee9c830c7898ceebf8c396b40598350229a7203 (diff)
4 files changed, 5 insertions, 358 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
index 57c1c0bc..700dcdf8 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -3044,36 +3044,6 @@ out:
        return err;
 }
-int gk20a_comptag_allocator_init(struct gk20a_comptag_allocator *allocator,
-                unsigned long size)
-{
-        nvgpu_mutex_init(&allocator->lock);
-        /*
-         * 0th comptag is special and is never used. The base for this bitmap
-         * is 1, and its size is one less than the size of comptag store.
-         */
-        size--;
-        allocator->bitmap = vzalloc(BITS_TO_LONGS(size) * sizeof(long));
-        if (!allocator->bitmap)
-                return -ENOMEM;
-        allocator->size = size;
-        return 0;
-}
-void gk20a_comptag_allocator_destroy(struct gk20a_comptag_allocator *allocator)
-{
-        struct gr_gk20a *gr = container_of(allocator,
-                                           struct gr_gk20a, comp_tags);
-        /*
-         * called only when exiting the driver (gk20a_remove, or unwinding the
-         * init stage); no users should be active, so taking the mutex is
-         * unnecessary here.
-         */
-        allocator->size = 0;
-        nvgpu_vfree(gr->g, allocator->bitmap);
-}
 static void gk20a_remove_gr_support(struct gr_gk20a *gr)
 {
        struct gk20a *g = gr->g;
@@ -3148,7 +3118,7 @@ static void gk20a_remove_gr_support(struct gr_gk20a *gr)
                nvgpu_big_free(g, gr->ctx_vars.hwpm_ctxsw_buffer_offset_map);
        gr->ctx_vars.hwpm_ctxsw_buffer_offset_map = NULL;
-        gk20a_comptag_allocator_destroy(&gr->comp_tags);
+        gk20a_comptag_allocator_destroy(g, &gr->comp_tags);
 }
 static int gr_gk20a_init_gr_config(struct gk20a *g, struct gr_gk20a *gr)
diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
index 5fab43ca..84eb8970 100644
--- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
@@ -36,6 +36,8 @@
 #include "gr_ctx_gk20a.h"
 #include "mm_gk20a.h"
+#include <nvgpu/comptags.h>
 #define GR_IDLE_CHECK_DEFAULT           10 /* usec */
 #define GR_IDLE_CHECK_MAX               200 /* usec */
 #define GR_FECS_POLL_INTERVAL           5 /* usec */
@@ -342,13 +344,7 @@ struct gr_gk20a {
        u32 max_comptag_mem; /* max memory size (MB) for comptag */
        struct compbit_store_desc compbit_store;
-        struct gk20a_comptag_allocator {
+        struct gk20a_comptag_allocator comp_tags;
-                struct nvgpu_mutex lock;
-                /* this bitmap starts at ctag 1. 0th cannot be taken */
-                unsigned long *bitmap;
-                /* size of bitmap, not max ctags, so one less */
-                unsigned long size;
-        } comp_tags;
        struct gr_zcull_gk20a zcull;
@@ -503,10 +499,6 @@ int gk20a_init_gr_support(struct gk20a *g);
 int gk20a_enable_gr_hw(struct gk20a *g);
 int gk20a_gr_reset(struct gk20a *g);
 void gk20a_gr_wait_initialized(struct gk20a *g);
-/* real size here, but first (ctag 0) isn't used */
-int gk20a_comptag_allocator_init(struct gk20a_comptag_allocator *allocator,
-                unsigned long size);
-void gk20a_comptag_allocator_destroy(struct gk20a_comptag_allocator *allocator);
 int gk20a_init_gr_channel(struct channel_gk20a *ch_gk20a);
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index 8936cd03..69d9e983 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -22,7 +22,6 @@
 * DEALINGS IN THE SOFTWARE.
 */
-#include <linux/scatterlist.h>
 #include <linux/dma-buf.h>
 #include <linux/dma-mapping.h>
 #include <linux/dma-attrs.h>
@@ -70,6 +69,7 @@
 * all the common APIs no longers have Linux stuff in them.
 */
 #include "common/linux/vm_priv.h"
+#include "common/linux/dmabuf.h"
 /*
 * GPU mapping life cycle
@@ -108,190 +108,6 @@ static int __must_check gk20a_init_hwpm(struct mm_gk20a *mm);
 static int __must_check gk20a_init_cde_vm(struct mm_gk20a *mm);
 static int __must_check gk20a_init_ce_vm(struct mm_gk20a *mm);
-struct gk20a_dmabuf_priv {
-        struct nvgpu_mutex lock;
-        struct gk20a *g;
-        struct gk20a_comptag_allocator *comptag_allocator;
-        struct gk20a_comptags comptags;
-        struct dma_buf_attachment *attach;
-        struct sg_table *sgt;
-        int pin_count;
-        struct nvgpu_list_node states;
-        u64 buffer_id;
-};
-static int gk20a_comptaglines_alloc(struct gk20a_comptag_allocator *allocator,
-                u32 *offset, u32 len)
-{
-        unsigned long addr;
-        int err = 0;
-        nvgpu_mutex_acquire(&allocator->lock);
-        addr = bitmap_find_next_zero_area(allocator->bitmap, allocator->size,
-                        0, len, 0);
-        if (addr < allocator->size) {
-                /* number zero is reserved; bitmap base is 1 */
-                *offset = 1 + addr;
-                bitmap_set(allocator->bitmap, addr, len);
-        } else {
-                err = -ENOMEM;
-        }
-        nvgpu_mutex_release(&allocator->lock);
-        return err;
-}
-static void gk20a_comptaglines_free(struct gk20a_comptag_allocator *allocator,
-                u32 offset, u32 len)
-{
-        /* number zero is reserved; bitmap base is 1 */
-        u32 addr = offset - 1;
-        WARN_ON(offset == 0);
-        WARN_ON(addr > allocator->size);
-        WARN_ON(addr + len > allocator->size);
-        nvgpu_mutex_acquire(&allocator->lock);
-        bitmap_clear(allocator->bitmap, addr, len);
-        nvgpu_mutex_release(&allocator->lock);
-}
-static void gk20a_mm_delete_priv(void *_priv)
-{
-        struct gk20a_buffer_state *s, *s_tmp;
-        struct gk20a_dmabuf_priv *priv = _priv;
-        struct gk20a *g;
-        if (!priv)
-                return;
-        g = priv->g;
-        if (priv->comptags.lines) {
-                BUG_ON(!priv->comptag_allocator);
-                gk20a_comptaglines_free(priv->comptag_allocator,
-                                priv->comptags.offset,
-                                priv->comptags.allocated_lines);
-        }
-        /* Free buffer states */
-        nvgpu_list_for_each_entry_safe(s, s_tmp, &priv->states,
-                                gk20a_buffer_state, list) {
-                gk20a_fence_put(s->fence);
-                nvgpu_list_del(&s->list);
-                nvgpu_kfree(g, s);
-        }
-        nvgpu_kfree(g, priv);
-}
-struct sg_table *gk20a_mm_pin(struct device *dev, struct dma_buf *dmabuf)
-{
-        struct gk20a_dmabuf_priv *priv;
-        priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (WARN_ON(!priv))
-                return ERR_PTR(-EINVAL);
-        nvgpu_mutex_acquire(&priv->lock);
-        if (priv->pin_count == 0) {
-                priv->attach = dma_buf_attach(dmabuf, dev);
-                if (IS_ERR(priv->attach)) {
-                        nvgpu_mutex_release(&priv->lock);
-                        return (struct sg_table *)priv->attach;
-                }
-                priv->sgt = dma_buf_map_attachment(priv->attach,
-                                                   DMA_BIDIRECTIONAL);
-                if (IS_ERR(priv->sgt)) {
-                        dma_buf_detach(dmabuf, priv->attach);
-                        nvgpu_mutex_release(&priv->lock);
-                        return priv->sgt;
-                }
-        }
-        priv->pin_count++;
-        nvgpu_mutex_release(&priv->lock);
-        return priv->sgt;
-}
-void gk20a_mm_unpin(struct device *dev, struct dma_buf *dmabuf,
-                    struct sg_table *sgt)
-{
-        struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
-        dma_addr_t dma_addr;
-        if (IS_ERR(priv) || !priv)
-                return;
-        nvgpu_mutex_acquire(&priv->lock);
-        WARN_ON(priv->sgt != sgt);
-        priv->pin_count--;
-        WARN_ON(priv->pin_count < 0);
-        dma_addr = sg_dma_address(priv->sgt->sgl);
-        if (priv->pin_count == 0) {
-                dma_buf_unmap_attachment(priv->attach, priv->sgt,
-                                         DMA_BIDIRECTIONAL);
-                dma_buf_detach(dmabuf, priv->attach);
-        }
-        nvgpu_mutex_release(&priv->lock);
-}
-void gk20a_get_comptags(struct device *dev, struct dma_buf *dmabuf,
-                        struct gk20a_comptags *comptags)
-{
-        struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (!comptags)
-                return;
-        if (!priv) {
-                memset(comptags, 0, sizeof(*comptags));
-                return;
-        }
-        *comptags = priv->comptags;
-}
-int gk20a_alloc_comptags(struct gk20a *g,
-                         struct device *dev,
-                         struct dma_buf *dmabuf,
-                         struct gk20a_comptag_allocator *allocator,
-                         u32 lines)
-{
-        struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
-        u32 ctaglines_allocsize;
-        u32 offset;
-        int err;
-        if (!priv)
-                return -ENOSYS;
-        if (!lines)
-                return -EINVAL;
-        ctaglines_allocsize = lines;
-        /* store the allocator so we can use it when we free the ctags */
-        priv->comptag_allocator = allocator;
-        err = gk20a_comptaglines_alloc(allocator, &offset,
-                               ctaglines_allocsize);
-        if (err)
-                return err;
-        priv->comptags.offset = offset;
-        priv->comptags.lines = lines;
-        priv->comptags.allocated_lines = ctaglines_allocsize;
-        return 0;
-}
 static int gk20a_init_mm_reset_enable_hw(struct gk20a *g)
 {
        gk20a_dbg_fn("");
@@ -1037,87 +853,6 @@ int gk20a_vm_bind_channel(struct gk20a_as_share *as_share,
        return __gk20a_vm_bind_channel(as_share->vm, ch);
 }
-int gk20a_dmabuf_alloc_drvdata(struct dma_buf *dmabuf, struct device *dev)
-{
-        struct gk20a *g = gk20a_get_platform(dev)->g;
-        struct gk20a_dmabuf_priv *priv;
-        static u64 priv_count = 0;
-        priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (likely(priv))
-                return 0;
-        nvgpu_mutex_acquire(&g->mm.priv_lock);
-        priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (priv)
-                goto priv_exist_or_err;
-        priv = nvgpu_kzalloc(g, sizeof(*priv));
-        if (!priv) {
-                priv = ERR_PTR(-ENOMEM);
-                goto priv_exist_or_err;
-        }
-        nvgpu_mutex_init(&priv->lock);
-        nvgpu_init_list_node(&priv->states);
-        priv->buffer_id = ++priv_count;
-        priv->g = g;
-        dma_buf_set_drvdata(dmabuf, dev, priv, gk20a_mm_delete_priv);
-priv_exist_or_err:
-        nvgpu_mutex_release(&g->mm.priv_lock);
-        if (IS_ERR(priv))
-                return -ENOMEM;
-        return 0;
-}
-int gk20a_dmabuf_get_state(struct dma_buf *dmabuf, struct gk20a *g,
-                           u64 offset, struct gk20a_buffer_state **state)
-{
-        int err = 0;
-        struct gk20a_dmabuf_priv *priv;
-        struct gk20a_buffer_state *s;
-        struct device *dev = dev_from_gk20a(g);
-        if (WARN_ON(offset >= (u64)dmabuf->size))
-                return -EINVAL;
-        err = gk20a_dmabuf_alloc_drvdata(dmabuf, dev);
-        if (err)
-                return err;
-        priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (WARN_ON(!priv))
-                return -ENOSYS;
-        nvgpu_mutex_acquire(&priv->lock);
-        nvgpu_list_for_each_entry(s, &priv->states, gk20a_buffer_state, list)
-                if (s->offset == offset)
-                        goto out;
-        /* State not found, create state. */
-        s = nvgpu_kzalloc(g, sizeof(*s));
-        if (!s) {
-                err = -ENOMEM;
-                goto out;
-        }
-        s->offset = offset;
-        nvgpu_init_list_node(&s->list);
-        nvgpu_mutex_init(&s->lock);
-        nvgpu_list_add_tail(&s->list, &priv->states);
-out:
-        nvgpu_mutex_release(&priv->lock);
-        if (!err)
-                *state = s;
-        return err;
-}
 int nvgpu_vm_map_buffer(struct vm_gk20a *vm,
                        int dmabuf_fd,
                        u64 *offset_align,
@@ -1613,34 +1348,3 @@ const struct gk20a_mmu_level *gk20a_mm_get_mmu_levels(struct gk20a *g,
        return (big_page_size == SZ_64K) ?
                 gk20a_mm_levels_64k : gk20a_mm_levels_128k;
 }
-int gk20a_mm_get_buffer_info(struct device *dev, int dmabuf_fd,
-                             u64 *buffer_id, u64 *buffer_len)
-{
-        struct dma_buf *dmabuf;
-        struct gk20a_dmabuf_priv *priv;
-        int err = 0;
-        dmabuf = dma_buf_get(dmabuf_fd);
-        if (IS_ERR(dmabuf)) {
-                dev_warn(dev, "%s: fd %d is not a dmabuf", __func__, dmabuf_fd);
-                return PTR_ERR(dmabuf);
-        }
-        err = gk20a_dmabuf_alloc_drvdata(dmabuf, dev);
-        if (err) {
-                dev_warn(dev, "Failed to allocate dmabuf drvdata (err = %d)",
-                         err);
-                goto clean_up;
-        }
-        priv = dma_buf_get_drvdata(dmabuf, dev);
-        if (likely(priv)) {
-                *buffer_id = priv->buffer_id;
-                *buffer_len = dmabuf->size;
-        }
-clean_up:
-        dma_buf_put(dmabuf);
-        return err;
-}
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
index 448496f5..04034d84 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -117,13 +117,6 @@ gk20a_buffer_state_from_list(struct nvgpu_list_node *node)
                ((uintptr_t)node - offsetof(struct gk20a_buffer_state, list));
 };
-struct gk20a_comptags {
-        u32 offset;
-        u32 lines;
-        u32 allocated_lines;
-        bool user_mappable;
-};
 struct priv_cmd_queue {
        struct nvgpu_mem mem;
        u32 size;       /* num of entries in words */
@@ -369,10 +362,6 @@ void gk20a_locked_gmmu_unmap(struct vm_gk20a *vm,
                             bool sparse,
                             struct vm_gk20a_mapping_batch *batch);
-struct sg_table *gk20a_mm_pin(struct device *dev, struct dma_buf *dmabuf);
-void gk20a_mm_unpin(struct device *dev, struct dma_buf *dmabuf,
-                    struct sg_table *sgt);
 /* vm-as interface */
 struct nvgpu_as_alloc_space_args;
 struct nvgpu_as_free_space_args;
@@ -381,14 +370,6 @@ int gk20a_vm_bind_channel(struct gk20a_as_share *as_share,
                          struct channel_gk20a *ch);
 int __gk20a_vm_bind_channel(struct vm_gk20a *vm, struct channel_gk20a *ch);
-void gk20a_get_comptags(struct device *dev, struct dma_buf *dmabuf,
-                        struct gk20a_comptags *comptags);
-int gk20a_dmabuf_alloc_drvdata(struct dma_buf *dmabuf, struct device *dev);
-int gk20a_dmabuf_get_state(struct dma_buf *dmabuf, struct gk20a *g,
-                           u64 offset, struct gk20a_buffer_state **state);
 void pde_range_from_vaddr_range(struct vm_gk20a *vm,
                                              u64 addr_lo, u64 addr_hi,
                                              u32 *pde_lo, u32 *pde_hi);
author	Alex Waterman <alexw@nvidia.com>	2017-09-07 18:27:55 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2017-10-18 19:00:37 -0400
commit	b3446bc0b6fca6cb992667f80a95f8503b6a652a (patch)
tree	9882c36bfaef83da9d0a6eefec5e8c3564b93cea /drivers/gpu/nvgpu/gk20a
parent	bee9c830c7898ceebf8c396b40598350229a7203 (diff)

diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c index 57c1c0bc..700dcdf8 100644 --- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.c
@@ -3044,36 +3044,6 @@ out:
3044	return err;	3044	return err;
3045	}	3045	}
3046		3046
3047	int gk20a_comptag_allocator_init(struct gk20a_comptag_allocator *allocator,
3048	unsigned long size)
3049	{
3050	nvgpu_mutex_init(&allocator->lock);
3051	/*
3052	* 0th comptag is special and is never used. The base for this bitmap
3053	* is 1, and its size is one less than the size of comptag store.
3054	*/
3055	size--;
3056	allocator->bitmap = vzalloc(BITS_TO_LONGS(size) * sizeof(long));
3057	if (!allocator->bitmap)
3058	return -ENOMEM;
3059	allocator->size = size;
3060	return 0;
3061	}
3062
3063	void gk20a_comptag_allocator_destroy(struct gk20a_comptag_allocator *allocator)
3064	{
3065	struct gr_gk20a *gr = container_of(allocator,
3066	struct gr_gk20a, comp_tags);
3067
3068	/*
3069	* called only when exiting the driver (gk20a_remove, or unwinding the
3070	* init stage); no users should be active, so taking the mutex is
3071	* unnecessary here.
3072	*/
3073	allocator->size = 0;
3074	nvgpu_vfree(gr->g, allocator->bitmap);
3075	}
3076
3077	static void gk20a_remove_gr_support(struct gr_gk20a *gr)	3047	static void gk20a_remove_gr_support(struct gr_gk20a *gr)
3078	{	3048	{
3079	struct gk20a *g = gr->g;	3049	struct gk20a *g = gr->g;
@@ -3148,7 +3118,7 @@ static void gk20a_remove_gr_support(struct gr_gk20a *gr)
3148	nvgpu_big_free(g, gr->ctx_vars.hwpm_ctxsw_buffer_offset_map);	3118	nvgpu_big_free(g, gr->ctx_vars.hwpm_ctxsw_buffer_offset_map);
3149	gr->ctx_vars.hwpm_ctxsw_buffer_offset_map = NULL;	3119	gr->ctx_vars.hwpm_ctxsw_buffer_offset_map = NULL;
3150		3120
3151	gk20a_comptag_allocator_destroy(&gr->comp_tags);	3121	gk20a_comptag_allocator_destroy(g, &gr->comp_tags);
3152	}	3122	}
3153		3123
3154	static int gr_gk20a_init_gr_config(struct gk20a *g, struct gr_gk20a *gr)	3124	static int gr_gk20a_init_gr_config(struct gk20a *g, struct gr_gk20a *gr)


diff --git a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h index 5fab43ca..84eb8970 100644 --- a/drivers/gpu/nvgpu/gk20a/gr_gk20a.h +++ b/drivers/gpu/nvgpu/gk20a/gr_gk20a.h
@@ -36,6 +36,8 @@
36	#include "gr_ctx_gk20a.h"	36	#include "gr_ctx_gk20a.h"
37	#include "mm_gk20a.h"	37	#include "mm_gk20a.h"
38		38
		39	#include <nvgpu/comptags.h>
		40
39	#define GR_IDLE_CHECK_DEFAULT 10 /* usec */	41	#define GR_IDLE_CHECK_DEFAULT 10 /* usec */
40	#define GR_IDLE_CHECK_MAX 200 /* usec */	42	#define GR_IDLE_CHECK_MAX 200 /* usec */
41	#define GR_FECS_POLL_INTERVAL 5 /* usec */	43	#define GR_FECS_POLL_INTERVAL 5 /* usec */
@@ -342,13 +344,7 @@ struct gr_gk20a {
342		344
343	u32 max_comptag_mem; /* max memory size (MB) for comptag */	345	u32 max_comptag_mem; /* max memory size (MB) for comptag */
344	struct compbit_store_desc compbit_store;	346	struct compbit_store_desc compbit_store;
345	struct gk20a_comptag_allocator {	347	struct gk20a_comptag_allocator comp_tags;
346	struct nvgpu_mutex lock;
347	/* this bitmap starts at ctag 1. 0th cannot be taken */
348	unsigned long *bitmap;
349	/* size of bitmap, not max ctags, so one less */
350	unsigned long size;
351	} comp_tags;
352		348
353	struct gr_zcull_gk20a zcull;	349	struct gr_zcull_gk20a zcull;
354		350
@@ -503,10 +499,6 @@ int gk20a_init_gr_support(struct gk20a *g);
503	int gk20a_enable_gr_hw(struct gk20a *g);	499	int gk20a_enable_gr_hw(struct gk20a *g);
504	int gk20a_gr_reset(struct gk20a *g);	500	int gk20a_gr_reset(struct gk20a *g);
505	void gk20a_gr_wait_initialized(struct gk20a *g);	501	void gk20a_gr_wait_initialized(struct gk20a *g);
506	/* real size here, but first (ctag 0) isn't used */
507	int gk20a_comptag_allocator_init(struct gk20a_comptag_allocator *allocator,
508	unsigned long size);
509	void gk20a_comptag_allocator_destroy(struct gk20a_comptag_allocator *allocator);
510		502
511	int gk20a_init_gr_channel(struct channel_gk20a *ch_gk20a);	503	int gk20a_init_gr_channel(struct channel_gk20a *ch_gk20a);
512		504


diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c index 8936cd03..69d9e983 100644 --- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -22,7 +22,6 @@
22	* DEALINGS IN THE SOFTWARE.	22	* DEALINGS IN THE SOFTWARE.
23	*/	23	*/
24		24
25	#include <linux/scatterlist.h>
26	#include <linux/dma-buf.h>	25	#include <linux/dma-buf.h>
27	#include <linux/dma-mapping.h>	26	#include <linux/dma-mapping.h>
28	#include <linux/dma-attrs.h>	27	#include <linux/dma-attrs.h>
@@ -70,6 +69,7 @@
70	* all the common APIs no longers have Linux stuff in them.	69	* all the common APIs no longers have Linux stuff in them.
71	*/	70	*/
72	#include "common/linux/vm_priv.h"	71	#include "common/linux/vm_priv.h"
		72	#include "common/linux/dmabuf.h"
73		73
74	/*	74	/*
75	* GPU mapping life cycle	75	* GPU mapping life cycle
@@ -108,190 +108,6 @@ static int __must_check gk20a_init_hwpm(struct mm_gk20a *mm);
108	static int __must_check gk20a_init_cde_vm(struct mm_gk20a *mm);	108	static int __must_check gk20a_init_cde_vm(struct mm_gk20a *mm);
109	static int __must_check gk20a_init_ce_vm(struct mm_gk20a *mm);	109	static int __must_check gk20a_init_ce_vm(struct mm_gk20a *mm);
110		110
111	struct gk20a_dmabuf_priv {
112	struct nvgpu_mutex lock;
113
114	struct gk20a *g;
115
116	struct gk20a_comptag_allocator *comptag_allocator;
117	struct gk20a_comptags comptags;
118
119	struct dma_buf_attachment *attach;
120	struct sg_table *sgt;
121
122	int pin_count;
123
124	struct nvgpu_list_node states;
125
126	u64 buffer_id;
127	};
128
129	static int gk20a_comptaglines_alloc(struct gk20a_comptag_allocator *allocator,
130	u32 *offset, u32 len)
131	{
132	unsigned long addr;
133	int err = 0;
134
135	nvgpu_mutex_acquire(&allocator->lock);
136	addr = bitmap_find_next_zero_area(allocator->bitmap, allocator->size,
137	0, len, 0);
138	if (addr < allocator->size) {
139	/* number zero is reserved; bitmap base is 1 */
140	*offset = 1 + addr;
141	bitmap_set(allocator->bitmap, addr, len);
142	} else {
143	err = -ENOMEM;
144	}
145	nvgpu_mutex_release(&allocator->lock);
146
147	return err;
148	}
149
150	static void gk20a_comptaglines_free(struct gk20a_comptag_allocator *allocator,
151	u32 offset, u32 len)
152	{
153	/* number zero is reserved; bitmap base is 1 */
154	u32 addr = offset - 1;
155	WARN_ON(offset == 0);
156	WARN_ON(addr > allocator->size);
157	WARN_ON(addr + len > allocator->size);
158
159	nvgpu_mutex_acquire(&allocator->lock);
160	bitmap_clear(allocator->bitmap, addr, len);
161	nvgpu_mutex_release(&allocator->lock);
162	}
163
164	static void gk20a_mm_delete_priv(void *_priv)
165	{
166	struct gk20a_buffer_state *s, *s_tmp;
167	struct gk20a_dmabuf_priv *priv = _priv;
168	struct gk20a *g;
169
170	if (!priv)
171	return;
172
173	g = priv->g;
174
175	if (priv->comptags.lines) {
176	BUG_ON(!priv->comptag_allocator);
177	gk20a_comptaglines_free(priv->comptag_allocator,
178	priv->comptags.offset,
179	priv->comptags.allocated_lines);
180	}
181
182	/* Free buffer states */
183	nvgpu_list_for_each_entry_safe(s, s_tmp, &priv->states,
184	gk20a_buffer_state, list) {
185	gk20a_fence_put(s->fence);
186	nvgpu_list_del(&s->list);
187	nvgpu_kfree(g, s);
188	}
189
190	nvgpu_kfree(g, priv);
191	}
192
193	struct sg_table *gk20a_mm_pin(struct device *dev, struct dma_buf *dmabuf)
194	{
195	struct gk20a_dmabuf_priv *priv;
196
197	priv = dma_buf_get_drvdata(dmabuf, dev);
198	if (WARN_ON(!priv))
199	return ERR_PTR(-EINVAL);
200
201	nvgpu_mutex_acquire(&priv->lock);
202
203	if (priv->pin_count == 0) {
204	priv->attach = dma_buf_attach(dmabuf, dev);
205	if (IS_ERR(priv->attach)) {
206	nvgpu_mutex_release(&priv->lock);
207	return (struct sg_table *)priv->attach;
208	}
209
210	priv->sgt = dma_buf_map_attachment(priv->attach,
211	DMA_BIDIRECTIONAL);
212	if (IS_ERR(priv->sgt)) {
213	dma_buf_detach(dmabuf, priv->attach);
214	nvgpu_mutex_release(&priv->lock);
215	return priv->sgt;
216	}
217	}
218
219	priv->pin_count++;
220	nvgpu_mutex_release(&priv->lock);
221	return priv->sgt;
222	}
223
224	void gk20a_mm_unpin(struct device *dev, struct dma_buf *dmabuf,
225	struct sg_table *sgt)
226	{
227	struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
228	dma_addr_t dma_addr;
229
230	if (IS_ERR(priv) || !priv)
231	return;
232
233	nvgpu_mutex_acquire(&priv->lock);
234	WARN_ON(priv->sgt != sgt);
235	priv->pin_count--;
236	WARN_ON(priv->pin_count < 0);
237	dma_addr = sg_dma_address(priv->sgt->sgl);
238	if (priv->pin_count == 0) {
239	dma_buf_unmap_attachment(priv->attach, priv->sgt,
240	DMA_BIDIRECTIONAL);
241	dma_buf_detach(dmabuf, priv->attach);
242	}
243	nvgpu_mutex_release(&priv->lock);
244	}
245
246	void gk20a_get_comptags(struct device *dev, struct dma_buf *dmabuf,
247	struct gk20a_comptags *comptags)
248	{
249	struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
250
251	if (!comptags)
252	return;
253
254	if (!priv) {
255	memset(comptags, 0, sizeof(*comptags));
256	return;
257	}
258
259	*comptags = priv->comptags;
260	}
261
262	int gk20a_alloc_comptags(struct gk20a *g,
263	struct device *dev,
264	struct dma_buf *dmabuf,
265	struct gk20a_comptag_allocator *allocator,
266	u32 lines)
267	{
268	struct gk20a_dmabuf_priv *priv = dma_buf_get_drvdata(dmabuf, dev);
269	u32 ctaglines_allocsize;
270	u32 offset;
271	int err;
272
273	if (!priv)
274	return -ENOSYS;
275
276	if (!lines)
277	return -EINVAL;
278
279	ctaglines_allocsize = lines;
280
281	/* store the allocator so we can use it when we free the ctags */
282	priv->comptag_allocator = allocator;
283	err = gk20a_comptaglines_alloc(allocator, &offset,
284	ctaglines_allocsize);
285	if (err)
286	return err;
287
288	priv->comptags.offset = offset;
289	priv->comptags.lines = lines;
290	priv->comptags.allocated_lines = ctaglines_allocsize;
291
292	return 0;
293	}
294
295	static int gk20a_init_mm_reset_enable_hw(struct gk20a *g)	111	static int gk20a_init_mm_reset_enable_hw(struct gk20a *g)
296	{	112	{
297	gk20a_dbg_fn("");	113	gk20a_dbg_fn("");
@@ -1037,87 +853,6 @@ int gk20a_vm_bind_channel(struct gk20a_as_share *as_share,
1037	return __gk20a_vm_bind_channel(as_share->vm, ch);	853	return __gk20a_vm_bind_channel(as_share->vm, ch);
1038	}	854	}
1039		855
1040	int gk20a_dmabuf_alloc_drvdata(struct dma_buf *dmabuf, struct device *dev)
1041	{
1042	struct gk20a *g = gk20a_get_platform(dev)->g;
1043	struct gk20a_dmabuf_priv *priv;
1044	static u64 priv_count = 0;
1045
1046	priv = dma_buf_get_drvdata(dmabuf, dev);
1047	if (likely(priv))
1048	return 0;
1049
1050	nvgpu_mutex_acquire(&g->mm.priv_lock);
1051	priv = dma_buf_get_drvdata(dmabuf, dev);
1052	if (priv)
1053	goto priv_exist_or_err;
1054
1055	priv = nvgpu_kzalloc(g, sizeof(*priv));
1056	if (!priv) {
1057	priv = ERR_PTR(-ENOMEM);
1058	goto priv_exist_or_err;
1059	}
1060
1061	nvgpu_mutex_init(&priv->lock);
1062	nvgpu_init_list_node(&priv->states);
1063	priv->buffer_id = ++priv_count;
1064	priv->g = g;
1065	dma_buf_set_drvdata(dmabuf, dev, priv, gk20a_mm_delete_priv);
1066
1067	priv_exist_or_err:
1068	nvgpu_mutex_release(&g->mm.priv_lock);
1069	if (IS_ERR(priv))
1070	return -ENOMEM;
1071
1072	return 0;
1073	}
1074
1075	int gk20a_dmabuf_get_state(struct dma_buf *dmabuf, struct gk20a *g,
1076	u64 offset, struct gk20a_buffer_state **state)
1077	{
1078	int err = 0;
1079	struct gk20a_dmabuf_priv *priv;
1080	struct gk20a_buffer_state *s;
1081	struct device *dev = dev_from_gk20a(g);
1082
1083	if (WARN_ON(offset >= (u64)dmabuf->size))
1084	return -EINVAL;
1085
1086	err = gk20a_dmabuf_alloc_drvdata(dmabuf, dev);
1087	if (err)
1088	return err;
1089
1090	priv = dma_buf_get_drvdata(dmabuf, dev);
1091	if (WARN_ON(!priv))
1092	return -ENOSYS;
1093
1094	nvgpu_mutex_acquire(&priv->lock);
1095
1096	nvgpu_list_for_each_entry(s, &priv->states, gk20a_buffer_state, list)
1097	if (s->offset == offset)
1098	goto out;
1099
1100	/* State not found, create state. */
1101	s = nvgpu_kzalloc(g, sizeof(*s));
1102	if (!s) {
1103	err = -ENOMEM;
1104	goto out;
1105	}
1106
1107	s->offset = offset;
1108	nvgpu_init_list_node(&s->list);
1109	nvgpu_mutex_init(&s->lock);
1110	nvgpu_list_add_tail(&s->list, &priv->states);
1111
1112	out:
1113	nvgpu_mutex_release(&priv->lock);
1114	if (!err)
1115	*state = s;
1116	return err;
1117
1118
1119	}
1120
1121	int nvgpu_vm_map_buffer(struct vm_gk20a *vm,	856	int nvgpu_vm_map_buffer(struct vm_gk20a *vm,
1122	int dmabuf_fd,	857	int dmabuf_fd,
1123	u64 *offset_align,	858	u64 *offset_align,
@@ -1613,34 +1348,3 @@ const struct gk20a_mmu_level *gk20a_mm_get_mmu_levels(struct gk20a *g,
1613	return (big_page_size == SZ_64K) ?	1348	return (big_page_size == SZ_64K) ?
1614	gk20a_mm_levels_64k : gk20a_mm_levels_128k;	1349	gk20a_mm_levels_64k : gk20a_mm_levels_128k;
1615	}	1350	}
1616
1617	int gk20a_mm_get_buffer_info(struct device *dev, int dmabuf_fd,
1618	u64 *buffer_id, u64 *buffer_len)
1619	{
1620	struct dma_buf *dmabuf;
1621	struct gk20a_dmabuf_priv *priv;
1622	int err = 0;
1623
1624	dmabuf = dma_buf_get(dmabuf_fd);
1625	if (IS_ERR(dmabuf)) {
1626	dev_warn(dev, "%s: fd %d is not a dmabuf", __func__, dmabuf_fd);
1627	return PTR_ERR(dmabuf);
1628	}
1629
1630	err = gk20a_dmabuf_alloc_drvdata(dmabuf, dev);
1631	if (err) {
1632	dev_warn(dev, "Failed to allocate dmabuf drvdata (err = %d)",
1633	err);
1634	goto clean_up;
1635	}
1636
1637	priv = dma_buf_get_drvdata(dmabuf, dev);
1638	if (likely(priv)) {
1639	*buffer_id = priv->buffer_id;
1640	*buffer_len = dmabuf->size;
1641	}
1642
1643	clean_up:
1644	dma_buf_put(dmabuf);
1645	return err;
1646	}


diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h index 448496f5..04034d84 100644 --- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h +++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h
@@ -117,13 +117,6 @@ gk20a_buffer_state_from_list(struct nvgpu_list_node *node)
117	((uintptr_t)node - offsetof(struct gk20a_buffer_state, list));	117	((uintptr_t)node - offsetof(struct gk20a_buffer_state, list));
118	};	118	};
119		119
120	struct gk20a_comptags {
121	u32 offset;
122	u32 lines;
123	u32 allocated_lines;
124	bool user_mappable;
125	};
126
127	struct priv_cmd_queue {	120	struct priv_cmd_queue {
128	struct nvgpu_mem mem;	121	struct nvgpu_mem mem;
129	u32 size; /* num of entries in words */	122	u32 size; /* num of entries in words */
@@ -369,10 +362,6 @@ void gk20a_locked_gmmu_unmap(struct vm_gk20a *vm,
369	bool sparse,	362	bool sparse,
370	struct vm_gk20a_mapping_batch *batch);	363	struct vm_gk20a_mapping_batch *batch);
371		364
372	struct sg_table *gk20a_mm_pin(struct device *dev, struct dma_buf *dmabuf);
373	void gk20a_mm_unpin(struct device *dev, struct dma_buf *dmabuf,
374	struct sg_table *sgt);
375
376	/* vm-as interface */	365	/* vm-as interface */
377	struct nvgpu_as_alloc_space_args;	366	struct nvgpu_as_alloc_space_args;
378	struct nvgpu_as_free_space_args;	367	struct nvgpu_as_free_space_args;
@@ -381,14 +370,6 @@ int gk20a_vm_bind_channel(struct gk20a_as_share *as_share,
381	struct channel_gk20a *ch);	370	struct channel_gk20a *ch);
382	int __gk20a_vm_bind_channel(struct vm_gk20a *vm, struct channel_gk20a *ch);	371	int __gk20a_vm_bind_channel(struct vm_gk20a *vm, struct channel_gk20a *ch);
383		372
384	void gk20a_get_comptags(struct device *dev, struct dma_buf *dmabuf,
385	struct gk20a_comptags *comptags);
386
387	int gk20a_dmabuf_alloc_drvdata(struct dma_buf *dmabuf, struct device *dev);
388
389	int gk20a_dmabuf_get_state(struct dma_buf *dmabuf, struct gk20a *g,
390	u64 offset, struct gk20a_buffer_state **state);
391
392	void pde_range_from_vaddr_range(struct vm_gk20a *vm,	373	void pde_range_from_vaddr_range(struct vm_gk20a *vm,
393	u64 addr_lo, u64 addr_hi,	374	u64 addr_lo, u64 addr_hi,
394	u32 *pde_lo, u32 *pde_hi);	375	u32 *pde_lo, u32 *pde_hi);