path: root/drivers/gpu/nvgpu/common
author     Debarshi Dutta <ddutta@nvidia.com>                    2018-09-04 08:09:36 -0400
committer  mobile promotions <svcmobile_promotions@nvidia.com>   2018-09-18 02:39:24 -0400
commit     2517d59be282426eec7a97745b76d745ff36c388
tree       faf915b5cfffb781918d674ec7d769feb7e98ac8   /drivers/gpu/nvgpu/common
parent     8381eeea4f9b4717854387068ddf9244973e7d0d
gpu: nvgpu: move channel_sync_gk20a.* to common directory
1) Move channel_sync_gk20a.* from the gk20a/ to the common/ directory as
   these files do not program any hardware registers. Also, as an add-on,
   rename channel_sync_gk20a.* to channel_sync.* and update the headers in
   the required files.

2) Rename struct gk20a_channel_sync to struct nvgpu_channel_sync. The
   corresponding syncpt and semaphore versions of the struct, along with
   the related methods, are renamed by removing "gk20a" from their names
   and adding "nvgpu".

3) Add MISRA-C cleanups.

Jira NVGPU-1086

Change-Id: I4e0e21803ca3858dd7a5fc4d2454dba1f1bfcecd
Signed-off-by: Debarshi Dutta <ddutta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1812594
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
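For orientation, the rename boils down to swapping the gk20a-prefixed header
and symbols for their nvgpu counterparts. The sketch below is illustrative
only and not part of the commit: the helper names example_bind_sync and
example_unbind_sync are made up, and locking and error paths are trimmed;
the real call sites are in the channel.c and submit.c hunks that follow.

/*
 * Illustrative sketch only: how a caller of the channel sync API reads
 * after this commit. The old calls are shown in comments.
 */
#include <nvgpu/channel_sync.h>	/* was: #include "gk20a/channel_sync_gk20a.h" */

static int example_bind_sync(struct channel_gk20a *c)
{
	/* was: c->sync = gk20a_channel_sync_create(c, false); */
	c->sync = nvgpu_channel_sync_create(c, false);
	return (c->sync == NULL) ? -ENOMEM : 0;
}

static void example_unbind_sync(struct channel_gk20a *c)
{
	if (c->sync != NULL) {
		/* was: gk20a_channel_sync_destroy(c->sync, false); */
		nvgpu_channel_sync_destroy(c->sync, false);
		c->sync = NULL;
	}
}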
Diffstat (limited to 'drivers/gpu/nvgpu/common')
-rw-r--r--   drivers/gpu/nvgpu/common/fifo/channel.c        14
-rw-r--r--   drivers/gpu/nvgpu/common/fifo/submit.c          6
-rw-r--r--   drivers/gpu/nvgpu/common/sync/channel_sync.c   670
3 files changed, 680 insertions, 10 deletions
diff --git a/drivers/gpu/nvgpu/common/fifo/channel.c b/drivers/gpu/nvgpu/common/fifo/channel.c
index 45f5b736..1613f5f6 100644
--- a/drivers/gpu/nvgpu/common/fifo/channel.c
+++ b/drivers/gpu/nvgpu/common/fifo/channel.c
@@ -44,11 +44,11 @@
 #include <nvgpu/log2.h>
 #include <nvgpu/ptimer.h>
 #include <nvgpu/channel.h>
+#include <nvgpu/channel_sync.h>
 
 #include "gk20a/gk20a.h"
 #include "gk20a/dbg_gpu_gk20a.h"
 #include "gk20a/fence_gk20a.h"
-#include "gk20a/channel_sync_gk20a.h"
 
 static void free_channel(struct fifo_gk20a *f, struct channel_gk20a *c);
 static void gk20a_channel_dump_ref_actions(struct channel_gk20a *c);
@@ -416,7 +416,7 @@ static void gk20a_free_channel(struct channel_gk20a *ch, bool force)
 	/* sync must be destroyed before releasing channel vm */
 	nvgpu_mutex_acquire(&ch->sync_lock);
 	if (ch->sync) {
-		gk20a_channel_sync_destroy(ch->sync, false);
+		nvgpu_channel_sync_destroy(ch->sync, false);
 		ch->sync = NULL;
 	}
 	if (ch->user_sync) {
@@ -425,9 +425,9 @@ static void gk20a_free_channel(struct channel_gk20a *ch, bool force)
 		 * But it's already done if channel has timedout
 		 */
 		if (ch->has_timedout) {
-			gk20a_channel_sync_destroy(ch->user_sync, false);
+			nvgpu_channel_sync_destroy(ch->user_sync, false);
 		} else {
-			gk20a_channel_sync_destroy(ch->user_sync, true);
+			nvgpu_channel_sync_destroy(ch->user_sync, true);
 		}
 		ch->user_sync = NULL;
 	}
@@ -1191,7 +1191,7 @@ int gk20a_channel_alloc_gpfifo(struct channel_gk20a *c,
 
 	if (g->aggressive_sync_destroy_thresh == 0U) {
 		nvgpu_mutex_acquire(&c->sync_lock);
-		c->sync = gk20a_channel_sync_create(c, false);
+		c->sync = nvgpu_channel_sync_create(c, false);
 		if (c->sync == NULL) {
 			err = -ENOMEM;
 			nvgpu_mutex_release(&c->sync_lock);
@@ -1253,7 +1253,7 @@ clean_up_prealloc:
 	}
 clean_up_sync:
 	if (c->sync) {
-		gk20a_channel_sync_destroy(c->sync, false);
+		nvgpu_channel_sync_destroy(c->sync, false);
 		c->sync = NULL;
 	}
 clean_up_unmap:
@@ -1984,7 +1984,7 @@ void gk20a_channel_clean_up_jobs(struct channel_gk20a *c,
 			if (nvgpu_atomic_dec_and_test(
 				&c->sync->refcount) &&
 				g->aggressive_sync_destroy) {
-				gk20a_channel_sync_destroy(c->sync,
+				nvgpu_channel_sync_destroy(c->sync,
 					false);
 				c->sync = NULL;
 			}
diff --git a/drivers/gpu/nvgpu/common/fifo/submit.c b/drivers/gpu/nvgpu/common/fifo/submit.c
index 1f7a04a2..5a0beea9 100644
--- a/drivers/gpu/nvgpu/common/fifo/submit.c
+++ b/drivers/gpu/nvgpu/common/fifo/submit.c
@@ -24,12 +24,12 @@
 #include <nvgpu/ltc.h>
 #include <nvgpu/os_sched.h>
 #include <nvgpu/utils.h>
+#include <nvgpu/channel_sync.h>
 
 #include <nvgpu/hw/gk20a/hw_pbdma_gk20a.h>
 
 #include "gk20a/gk20a.h"
 #include "gk20a/fence_gk20a.h"
-#include "gk20a/channel_sync_gk20a.h"
 
 #include <trace/events/gk20a.h>
 
@@ -56,7 +56,7 @@ static int nvgpu_submit_prepare_syncs(struct channel_gk20a *c,
 	if (g->aggressive_sync_destroy_thresh) {
 		nvgpu_mutex_acquire(&c->sync_lock);
 		if (!c->sync) {
-			c->sync = gk20a_channel_sync_create(c, false);
+			c->sync = nvgpu_channel_sync_create(c, false);
 			if (!c->sync) {
 				err = -ENOMEM;
 				nvgpu_mutex_release(&c->sync_lock);
@@ -409,7 +409,7 @@ static int nvgpu_submit_channel_gpfifo(struct channel_gk20a *c,
 	}
 
 	need_sync_framework =
-		gk20a_channel_sync_needs_sync_framework(g) ||
+		nvgpu_channel_sync_needs_os_fence_framework(g) ||
 		(flags & NVGPU_SUBMIT_FLAGS_SYNC_FENCE &&
 		 flags & NVGPU_SUBMIT_FLAGS_FENCE_GET);
 
diff --git a/drivers/gpu/nvgpu/common/sync/channel_sync.c b/drivers/gpu/nvgpu/common/sync/channel_sync.c
new file mode 100644
index 00000000..b4caab38
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/sync/channel_sync.c
@@ -0,0 +1,670 @@
1/*
2 * GK20A Channel Synchronization Abstraction
3 *
4 * Copyright (c) 2014-2018, NVIDIA CORPORATION. All rights reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 */
24
25#include <nvgpu/semaphore.h>
26#include <nvgpu/kmem.h>
27#include <nvgpu/log.h>
28#include <nvgpu/atomic.h>
29#include <nvgpu/bug.h>
30#include <nvgpu/list.h>
31#include <nvgpu/nvhost.h>
32#include <nvgpu/os_fence.h>
33#include <nvgpu/channel.h>
34#include <nvgpu/channel_sync.h>
35
36#include "gk20a/gk20a.h"
37#include "gk20a/fence_gk20a.h"
38#include "gk20a/mm_gk20a.h"
39
40#ifdef CONFIG_TEGRA_GK20A_NVHOST
41
42struct nvgpu_channel_sync_syncpt {
43 struct nvgpu_channel_sync ops;
44 struct channel_gk20a *c;
45 struct nvgpu_nvhost_dev *nvhost_dev;
46 u32 id;
47 struct nvgpu_mem syncpt_buf;
48};
49
50int channel_sync_syncpt_gen_wait_cmd(struct channel_gk20a *c,
51 u32 id, u32 thresh, struct priv_cmd_entry *wait_cmd,
52 u32 wait_cmd_size, int pos, bool preallocated)
53{
54 int err = 0;
55 bool is_expired = nvgpu_nvhost_syncpt_is_expired_ext(
56 c->g->nvhost_dev, id, thresh);
57
58 if (is_expired) {
59 if (preallocated) {
60 nvgpu_memset(c->g, wait_cmd->mem,
61 (wait_cmd->off + (u32)pos * wait_cmd_size) * (u32)sizeof(u32),
62 0, wait_cmd_size * (u32)sizeof(u32));
63 }
64 } else {
65 if (!preallocated) {
66 err = gk20a_channel_alloc_priv_cmdbuf(c,
67 c->g->ops.fifo.get_syncpt_wait_cmd_size(), wait_cmd);
68 if (err != 0) {
69 nvgpu_err(c->g, "not enough priv cmd buffer space");
70 return err;
71 }
72 }
73 nvgpu_log(c->g, gpu_dbg_info, "sp->id %d gpu va %llx",
74 id, c->vm->syncpt_ro_map_gpu_va);
75 c->g->ops.fifo.add_syncpt_wait_cmd(c->g, wait_cmd,
76 (u32)pos * wait_cmd_size, id, thresh,
77 c->vm->syncpt_ro_map_gpu_va);
78 }
79
80 return 0;
81}
82
83static int channel_sync_syncpt_wait_raw(struct nvgpu_channel_sync *s,
84 u32 id, u32 thresh, struct priv_cmd_entry *wait_cmd)
85{
86 struct nvgpu_channel_sync_syncpt *sp =
87 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
88 struct channel_gk20a *c = sp->c;
89 int err = 0;
90 u32 wait_cmd_size = c->g->ops.fifo.get_syncpt_wait_cmd_size();
91
92 if (!nvgpu_nvhost_syncpt_is_valid_pt_ext(sp->nvhost_dev, id)) {
93 return -EINVAL;
94 }
95
96 err = channel_sync_syncpt_gen_wait_cmd(c, id, thresh,
97 wait_cmd, wait_cmd_size, 0, false);
98
99 return err;
100}
101
102static int channel_sync_syncpt_wait_fd(struct nvgpu_channel_sync *s, int fd,
103 struct priv_cmd_entry *wait_cmd, int max_wait_cmds)
104{
105 struct nvgpu_os_fence os_fence = {0};
106 struct nvgpu_channel_sync_syncpt *sp =
107 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
108 struct channel_gk20a *c = sp->c;
109 int err = 0;
110
111 err = nvgpu_os_fence_fdget(&os_fence, c, fd);
112 if (err != 0) {
113 return -EINVAL;
114 }
115
116 err = os_fence.ops->program_waits(&os_fence,
117 wait_cmd, c, max_wait_cmds);
118
119 os_fence.ops->drop_ref(&os_fence);
120
121 return err;
122}
123
124static void channel_sync_syncpt_update(void *priv, int nr_completed)
125{
126 struct channel_gk20a *ch = priv;
127
128 gk20a_channel_update(ch);
129
130 /* note: channel_get() is in channel_sync_syncpt_incr_common() */
131 gk20a_channel_put(ch);
132}
133
134static int channel_sync_syncpt_incr_common(struct nvgpu_channel_sync *s,
135 bool wfi_cmd,
136 bool register_irq,
137 struct priv_cmd_entry *incr_cmd,
138 struct gk20a_fence *fence,
139 bool need_sync_fence)
140{
141 u32 thresh;
142 int err;
143 struct nvgpu_channel_sync_syncpt *sp =
144 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
145 struct channel_gk20a *c = sp->c;
146 struct nvgpu_os_fence os_fence = {0};
147
148 err = gk20a_channel_alloc_priv_cmdbuf(c,
149 c->g->ops.fifo.get_syncpt_incr_cmd_size(wfi_cmd),
150 incr_cmd);
151 if (err != 0) {
152 return err;
153 }
154
155 nvgpu_log(c->g, gpu_dbg_info, "sp->id %d gpu va %llx",
156 sp->id, sp->syncpt_buf.gpu_va);
157 c->g->ops.fifo.add_syncpt_incr_cmd(c->g, wfi_cmd,
158 incr_cmd, sp->id, sp->syncpt_buf.gpu_va);
159
160 thresh = nvgpu_nvhost_syncpt_incr_max_ext(sp->nvhost_dev, sp->id,
161 c->g->ops.fifo.get_syncpt_incr_per_release());
162
163 if (register_irq) {
164 struct channel_gk20a *referenced = gk20a_channel_get(c);
165
166 WARN_ON(!referenced);
167
168 if (referenced) {
169 /* note: channel_put() is in
170 * channel_sync_syncpt_update() */
171
172 err = nvgpu_nvhost_intr_register_notifier(
173 sp->nvhost_dev,
174 sp->id, thresh,
175 channel_sync_syncpt_update, c);
176 if (err != 0) {
177 gk20a_channel_put(referenced);
178 }
179
180 /* Adding interrupt action should
181 * never fail. A proper error handling
182 * here would require us to decrement
183 * the syncpt max back to its original
184 * value. */
185 WARN(err,
186 "failed to set submit complete interrupt");
187 }
188 }
189
190 if (need_sync_fence) {
191 err = nvgpu_os_fence_syncpt_create(&os_fence, c, sp->nvhost_dev,
192 sp->id, thresh);
193
194 if (err != 0) {
195 goto clean_up_priv_cmd;
196 }
197 }
198
199 err = gk20a_fence_from_syncpt(fence, sp->nvhost_dev,
200 sp->id, thresh, os_fence);
201
202 if (err != 0) {
203 if (nvgpu_os_fence_is_initialized(&os_fence) != 0) {
204 os_fence.ops->drop_ref(&os_fence);
205 }
206 goto clean_up_priv_cmd;
207 }
208
209 return 0;
210
211clean_up_priv_cmd:
212 gk20a_free_priv_cmdbuf(c, incr_cmd);
213 return err;
214}
215
216static int channel_sync_syncpt_incr(struct nvgpu_channel_sync *s,
217 struct priv_cmd_entry *entry,
218 struct gk20a_fence *fence,
219 bool need_sync_fence,
220 bool register_irq)
221{
222 /* Don't put wfi cmd to this one since we're not returning
223 * a fence to user space. */
224 return channel_sync_syncpt_incr_common(s,
225 false /* no wfi */,
226 register_irq /* register irq */,
227 entry, fence, need_sync_fence);
228}
229
230static int channel_sync_syncpt_incr_user(struct nvgpu_channel_sync *s,
231 int wait_fence_fd,
232 struct priv_cmd_entry *entry,
233 struct gk20a_fence *fence,
234 bool wfi,
235 bool need_sync_fence,
236 bool register_irq)
237{
238 /* Need to do 'wfi + host incr' since we return the fence
239 * to user space. */
240 return channel_sync_syncpt_incr_common(s,
241 wfi,
242 register_irq /* register irq */,
243 entry, fence, need_sync_fence);
244}
245
246static void channel_sync_syncpt_set_min_eq_max(struct nvgpu_channel_sync *s)
247{
248 struct nvgpu_channel_sync_syncpt *sp =
249 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
250 nvgpu_nvhost_syncpt_set_min_eq_max_ext(sp->nvhost_dev, sp->id);
251}
252
253static void channel_sync_syncpt_set_safe_state(struct nvgpu_channel_sync *s)
254{
255 struct nvgpu_channel_sync_syncpt *sp =
256 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
257 nvgpu_nvhost_syncpt_set_safe_state(sp->nvhost_dev, sp->id);
258}
259
260static int syncpt_get_id(struct nvgpu_channel_sync *s)
261{
262 struct nvgpu_channel_sync_syncpt *sp =
263 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
264 return sp->id;
265}
266
267static u64 channel_sync_syncpt_get_address(struct nvgpu_channel_sync *s)
268{
269 struct nvgpu_channel_sync_syncpt *sp =
270 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
271 return sp->syncpt_buf.gpu_va;
272}
273
274static void channel_sync_syncpt_destroy(struct nvgpu_channel_sync *s)
275{
276 struct nvgpu_channel_sync_syncpt *sp =
277 container_of(s, struct nvgpu_channel_sync_syncpt, ops);
278
279
280 sp->c->g->ops.fifo.free_syncpt_buf(sp->c, &sp->syncpt_buf);
281
282 nvgpu_nvhost_syncpt_set_min_eq_max_ext(sp->nvhost_dev, sp->id);
283 nvgpu_nvhost_syncpt_put_ref_ext(sp->nvhost_dev, sp->id);
284 nvgpu_kfree(sp->c->g, sp);
285}
286
287static struct nvgpu_channel_sync *
288channel_sync_syncpt_create(struct channel_gk20a *c, bool user_managed)
289{
290 struct nvgpu_channel_sync_syncpt *sp;
291 char syncpt_name[32];
292
293 sp = nvgpu_kzalloc(c->g, sizeof(*sp));
294 if (sp == NULL) {
295 return NULL;
296 }
297
298 sp->c = c;
299 sp->nvhost_dev = c->g->nvhost_dev;
300
301 if (user_managed) {
302 snprintf(syncpt_name, sizeof(syncpt_name),
303 "%s_%d_user", c->g->name, c->chid);
304
305 sp->id = nvgpu_nvhost_get_syncpt_client_managed(sp->nvhost_dev,
306 syncpt_name);
307 } else {
308 snprintf(syncpt_name, sizeof(syncpt_name),
309 "%s_%d", c->g->name, c->chid);
310
311 sp->id = nvgpu_nvhost_get_syncpt_host_managed(sp->nvhost_dev,
312 c->chid, syncpt_name);
313 }
314 if (sp->id == 0) {
315 nvgpu_kfree(c->g, sp);
316 nvgpu_err(c->g, "failed to get free syncpt");
317 return NULL;
318 }
319
320 sp->c->g->ops.fifo.alloc_syncpt_buf(sp->c, sp->id,
321 &sp->syncpt_buf);
322
323 nvgpu_nvhost_syncpt_set_min_eq_max_ext(sp->nvhost_dev, sp->id);
324
325 nvgpu_atomic_set(&sp->ops.refcount, 0);
326 sp->ops.wait_syncpt = channel_sync_syncpt_wait_raw;
327 sp->ops.wait_fd = channel_sync_syncpt_wait_fd;
328 sp->ops.incr = channel_sync_syncpt_incr;
329 sp->ops.incr_user = channel_sync_syncpt_incr_user;
330 sp->ops.set_min_eq_max = channel_sync_syncpt_set_min_eq_max;
331 sp->ops.set_safe_state = channel_sync_syncpt_set_safe_state;
332 sp->ops.syncpt_id = syncpt_get_id;
333 sp->ops.syncpt_address = channel_sync_syncpt_get_address;
334 sp->ops.destroy = channel_sync_syncpt_destroy;
335
336 return &sp->ops;
337}
338#endif /* CONFIG_TEGRA_GK20A_NVHOST */
339
340struct nvgpu_channel_sync_semaphore {
341 struct nvgpu_channel_sync ops;
342 struct channel_gk20a *c;
343
344 /* A semaphore pool owned by this channel. */
345 struct nvgpu_semaphore_pool *pool;
346};
347
348static void add_sema_cmd(struct gk20a *g, struct channel_gk20a *c,
349 struct nvgpu_semaphore *s, struct priv_cmd_entry *cmd,
350 u32 offset, bool acquire, bool wfi)
351{
352 int ch = c->chid;
353 u32 ob, off = cmd->off + offset;
354 u64 va;
355
356 ob = off;
357
358 /*
359 * RO for acquire (since we just need to read the mem) and RW for
360 * release since we will need to write back to the semaphore memory.
361 */
362 va = acquire ? nvgpu_semaphore_gpu_ro_va(s) :
363 nvgpu_semaphore_gpu_rw_va(s);
364
365 /*
366 * If the op is not an acquire (so therefor a release) we should
367 * incr the underlying sema next_value.
368 */
369 if (!acquire) {
370 nvgpu_semaphore_prepare(s, c->hw_sema);
371 }
372
373 g->ops.fifo.add_sema_cmd(g, s, va, cmd, off, acquire, wfi);
374
375 if (acquire) {
376 gpu_sema_verbose_dbg(g, "(A) c=%d ACQ_GE %-4u pool=%-3llu"
377 "va=0x%llx cmd_mem=0x%llx b=0x%llx off=%u",
378 ch, nvgpu_semaphore_get_value(s),
379 s->location.pool->page_idx, va, cmd->gva,
380 cmd->mem->gpu_va, ob);
381 } else {
382 gpu_sema_verbose_dbg(g, "(R) c=%d INCR %u (%u) pool=%-3llu"
383 "va=0x%llx cmd_mem=0x%llx b=0x%llx off=%u",
384 ch, nvgpu_semaphore_get_value(s),
385 nvgpu_semaphore_read(s),
386 s->location.pool->page_idx,
387 va, cmd->gva, cmd->mem->gpu_va, ob);
388 }
389}
390
391void channel_sync_semaphore_gen_wait_cmd(struct channel_gk20a *c,
392 struct nvgpu_semaphore *sema, struct priv_cmd_entry *wait_cmd,
393 u32 wait_cmd_size, int pos)
394{
395 if (sema == NULL) {
396 /* expired */
397 nvgpu_memset(c->g, wait_cmd->mem,
398 (wait_cmd->off + (u32)pos * wait_cmd_size) * (u32)sizeof(u32),
399 0, wait_cmd_size * (u32)sizeof(u32));
400 } else {
401 WARN_ON(!sema->incremented);
402 add_sema_cmd(c->g, c, sema, wait_cmd,
403 (u32)pos * wait_cmd_size, true, false);
404 nvgpu_semaphore_put(sema);
405 }
406}
407
408static int channel_sync_semaphore_wait_raw_syncpt(
409 struct nvgpu_channel_sync *s, u32 id,
410 u32 thresh, struct priv_cmd_entry *entry)
411{
412 struct nvgpu_channel_sync_semaphore *sema =
413 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
414 struct gk20a *g = sema->c->g;
415 nvgpu_err(g, "trying to use syncpoint synchronization");
416 return -ENODEV;
417}
418
419static int channel_sync_semaphore_wait_fd(
420 struct nvgpu_channel_sync *s, int fd,
421 struct priv_cmd_entry *entry, int max_wait_cmds)
422{
423 struct nvgpu_channel_sync_semaphore *sema =
424 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
425 struct channel_gk20a *c = sema->c;
426
427 struct nvgpu_os_fence os_fence = {0};
428 int err;
429
430 err = nvgpu_os_fence_fdget(&os_fence, c, fd);
431 if (err != 0) {
432 return err;
433 }
434
435 err = os_fence.ops->program_waits(&os_fence,
436 entry, c, max_wait_cmds);
437
438 os_fence.ops->drop_ref(&os_fence);
439
440 return err;
441}
442
443static int channel_sync_semaphore_incr_common(
444 struct nvgpu_channel_sync *s, bool wfi_cmd,
445 struct priv_cmd_entry *incr_cmd,
446 struct gk20a_fence *fence,
447 bool need_sync_fence)
448{
449 u32 incr_cmd_size;
450 struct nvgpu_channel_sync_semaphore *sp =
451 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
452 struct channel_gk20a *c = sp->c;
453 struct nvgpu_semaphore *semaphore;
454 int err = 0;
455 struct nvgpu_os_fence os_fence = {0};
456
457 semaphore = nvgpu_semaphore_alloc(c);
458 if (semaphore == NULL) {
459 nvgpu_err(c->g,
460 "ran out of semaphores");
461 return -ENOMEM;
462 }
463
464 incr_cmd_size = c->g->ops.fifo.get_sema_incr_cmd_size();
465 err = gk20a_channel_alloc_priv_cmdbuf(c, incr_cmd_size, incr_cmd);
466 if (err) {
467 nvgpu_err(c->g,
468 "not enough priv cmd buffer space");
469 goto clean_up_sema;
470 }
471
472 /* Release the completion semaphore. */
473 add_sema_cmd(c->g, c, semaphore, incr_cmd, 0, false, wfi_cmd);
474
475 if (need_sync_fence) {
476 err = nvgpu_os_fence_sema_create(&os_fence, c,
477 semaphore);
478
479 if (err) {
480 goto clean_up_sema;
481 }
482 }
483
484 err = gk20a_fence_from_semaphore(fence,
485 semaphore,
486 &c->semaphore_wq,
487 os_fence);
488
489 if (err != 0) {
490 if (nvgpu_os_fence_is_initialized(&os_fence) != 0) {
491 os_fence.ops->drop_ref(&os_fence);
492 }
493 goto clean_up_sema;
494 }
495
496 return 0;
497
498clean_up_sema:
499 nvgpu_semaphore_put(semaphore);
500 return err;
501}
502
503static int channel_sync_semaphore_incr(
504 struct nvgpu_channel_sync *s,
505 struct priv_cmd_entry *entry,
506 struct gk20a_fence *fence,
507 bool need_sync_fence,
508 bool register_irq)
509{
510 /* Don't put wfi cmd to this one since we're not returning
511 * a fence to user space. */
512 return channel_sync_semaphore_incr_common(s,
513 false /* no wfi */,
514 entry, fence, need_sync_fence);
515}
516
517static int channel_sync_semaphore_incr_user(
518 struct nvgpu_channel_sync *s,
519 int wait_fence_fd,
520 struct priv_cmd_entry *entry,
521 struct gk20a_fence *fence,
522 bool wfi,
523 bool need_sync_fence,
524 bool register_irq)
525{
526#ifdef CONFIG_SYNC
527 int err;
528
529 err = channel_sync_semaphore_incr_common(s, wfi, entry, fence,
530 need_sync_fence);
531 if (err != 0) {
532 return err;
533 }
534
535 return 0;
536#else
537 struct nvgpu_channel_sync_semaphore *sema =
538 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
539 nvgpu_err(sema->c->g,
540 "trying to use sync fds with CONFIG_SYNC disabled");
541 return -ENODEV;
542#endif
543}
544
545static void channel_sync_semaphore_set_min_eq_max(struct nvgpu_channel_sync *s)
546{
547 struct nvgpu_channel_sync_semaphore *sp =
548 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
549 struct channel_gk20a *c = sp->c;
550 bool updated;
551
552 if (c->hw_sema == NULL) {
553 return;
554 }
555
556 updated = nvgpu_semaphore_reset(c->hw_sema);
557
558 if (updated) {
559 nvgpu_cond_broadcast_interruptible(&c->semaphore_wq);
560 }
561}
562
563static void channel_sync_semaphore_set_safe_state(struct nvgpu_channel_sync *s)
564{
565 /* Nothing to do. */
566}
567
568static int channel_sync_semaphore_get_id(struct nvgpu_channel_sync *s)
569{
570 return -EINVAL;
571}
572
573static u64 channel_sync_semaphore_get_address(struct nvgpu_channel_sync *s)
574{
575 return 0;
576}
577
578static void channel_sync_semaphore_destroy(struct nvgpu_channel_sync *s)
579{
580 struct nvgpu_channel_sync_semaphore *sema =
581 container_of(s, struct nvgpu_channel_sync_semaphore, ops);
582
583 struct channel_gk20a *c = sema->c;
584 struct gk20a *g = c->g;
585
586 if (c->has_os_fence_framework_support &&
587 g->os_channel.os_fence_framework_inst_exists(c)) {
588 g->os_channel.destroy_os_fence_framework(c);
589 }
590
591 /* The sema pool is cleaned up by the VM destroy. */
592 sema->pool = NULL;
593
594 nvgpu_kfree(sema->c->g, sema);
595}
596
597static struct nvgpu_channel_sync *
598channel_sync_semaphore_create(struct channel_gk20a *c, bool user_managed)
599{
600 struct nvgpu_channel_sync_semaphore *sema;
601 struct gk20a *g = c->g;
602 char pool_name[20];
603 int asid = -1;
604 int err;
605
606 if (WARN_ON(c->vm == NULL)) {
607 return NULL;
608 }
609
610 sema = nvgpu_kzalloc(c->g, sizeof(*sema));
611 if (sema == NULL) {
612 return NULL;
613 }
614 sema->c = c;
615
616 sprintf(pool_name, "semaphore_pool-%d", c->chid);
617 sema->pool = c->vm->sema_pool;
618
619 if (c->vm->as_share != NULL) {
620 asid = c->vm->as_share->id;
621 }
622
623 if (c->has_os_fence_framework_support) {
624 /*Init the sync_timeline for this channel */
625 err = g->os_channel.init_os_fence_framework(c,
626 "gk20a_ch%d_as%d", c->chid, asid);
627
628 if (err != 0) {
629 nvgpu_kfree(g, sema);
630 return NULL;
631 }
632 }
633
634 nvgpu_atomic_set(&sema->ops.refcount, 0);
635 sema->ops.wait_syncpt = channel_sync_semaphore_wait_raw_syncpt;
636 sema->ops.wait_fd = channel_sync_semaphore_wait_fd;
637 sema->ops.incr = channel_sync_semaphore_incr;
638 sema->ops.incr_user = channel_sync_semaphore_incr_user;
639 sema->ops.set_min_eq_max = channel_sync_semaphore_set_min_eq_max;
640 sema->ops.set_safe_state = channel_sync_semaphore_set_safe_state;
641 sema->ops.syncpt_id = channel_sync_semaphore_get_id;
642 sema->ops.syncpt_address = channel_sync_semaphore_get_address;
643 sema->ops.destroy = channel_sync_semaphore_destroy;
644
645 return &sema->ops;
646}
647
648void nvgpu_channel_sync_destroy(struct nvgpu_channel_sync *sync,
649 bool set_safe_state)
650{
651 if (set_safe_state) {
652 sync->set_safe_state(sync);
653 }
654 sync->destroy(sync);
655}
656
657struct nvgpu_channel_sync *nvgpu_channel_sync_create(struct channel_gk20a *c,
658 bool user_managed)
659{
660#ifdef CONFIG_TEGRA_GK20A_NVHOST
661 if (gk20a_platform_has_syncpoints(c->g))
662 return channel_sync_syncpt_create(c, user_managed);
663#endif
664 return channel_sync_semaphore_create(c, user_managed);
665}
666
667bool nvgpu_channel_sync_needs_os_fence_framework(struct gk20a *g)
668{
669 return !gk20a_platform_has_syncpoints(g);
670}