diff options
Diffstat (limited to 'include/os/linux/ioctl_tsg.c')
-rw-r--r-- | include/os/linux/ioctl_tsg.c | 750 |
1 files changed, 750 insertions, 0 deletions
diff --git a/include/os/linux/ioctl_tsg.c b/include/os/linux/ioctl_tsg.c new file mode 100644 index 0000000..2f8cb3a --- /dev/null +++ b/include/os/linux/ioctl_tsg.c | |||
@@ -0,0 +1,750 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2014-2020, NVIDIA CORPORATION. All rights reserved. | ||
3 | * | ||
4 | * This program is free software; you can redistribute it and/or modify it | ||
5 | * under the terms and conditions of the GNU General Public License, | ||
6 | * version 2, as published by the Free Software Foundation. | ||
7 | * | ||
8 | * This program is distributed in the hope it will be useful, but WITHOUT | ||
9 | * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | ||
10 | * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for | ||
11 | * more details. | ||
12 | * | ||
13 | * You should have received a copy of the GNU General Public License | ||
14 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | ||
15 | */ | ||
16 | |||
17 | #include <linux/fs.h> | ||
18 | #include <linux/file.h> | ||
19 | #include <linux/cdev.h> | ||
20 | #include <linux/uaccess.h> | ||
21 | #include <linux/poll.h> | ||
22 | #include <uapi/linux/nvgpu.h> | ||
23 | #include <linux/anon_inodes.h> | ||
24 | |||
25 | #include <nvgpu/kmem.h> | ||
26 | #include <nvgpu/log.h> | ||
27 | #include <nvgpu/os_sched.h> | ||
28 | #include <nvgpu/gk20a.h> | ||
29 | #include <nvgpu/channel.h> | ||
30 | #include <nvgpu/tsg.h> | ||
31 | |||
32 | #include "gv11b/fifo_gv11b.h" | ||
33 | #include "platform_gk20a.h" | ||
34 | #include "ioctl_tsg.h" | ||
35 | #include "ioctl_channel.h" | ||
36 | #include "os_linux.h" | ||
37 | |||
/*
 * Per-open-file state for a TSG device node. Allocated in
 * nvgpu_ioctl_tsg_open() and stored in filp->private_data; freed in
 * nvgpu_ioctl_tsg_dev_release().
 */
struct tsg_private {
	struct gk20a *g;	/* GPU instance; a gk20a_get() ref is held */
	struct tsg_gk20a *tsg;	/* TSG bound to this file descriptor */
};
43 | static int gk20a_tsg_bind_channel_fd(struct tsg_gk20a *tsg, int ch_fd) | ||
44 | { | ||
45 | struct channel_gk20a *ch; | ||
46 | int err; | ||
47 | |||
48 | ch = gk20a_get_channel_from_file(ch_fd); | ||
49 | if (!ch) | ||
50 | return -EINVAL; | ||
51 | |||
52 | err = ch->g->ops.fifo.tsg_bind_channel(tsg, ch); | ||
53 | |||
54 | gk20a_channel_put(ch); | ||
55 | return err; | ||
56 | } | ||
57 | |||
58 | static int gk20a_tsg_ioctl_bind_channel_ex(struct gk20a *g, | ||
59 | struct tsg_gk20a *tsg, struct nvgpu_tsg_bind_channel_ex_args *arg) | ||
60 | { | ||
61 | struct nvgpu_sched_ctrl *sched = &g->sched_ctrl; | ||
62 | struct channel_gk20a *ch; | ||
63 | struct gr_gk20a *gr = &g->gr; | ||
64 | int err = 0; | ||
65 | |||
66 | nvgpu_log(g, gpu_dbg_fn | gpu_dbg_sched, "tsgid=%u", tsg->tsgid); | ||
67 | |||
68 | nvgpu_mutex_acquire(&sched->control_lock); | ||
69 | if (sched->control_locked) { | ||
70 | err = -EPERM; | ||
71 | goto mutex_release; | ||
72 | } | ||
73 | err = gk20a_busy(g); | ||
74 | if (err) { | ||
75 | nvgpu_err(g, "failed to power on gpu"); | ||
76 | goto mutex_release; | ||
77 | } | ||
78 | |||
79 | ch = gk20a_get_channel_from_file(arg->channel_fd); | ||
80 | if (!ch) { | ||
81 | err = -EINVAL; | ||
82 | goto idle; | ||
83 | } | ||
84 | |||
85 | if (arg->tpc_pg_enabled && (!tsg->tpc_num_initialized)) { | ||
86 | if ((arg->num_active_tpcs > gr->max_tpc_count) || | ||
87 | !(arg->num_active_tpcs)) { | ||
88 | nvgpu_err(g, "Invalid num of active TPCs"); | ||
89 | err = -EINVAL; | ||
90 | goto ch_put; | ||
91 | } | ||
92 | tsg->tpc_num_initialized = true; | ||
93 | tsg->num_active_tpcs = arg->num_active_tpcs; | ||
94 | tsg->tpc_pg_enabled = true; | ||
95 | } else { | ||
96 | tsg->tpc_pg_enabled = false; nvgpu_log(g, gpu_dbg_info, "dynamic TPC-PG not enabled"); | ||
97 | } | ||
98 | |||
99 | if (arg->subcontext_id < g->fifo.max_subctx_count) { | ||
100 | ch->subctx_id = arg->subcontext_id; | ||
101 | } else { | ||
102 | err = -EINVAL; | ||
103 | goto ch_put; | ||
104 | } | ||
105 | |||
106 | nvgpu_log(g, gpu_dbg_info, "channel id : %d : subctx: %d", | ||
107 | ch->chid, ch->subctx_id); | ||
108 | |||
109 | /* Use runqueue selector 1 for all ASYNC ids */ | ||
110 | if (ch->subctx_id > CHANNEL_INFO_VEID0) | ||
111 | ch->runqueue_sel = 1; | ||
112 | |||
113 | err = ch->g->ops.fifo.tsg_bind_channel(tsg, ch); | ||
114 | ch_put: | ||
115 | gk20a_channel_put(ch); | ||
116 | idle: | ||
117 | gk20a_idle(g); | ||
118 | mutex_release: | ||
119 | nvgpu_mutex_release(&sched->control_lock); | ||
120 | return err; | ||
121 | } | ||
122 | |||
123 | static int gk20a_tsg_unbind_channel_fd(struct tsg_gk20a *tsg, int ch_fd) | ||
124 | { | ||
125 | struct channel_gk20a *ch; | ||
126 | int err = 0; | ||
127 | |||
128 | ch = gk20a_get_channel_from_file(ch_fd); | ||
129 | if (!ch) | ||
130 | return -EINVAL; | ||
131 | |||
132 | if (ch->tsgid != tsg->tsgid) { | ||
133 | err = -EINVAL; | ||
134 | goto out; | ||
135 | } | ||
136 | |||
137 | err = gk20a_tsg_unbind_channel(ch); | ||
138 | |||
139 | /* | ||
140 | * Mark the channel timedout since channel unbound from TSG | ||
141 | * has no context of its own so it can't serve any job | ||
142 | */ | ||
143 | gk20a_channel_set_timedout(ch); | ||
144 | |||
145 | out: | ||
146 | gk20a_channel_put(ch); | ||
147 | return err; | ||
148 | } | ||
149 | |||
150 | static int gk20a_tsg_get_event_data_from_id(struct tsg_gk20a *tsg, | ||
151 | unsigned int event_id, | ||
152 | struct gk20a_event_id_data **event_id_data) | ||
153 | { | ||
154 | struct gk20a_event_id_data *local_event_id_data; | ||
155 | bool event_found = false; | ||
156 | |||
157 | nvgpu_mutex_acquire(&tsg->event_id_list_lock); | ||
158 | nvgpu_list_for_each_entry(local_event_id_data, &tsg->event_id_list, | ||
159 | gk20a_event_id_data, event_id_node) { | ||
160 | if (local_event_id_data->event_id == event_id) { | ||
161 | event_found = true; | ||
162 | break; | ||
163 | } | ||
164 | } | ||
165 | nvgpu_mutex_release(&tsg->event_id_list_lock); | ||
166 | |||
167 | if (event_found) { | ||
168 | *event_id_data = local_event_id_data; | ||
169 | return 0; | ||
170 | } else { | ||
171 | return -1; | ||
172 | } | ||
173 | } | ||
174 | |||
175 | /* | ||
176 | * Convert common event_id of the form NVGPU_EVENT_ID_* to Linux specific | ||
177 | * event_id of the form NVGPU_IOCTL_CHANNEL_EVENT_ID_* which is used in IOCTLs | ||
178 | */ | ||
179 | static u32 nvgpu_event_id_to_ioctl_channel_event_id(u32 event_id) | ||
180 | { | ||
181 | switch (event_id) { | ||
182 | case NVGPU_EVENT_ID_BPT_INT: | ||
183 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_BPT_INT; | ||
184 | case NVGPU_EVENT_ID_BPT_PAUSE: | ||
185 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_BPT_PAUSE; | ||
186 | case NVGPU_EVENT_ID_BLOCKING_SYNC: | ||
187 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_BLOCKING_SYNC; | ||
188 | case NVGPU_EVENT_ID_CILP_PREEMPTION_STARTED: | ||
189 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_CILP_PREEMPTION_STARTED; | ||
190 | case NVGPU_EVENT_ID_CILP_PREEMPTION_COMPLETE: | ||
191 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_CILP_PREEMPTION_COMPLETE; | ||
192 | case NVGPU_EVENT_ID_GR_SEMAPHORE_WRITE_AWAKEN: | ||
193 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_GR_SEMAPHORE_WRITE_AWAKEN; | ||
194 | } | ||
195 | |||
196 | return NVGPU_IOCTL_CHANNEL_EVENT_ID_MAX; | ||
197 | } | ||
198 | |||
199 | void gk20a_tsg_event_id_post_event(struct tsg_gk20a *tsg, | ||
200 | int __event_id) | ||
201 | { | ||
202 | struct gk20a_event_id_data *event_id_data; | ||
203 | u32 event_id; | ||
204 | int err = 0; | ||
205 | struct gk20a *g = tsg->g; | ||
206 | |||
207 | event_id = nvgpu_event_id_to_ioctl_channel_event_id(__event_id); | ||
208 | if (event_id >= NVGPU_IOCTL_CHANNEL_EVENT_ID_MAX) | ||
209 | return; | ||
210 | |||
211 | err = gk20a_tsg_get_event_data_from_id(tsg, event_id, | ||
212 | &event_id_data); | ||
213 | if (err) | ||
214 | return; | ||
215 | |||
216 | nvgpu_mutex_acquire(&event_id_data->lock); | ||
217 | |||
218 | nvgpu_log_info(g, | ||
219 | "posting event for event_id=%d on tsg=%d\n", | ||
220 | event_id, tsg->tsgid); | ||
221 | event_id_data->event_posted = true; | ||
222 | |||
223 | nvgpu_cond_broadcast_interruptible(&event_id_data->event_id_wq); | ||
224 | |||
225 | nvgpu_mutex_release(&event_id_data->lock); | ||
226 | } | ||
227 | |||
228 | static unsigned int gk20a_event_id_poll(struct file *filep, poll_table *wait) | ||
229 | { | ||
230 | unsigned int mask = 0; | ||
231 | struct gk20a_event_id_data *event_id_data = filep->private_data; | ||
232 | struct gk20a *g = event_id_data->g; | ||
233 | u32 event_id = event_id_data->event_id; | ||
234 | struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; | ||
235 | |||
236 | nvgpu_log(g, gpu_dbg_fn | gpu_dbg_info, " "); | ||
237 | |||
238 | poll_wait(filep, &event_id_data->event_id_wq.wq, wait); | ||
239 | |||
240 | nvgpu_mutex_acquire(&event_id_data->lock); | ||
241 | |||
242 | if (event_id_data->event_posted) { | ||
243 | nvgpu_log_info(g, | ||
244 | "found pending event_id=%d on TSG=%d\n", | ||
245 | event_id, tsg->tsgid); | ||
246 | mask = (POLLPRI | POLLIN); | ||
247 | event_id_data->event_posted = false; | ||
248 | } | ||
249 | |||
250 | nvgpu_mutex_release(&event_id_data->lock); | ||
251 | |||
252 | return mask; | ||
253 | } | ||
254 | |||
255 | static int gk20a_event_id_release(struct inode *inode, struct file *filp) | ||
256 | { | ||
257 | struct gk20a_event_id_data *event_id_data = filp->private_data; | ||
258 | struct gk20a *g = event_id_data->g; | ||
259 | struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; | ||
260 | |||
261 | nvgpu_mutex_acquire(&tsg->event_id_list_lock); | ||
262 | nvgpu_list_del(&event_id_data->event_id_node); | ||
263 | nvgpu_mutex_release(&tsg->event_id_list_lock); | ||
264 | |||
265 | nvgpu_mutex_destroy(&event_id_data->lock); | ||
266 | gk20a_put(g); | ||
267 | nvgpu_kfree(g, event_id_data); | ||
268 | filp->private_data = NULL; | ||
269 | |||
270 | return 0; | ||
271 | } | ||
272 | |||
/*
 * File operations for the anon-inode fd handed out by
 * gk20a_tsg_event_id_enable(); supports only poll() and close().
 */
const struct file_operations gk20a_event_id_ops = {
	.owner = THIS_MODULE,
	.poll = gk20a_event_id_poll,
	.release = gk20a_event_id_release,
};
278 | |||
279 | static int gk20a_tsg_event_id_enable(struct tsg_gk20a *tsg, | ||
280 | int event_id, | ||
281 | int *fd) | ||
282 | { | ||
283 | int err = 0; | ||
284 | int local_fd; | ||
285 | struct file *file; | ||
286 | char name[64]; | ||
287 | struct gk20a_event_id_data *event_id_data; | ||
288 | struct gk20a *g; | ||
289 | |||
290 | g = gk20a_get(tsg->g); | ||
291 | if (!g) | ||
292 | return -ENODEV; | ||
293 | |||
294 | err = gk20a_tsg_get_event_data_from_id(tsg, | ||
295 | event_id, &event_id_data); | ||
296 | if (err == 0) { | ||
297 | /* We already have event enabled */ | ||
298 | err = -EINVAL; | ||
299 | goto free_ref; | ||
300 | } | ||
301 | |||
302 | err = get_unused_fd_flags(O_RDWR); | ||
303 | if (err < 0) | ||
304 | goto free_ref; | ||
305 | local_fd = err; | ||
306 | |||
307 | snprintf(name, sizeof(name), "nvgpu-event%d-fd%d", | ||
308 | event_id, local_fd); | ||
309 | |||
310 | file = anon_inode_getfile(name, &gk20a_event_id_ops, | ||
311 | NULL, O_RDWR); | ||
312 | if (IS_ERR(file)) { | ||
313 | err = PTR_ERR(file); | ||
314 | goto clean_up; | ||
315 | } | ||
316 | |||
317 | event_id_data = nvgpu_kzalloc(tsg->g, sizeof(*event_id_data)); | ||
318 | if (!event_id_data) { | ||
319 | err = -ENOMEM; | ||
320 | goto clean_up_file; | ||
321 | } | ||
322 | event_id_data->g = g; | ||
323 | event_id_data->id = tsg->tsgid; | ||
324 | event_id_data->event_id = event_id; | ||
325 | |||
326 | nvgpu_cond_init(&event_id_data->event_id_wq); | ||
327 | err = nvgpu_mutex_init(&event_id_data->lock); | ||
328 | if (err) | ||
329 | goto clean_up_free; | ||
330 | |||
331 | nvgpu_init_list_node(&event_id_data->event_id_node); | ||
332 | |||
333 | nvgpu_mutex_acquire(&tsg->event_id_list_lock); | ||
334 | nvgpu_list_add_tail(&event_id_data->event_id_node, &tsg->event_id_list); | ||
335 | nvgpu_mutex_release(&tsg->event_id_list_lock); | ||
336 | |||
337 | fd_install(local_fd, file); | ||
338 | file->private_data = event_id_data; | ||
339 | |||
340 | *fd = local_fd; | ||
341 | |||
342 | return 0; | ||
343 | |||
344 | clean_up_free: | ||
345 | nvgpu_kfree(g, event_id_data); | ||
346 | clean_up_file: | ||
347 | fput(file); | ||
348 | clean_up: | ||
349 | put_unused_fd(local_fd); | ||
350 | free_ref: | ||
351 | gk20a_put(g); | ||
352 | return err; | ||
353 | } | ||
354 | |||
355 | static int gk20a_tsg_event_id_ctrl(struct gk20a *g, struct tsg_gk20a *tsg, | ||
356 | struct nvgpu_event_id_ctrl_args *args) | ||
357 | { | ||
358 | int err = 0; | ||
359 | int fd = -1; | ||
360 | |||
361 | if (args->event_id >= NVGPU_IOCTL_CHANNEL_EVENT_ID_MAX) | ||
362 | return -EINVAL; | ||
363 | |||
364 | nvgpu_speculation_barrier(); | ||
365 | switch (args->cmd) { | ||
366 | case NVGPU_IOCTL_CHANNEL_EVENT_ID_CMD_ENABLE: | ||
367 | err = gk20a_tsg_event_id_enable(tsg, args->event_id, &fd); | ||
368 | if (!err) | ||
369 | args->event_fd = fd; | ||
370 | break; | ||
371 | |||
372 | default: | ||
373 | nvgpu_err(tsg->g, "unrecognized tsg event id cmd: 0x%x", | ||
374 | args->cmd); | ||
375 | err = -EINVAL; | ||
376 | break; | ||
377 | } | ||
378 | |||
379 | return err; | ||
380 | } | ||
381 | |||
382 | int nvgpu_ioctl_tsg_open(struct gk20a *g, struct file *filp) | ||
383 | { | ||
384 | struct tsg_private *priv; | ||
385 | struct tsg_gk20a *tsg; | ||
386 | struct device *dev; | ||
387 | int err; | ||
388 | |||
389 | g = gk20a_get(g); | ||
390 | if (!g) | ||
391 | return -ENODEV; | ||
392 | |||
393 | dev = dev_from_gk20a(g); | ||
394 | |||
395 | nvgpu_log(g, gpu_dbg_fn, "tsg: %s", dev_name(dev)); | ||
396 | |||
397 | priv = nvgpu_kmalloc(g, sizeof(*priv)); | ||
398 | if (!priv) { | ||
399 | err = -ENOMEM; | ||
400 | goto free_ref; | ||
401 | } | ||
402 | |||
403 | err = gk20a_busy(g); | ||
404 | if (err) { | ||
405 | nvgpu_err(g, "failed to power on, %d", err); | ||
406 | goto free_mem; | ||
407 | } | ||
408 | |||
409 | tsg = gk20a_tsg_open(g, nvgpu_current_pid(g)); | ||
410 | gk20a_idle(g); | ||
411 | if (!tsg) { | ||
412 | err = -ENOMEM; | ||
413 | goto free_mem; | ||
414 | } | ||
415 | |||
416 | priv->g = g; | ||
417 | priv->tsg = tsg; | ||
418 | filp->private_data = priv; | ||
419 | |||
420 | gk20a_sched_ctrl_tsg_added(g, tsg); | ||
421 | |||
422 | return 0; | ||
423 | |||
424 | free_mem: | ||
425 | nvgpu_kfree(g, priv); | ||
426 | free_ref: | ||
427 | gk20a_put(g); | ||
428 | return err; | ||
429 | } | ||
430 | |||
431 | int nvgpu_ioctl_tsg_dev_open(struct inode *inode, struct file *filp) | ||
432 | { | ||
433 | struct nvgpu_os_linux *l; | ||
434 | struct gk20a *g; | ||
435 | int ret; | ||
436 | |||
437 | l = container_of(inode->i_cdev, | ||
438 | struct nvgpu_os_linux, tsg.cdev); | ||
439 | g = &l->g; | ||
440 | |||
441 | nvgpu_log_fn(g, " "); | ||
442 | |||
443 | ret = gk20a_busy(g); | ||
444 | if (ret) { | ||
445 | nvgpu_err(g, "failed to power on, %d", ret); | ||
446 | return ret; | ||
447 | } | ||
448 | |||
449 | ret = nvgpu_ioctl_tsg_open(&l->g, filp); | ||
450 | |||
451 | gk20a_idle(g); | ||
452 | nvgpu_log_fn(g, "done"); | ||
453 | return ret; | ||
454 | } | ||
455 | |||
/*
 * Refcount release callback for a TSG opened through this ioctl layer.
 * Deregisters the TSG from scheduler control, releases the TSG itself,
 * then drops the GPU reference taken in nvgpu_ioctl_tsg_open().
 * Ordering matters: the scheduler must stop seeing the TSG before
 * gk20a_tsg_release() tears it down.
 */
void nvgpu_ioctl_tsg_release(struct nvgpu_ref *ref)
{
	struct tsg_gk20a *tsg = container_of(ref, struct tsg_gk20a, refcount);
	struct gk20a *g = tsg->g;

	gk20a_sched_ctrl_tsg_removed(g, tsg);

	gk20a_tsg_release(ref);
	gk20a_put(g);
}
466 | |||
467 | int nvgpu_ioctl_tsg_dev_release(struct inode *inode, struct file *filp) | ||
468 | { | ||
469 | struct tsg_private *priv = filp->private_data; | ||
470 | struct tsg_gk20a *tsg; | ||
471 | |||
472 | if (!priv) { | ||
473 | /* open failed, never got a tsg for this file */ | ||
474 | return 0; | ||
475 | } | ||
476 | |||
477 | tsg = priv->tsg; | ||
478 | |||
479 | nvgpu_ref_put(&tsg->refcount, nvgpu_ioctl_tsg_release); | ||
480 | nvgpu_kfree(tsg->g, priv); | ||
481 | return 0; | ||
482 | } | ||
483 | |||
484 | static int gk20a_tsg_ioctl_set_runlist_interleave(struct gk20a *g, | ||
485 | struct tsg_gk20a *tsg, struct nvgpu_runlist_interleave_args *arg) | ||
486 | { | ||
487 | struct nvgpu_sched_ctrl *sched = &g->sched_ctrl; | ||
488 | u32 level = arg->level; | ||
489 | int err; | ||
490 | |||
491 | nvgpu_log(g, gpu_dbg_fn | gpu_dbg_sched, "tsgid=%u", tsg->tsgid); | ||
492 | |||
493 | nvgpu_mutex_acquire(&sched->control_lock); | ||
494 | if (sched->control_locked) { | ||
495 | err = -EPERM; | ||
496 | goto done; | ||
497 | } | ||
498 | err = gk20a_busy(g); | ||
499 | if (err) { | ||
500 | nvgpu_err(g, "failed to power on gpu"); | ||
501 | goto done; | ||
502 | } | ||
503 | |||
504 | level = nvgpu_get_common_runlist_level(level); | ||
505 | err = gk20a_tsg_set_runlist_interleave(tsg, level); | ||
506 | |||
507 | gk20a_idle(g); | ||
508 | done: | ||
509 | nvgpu_mutex_release(&sched->control_lock); | ||
510 | return err; | ||
511 | } | ||
512 | |||
513 | static int gk20a_tsg_ioctl_set_timeslice(struct gk20a *g, | ||
514 | struct tsg_gk20a *tsg, struct nvgpu_timeslice_args *arg) | ||
515 | { | ||
516 | struct nvgpu_sched_ctrl *sched = &g->sched_ctrl; | ||
517 | int err; | ||
518 | |||
519 | nvgpu_log(g, gpu_dbg_fn | gpu_dbg_sched, "tsgid=%u", tsg->tsgid); | ||
520 | |||
521 | nvgpu_mutex_acquire(&sched->control_lock); | ||
522 | if (sched->control_locked) { | ||
523 | err = -EPERM; | ||
524 | goto done; | ||
525 | } | ||
526 | err = gk20a_busy(g); | ||
527 | if (err) { | ||
528 | nvgpu_err(g, "failed to power on gpu"); | ||
529 | goto done; | ||
530 | } | ||
531 | err = gk20a_tsg_set_timeslice(tsg, arg->timeslice_us); | ||
532 | gk20a_idle(g); | ||
533 | done: | ||
534 | nvgpu_mutex_release(&sched->control_lock); | ||
535 | return err; | ||
536 | } | ||
537 | |||
/*
 * NVGPU_IOCTL_TSG_GET_TIMESLICE handler: report the TSG's current
 * timeslice (microseconds) back through @arg. Always succeeds.
 */
static int gk20a_tsg_ioctl_get_timeslice(struct gk20a *g,
	struct tsg_gk20a *tsg, struct nvgpu_timeslice_args *arg)
{
	arg->timeslice_us = gk20a_tsg_get_timeslice(tsg);
	return 0;
}
544 | |||
545 | static int gk20a_tsg_ioctl_read_single_sm_error_state(struct gk20a *g, | ||
546 | struct tsg_gk20a *tsg, | ||
547 | struct nvgpu_tsg_read_single_sm_error_state_args *args) | ||
548 | { | ||
549 | struct gr_gk20a *gr = &g->gr; | ||
550 | struct nvgpu_tsg_sm_error_state *sm_error_state; | ||
551 | struct nvgpu_tsg_sm_error_state_record sm_error_state_record; | ||
552 | u32 sm_id; | ||
553 | int err = 0; | ||
554 | |||
555 | sm_id = args->sm_id; | ||
556 | if (sm_id >= gr->no_of_sm) | ||
557 | return -EINVAL; | ||
558 | |||
559 | nvgpu_speculation_barrier(); | ||
560 | |||
561 | sm_error_state = tsg->sm_error_states + sm_id; | ||
562 | sm_error_state_record.global_esr = | ||
563 | sm_error_state->hww_global_esr; | ||
564 | sm_error_state_record.warp_esr = | ||
565 | sm_error_state->hww_warp_esr; | ||
566 | sm_error_state_record.warp_esr_pc = | ||
567 | sm_error_state->hww_warp_esr_pc; | ||
568 | sm_error_state_record.global_esr_report_mask = | ||
569 | sm_error_state->hww_global_esr_report_mask; | ||
570 | sm_error_state_record.warp_esr_report_mask = | ||
571 | sm_error_state->hww_warp_esr_report_mask; | ||
572 | |||
573 | if (args->record_size > 0) { | ||
574 | size_t write_size = sizeof(*sm_error_state); | ||
575 | |||
576 | nvgpu_speculation_barrier(); | ||
577 | if (write_size > args->record_size) | ||
578 | write_size = args->record_size; | ||
579 | |||
580 | nvgpu_mutex_acquire(&g->dbg_sessions_lock); | ||
581 | err = copy_to_user((void __user *)(uintptr_t) | ||
582 | args->record_mem, | ||
583 | &sm_error_state_record, | ||
584 | write_size); | ||
585 | nvgpu_mutex_release(&g->dbg_sessions_lock); | ||
586 | if (err) { | ||
587 | nvgpu_err(g, "copy_to_user failed!"); | ||
588 | return err; | ||
589 | } | ||
590 | |||
591 | args->record_size = write_size; | ||
592 | } | ||
593 | |||
594 | return 0; | ||
595 | } | ||
596 | |||
597 | long nvgpu_ioctl_tsg_dev_ioctl(struct file *filp, unsigned int cmd, | ||
598 | unsigned long arg) | ||
599 | { | ||
600 | struct tsg_private *priv = filp->private_data; | ||
601 | struct tsg_gk20a *tsg = priv->tsg; | ||
602 | struct gk20a *g = tsg->g; | ||
603 | u8 __maybe_unused buf[NVGPU_TSG_IOCTL_MAX_ARG_SIZE]; | ||
604 | int err = 0; | ||
605 | |||
606 | nvgpu_log_fn(g, "start %d", _IOC_NR(cmd)); | ||
607 | |||
608 | if ((_IOC_TYPE(cmd) != NVGPU_TSG_IOCTL_MAGIC) || | ||
609 | (_IOC_NR(cmd) == 0) || | ||
610 | (_IOC_NR(cmd) > NVGPU_TSG_IOCTL_LAST) || | ||
611 | (_IOC_SIZE(cmd) > NVGPU_TSG_IOCTL_MAX_ARG_SIZE)) | ||
612 | return -EINVAL; | ||
613 | |||
614 | memset(buf, 0, sizeof(buf)); | ||
615 | if (_IOC_DIR(cmd) & _IOC_WRITE) { | ||
616 | if (copy_from_user(buf, (void __user *)arg, _IOC_SIZE(cmd))) | ||
617 | return -EFAULT; | ||
618 | } | ||
619 | |||
620 | if (!g->sw_ready) { | ||
621 | err = gk20a_busy(g); | ||
622 | if (err) | ||
623 | return err; | ||
624 | |||
625 | gk20a_idle(g); | ||
626 | } | ||
627 | |||
628 | switch (cmd) { | ||
629 | case NVGPU_TSG_IOCTL_BIND_CHANNEL: | ||
630 | { | ||
631 | int ch_fd = *(int *)buf; | ||
632 | if (ch_fd < 0) { | ||
633 | err = -EINVAL; | ||
634 | break; | ||
635 | } | ||
636 | err = gk20a_tsg_bind_channel_fd(tsg, ch_fd); | ||
637 | break; | ||
638 | } | ||
639 | |||
640 | case NVGPU_TSG_IOCTL_BIND_CHANNEL_EX: | ||
641 | { | ||
642 | err = gk20a_tsg_ioctl_bind_channel_ex(g, tsg, | ||
643 | (struct nvgpu_tsg_bind_channel_ex_args *)buf); | ||
644 | break; | ||
645 | } | ||
646 | |||
647 | case NVGPU_TSG_IOCTL_UNBIND_CHANNEL: | ||
648 | { | ||
649 | int ch_fd = *(int *)buf; | ||
650 | |||
651 | if (ch_fd < 0) { | ||
652 | err = -EINVAL; | ||
653 | break; | ||
654 | } | ||
655 | err = gk20a_busy(g); | ||
656 | if (err) { | ||
657 | nvgpu_err(g, | ||
658 | "failed to host gk20a for ioctl cmd: 0x%x", cmd); | ||
659 | break; | ||
660 | } | ||
661 | err = gk20a_tsg_unbind_channel_fd(tsg, ch_fd); | ||
662 | gk20a_idle(g); | ||
663 | break; | ||
664 | } | ||
665 | |||
666 | case NVGPU_IOCTL_TSG_ENABLE: | ||
667 | { | ||
668 | err = gk20a_busy(g); | ||
669 | if (err) { | ||
670 | nvgpu_err(g, | ||
671 | "failed to host gk20a for ioctl cmd: 0x%x", cmd); | ||
672 | return err; | ||
673 | } | ||
674 | g->ops.fifo.enable_tsg(tsg); | ||
675 | gk20a_idle(g); | ||
676 | break; | ||
677 | } | ||
678 | |||
679 | case NVGPU_IOCTL_TSG_DISABLE: | ||
680 | { | ||
681 | err = gk20a_busy(g); | ||
682 | if (err) { | ||
683 | nvgpu_err(g, | ||
684 | "failed to host gk20a for ioctl cmd: 0x%x", cmd); | ||
685 | return err; | ||
686 | } | ||
687 | g->ops.fifo.disable_tsg(tsg); | ||
688 | gk20a_idle(g); | ||
689 | break; | ||
690 | } | ||
691 | |||
692 | case NVGPU_IOCTL_TSG_PREEMPT: | ||
693 | { | ||
694 | err = gk20a_busy(g); | ||
695 | if (err) { | ||
696 | nvgpu_err(g, | ||
697 | "failed to host gk20a for ioctl cmd: 0x%x", cmd); | ||
698 | return err; | ||
699 | } | ||
700 | /* preempt TSG */ | ||
701 | err = g->ops.fifo.preempt_tsg(g, tsg); | ||
702 | gk20a_idle(g); | ||
703 | break; | ||
704 | } | ||
705 | |||
706 | case NVGPU_IOCTL_TSG_EVENT_ID_CTRL: | ||
707 | { | ||
708 | err = gk20a_tsg_event_id_ctrl(g, tsg, | ||
709 | (struct nvgpu_event_id_ctrl_args *)buf); | ||
710 | break; | ||
711 | } | ||
712 | |||
713 | case NVGPU_IOCTL_TSG_SET_RUNLIST_INTERLEAVE: | ||
714 | err = gk20a_tsg_ioctl_set_runlist_interleave(g, tsg, | ||
715 | (struct nvgpu_runlist_interleave_args *)buf); | ||
716 | break; | ||
717 | |||
718 | case NVGPU_IOCTL_TSG_SET_TIMESLICE: | ||
719 | { | ||
720 | err = gk20a_tsg_ioctl_set_timeslice(g, tsg, | ||
721 | (struct nvgpu_timeslice_args *)buf); | ||
722 | break; | ||
723 | } | ||
724 | case NVGPU_IOCTL_TSG_GET_TIMESLICE: | ||
725 | { | ||
726 | err = gk20a_tsg_ioctl_get_timeslice(g, tsg, | ||
727 | (struct nvgpu_timeslice_args *)buf); | ||
728 | break; | ||
729 | } | ||
730 | |||
731 | case NVGPU_TSG_IOCTL_READ_SINGLE_SM_ERROR_STATE: | ||
732 | { | ||
733 | err = gk20a_tsg_ioctl_read_single_sm_error_state(g, tsg, | ||
734 | (struct nvgpu_tsg_read_single_sm_error_state_args *)buf); | ||
735 | break; | ||
736 | } | ||
737 | |||
738 | default: | ||
739 | nvgpu_err(g, "unrecognized tsg gpu ioctl cmd: 0x%x", | ||
740 | cmd); | ||
741 | err = -ENOTTY; | ||
742 | break; | ||
743 | } | ||
744 | |||
745 | if ((err == 0) && (_IOC_DIR(cmd) & _IOC_READ)) | ||
746 | err = copy_to_user((void __user *)arg, | ||
747 | buf, _IOC_SIZE(cmd)); | ||
748 | |||
749 | return err; | ||
750 | } | ||