From a07e10f494c158ae31d6187e9be3db409528a507 Mon Sep 17 00:00:00 2001
From: Terje Bergstrom
Date: Thu, 23 Mar 2017 14:19:01 -0700
Subject: gpu: nvgpu: Move channel IOCTL code to Linux module

Move channel IOCTL specific code to Linux module. This clears some
Linux dependencies from channel_gk20a.c.

JIRA NVGPU-32

Change-Id: I41817d612b959709365bcabff9c8a15f2bfe4c60
Signed-off-by: Terje Bergstrom
Reviewed-on: http://git-master/r/1330804
Reviewed-by: mobile promotions
Tested-by: mobile promotions
---
 drivers/gpu/nvgpu/Makefile.nvgpu | 1 +
 drivers/gpu/nvgpu/clk/clk_arb.c | 3 +
 drivers/gpu/nvgpu/common/linux/ioctl.c | 2 +-
 drivers/gpu/nvgpu/common/linux/ioctl_channel.c | 1179 ++++++++++++++++++++++
 drivers/gpu/nvgpu/common/linux/ioctl_channel.h | 21 +
 drivers/gpu/nvgpu/gk20a/cde_gk20a.c | 3 +-
 drivers/gpu/nvgpu/gk20a/ce2_gk20a.c | 3 +-
 drivers/gpu/nvgpu/gk20a/channel_gk20a.c | 1281 ++----------------------
 drivers/gpu/nvgpu/gk20a/channel_gk20a.h | 14 +-
 drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c | 2 +
 drivers/gpu/nvgpu/gk20a/sched_gk20a.c | 2 +
 drivers/gpu/nvgpu/gp106/xve_gp106.c | 1 +
 12 files changed, 1294 insertions(+), 1218 deletions(-)
 create mode 100644 drivers/gpu/nvgpu/common/linux/ioctl_channel.c
 create mode 100644 drivers/gpu/nvgpu/common/linux/ioctl_channel.h

diff --git a/drivers/gpu/nvgpu/Makefile.nvgpu b/drivers/gpu/nvgpu/Makefile.nvgpu
index e9e7581a..665076de 100644
--- a/drivers/gpu/nvgpu/Makefile.nvgpu
+++ b/drivers/gpu/nvgpu/Makefile.nvgpu
@@ -28,6 +28,7 @@ nvgpu-y := \
 common/linux/ioctl.o \
 common/linux/ioctl_ctrl.o \
 common/linux/ioctl_as.o \
+ common/linux/ioctl_channel.o \
 common/mm/nvgpu_allocator.o \
 common/mm/bitmap_allocator.o \
 common/mm/buddy_allocator.o \
diff --git a/drivers/gpu/nvgpu/clk/clk_arb.c b/drivers/gpu/nvgpu/clk/clk_arb.c
index 0ccc7c53..dc063709 100644
--- a/drivers/gpu/nvgpu/clk/clk_arb.c
+++ b/drivers/gpu/nvgpu/clk/clk_arb.c
@@ -19,6 +19,9 @@
 #include
 #include
 #include
+#include
+#include
+#include
 #include
 #include
diff --git a/drivers/gpu/nvgpu/common/linux/ioctl.c b/drivers/gpu/nvgpu/common/linux/ioctl.c
index 53b9476e..db252aeb 100644
--- a/drivers/gpu/nvgpu/common/linux/ioctl.c
+++ b/drivers/gpu/nvgpu/common/linux/ioctl.c
@@ -23,8 +23,8 @@
 #include "gk20a/gk20a.h"
 #include "gk20a/dbg_gpu_gk20a.h"
 #include "gk20a/ctxsw_trace_gk20a.h"
-#include "gk20a/channel_gk20a.h"
 #include "gk20a/tsg_gk20a.h"
+#include "ioctl_channel.h"
 #include "ioctl_ctrl.h"
 #include "ioctl_as.h"
diff --git a/drivers/gpu/nvgpu/common/linux/ioctl_channel.c b/drivers/gpu/nvgpu/common/linux/ioctl_channel.c
new file mode 100644
index 00000000..4a9531de
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/linux/ioctl_channel.c
@@ -0,0 +1,1179 @@
+/*
+ * GK20A Graphics channel
+ *
+ * Copyright (c) 2011-2017, NVIDIA CORPORATION. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program. If not, see .
+ */ + +#include +#include +#include +#include +#include + +#include +#include +#include + +#include "gk20a/gk20a.h" +#include "gk20a/debug_gk20a.h" +#include "gk20a/ctxsw_trace_gk20a.h" +#include "gk20a/dbg_gpu_gk20a.h" +#include "gk20a/fence_gk20a.h" + +/* + * Although channels do have pointers back to the gk20a struct that they were + * created under in cases where the driver is killed that pointer can be bad. + * The channel memory can be freed before the release() function for a given + * channel is called. This happens when the driver dies and userspace doesn't + * get a chance to call release() until after the entire gk20a driver data is + * unloaded and freed. + */ +struct channel_priv { + struct gk20a *g; + struct channel_gk20a *c; +}; + +#if defined(CONFIG_GK20A_CYCLE_STATS) + +static int gk20a_channel_cycle_stats(struct channel_gk20a *ch, + struct nvgpu_cycle_stats_args *args) +{ + struct dma_buf *dmabuf; + void *virtual_address; + + /* is it allowed to handle calls for current GPU? */ + if (0 == (ch->g->gpu_characteristics.flags & + NVGPU_GPU_FLAGS_SUPPORT_CYCLE_STATS)) + return -ENOSYS; + + if (args->dmabuf_fd && !ch->cyclestate.cyclestate_buffer_handler) { + + /* set up new cyclestats buffer */ + dmabuf = dma_buf_get(args->dmabuf_fd); + if (IS_ERR(dmabuf)) + return PTR_ERR(dmabuf); + virtual_address = dma_buf_vmap(dmabuf); + if (!virtual_address) + return -ENOMEM; + + ch->cyclestate.cyclestate_buffer_handler = dmabuf; + ch->cyclestate.cyclestate_buffer = virtual_address; + ch->cyclestate.cyclestate_buffer_size = dmabuf->size; + return 0; + + } else if (!args->dmabuf_fd && + ch->cyclestate.cyclestate_buffer_handler) { + gk20a_channel_free_cycle_stats_buffer(ch); + return 0; + + } else if (!args->dmabuf_fd && + !ch->cyclestate.cyclestate_buffer_handler) { + /* no requst from GL */ + return 0; + + } else { + pr_err("channel already has cyclestats buffer\n"); + return -EINVAL; + } +} + +static int gk20a_flush_cycle_stats_snapshot(struct channel_gk20a *ch) +{ + int ret; + + nvgpu_mutex_acquire(&ch->cs_client_mutex); + if (ch->cs_client) + ret = gr_gk20a_css_flush(ch, ch->cs_client); + else + ret = -EBADF; + nvgpu_mutex_release(&ch->cs_client_mutex); + + return ret; +} + +static int gk20a_attach_cycle_stats_snapshot(struct channel_gk20a *ch, + u32 dmabuf_fd, + u32 perfmon_id_count, + u32 *perfmon_id_start) +{ + int ret; + + nvgpu_mutex_acquire(&ch->cs_client_mutex); + if (ch->cs_client) { + ret = -EEXIST; + } else { + ret = gr_gk20a_css_attach(ch, + dmabuf_fd, + perfmon_id_count, + perfmon_id_start, + &ch->cs_client); + } + nvgpu_mutex_release(&ch->cs_client_mutex); + + return ret; +} + +static int gk20a_channel_cycle_stats_snapshot(struct channel_gk20a *ch, + struct nvgpu_cycle_stats_snapshot_args *args) +{ + int ret; + + /* is it allowed to handle calls for current GPU? 
*/ + if (0 == (ch->g->gpu_characteristics.flags & + NVGPU_GPU_FLAGS_SUPPORT_CYCLE_STATS_SNAPSHOT)) + return -ENOSYS; + + if (!args->dmabuf_fd) + return -EINVAL; + + /* handle the command (most frequent cases first) */ + switch (args->cmd) { + case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_FLUSH: + ret = gk20a_flush_cycle_stats_snapshot(ch); + args->extra = 0; + break; + + case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_ATTACH: + ret = gk20a_attach_cycle_stats_snapshot(ch, + args->dmabuf_fd, + args->extra, + &args->extra); + break; + + case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_DETACH: + ret = gk20a_channel_free_cycle_stats_snapshot(ch); + args->extra = 0; + break; + + default: + pr_err("cyclestats: unknown command %u\n", args->cmd); + ret = -EINVAL; + break; + } + + return ret; +} +#endif + +static int gk20a_channel_set_wdt_status(struct channel_gk20a *ch, + struct nvgpu_channel_wdt_args *args) +{ + if (args->wdt_status == NVGPU_IOCTL_CHANNEL_DISABLE_WDT) + ch->wdt_enabled = false; + else if (args->wdt_status == NVGPU_IOCTL_CHANNEL_ENABLE_WDT) + ch->wdt_enabled = true; + + return 0; +} + +static int gk20a_init_error_notifier(struct channel_gk20a *ch, + struct nvgpu_set_error_notifier *args) +{ + struct device *dev = dev_from_gk20a(ch->g); + struct dma_buf *dmabuf; + void *va; + u64 end = args->offset + sizeof(struct nvgpu_notification); + + if (!args->mem) { + pr_err("gk20a_init_error_notifier: invalid memory handle\n"); + return -EINVAL; + } + + dmabuf = dma_buf_get(args->mem); + + gk20a_channel_free_error_notifiers(ch); + + if (IS_ERR(dmabuf)) { + pr_err("Invalid handle: %d\n", args->mem); + return -EINVAL; + } + + if (end > dmabuf->size || end < sizeof(struct nvgpu_notification)) { + dma_buf_put(dmabuf); + gk20a_err(dev, "gk20a_init_error_notifier: invalid offset\n"); + return -EINVAL; + } + + /* map handle */ + va = dma_buf_vmap(dmabuf); + if (!va) { + dma_buf_put(dmabuf); + pr_err("Cannot map notifier handle\n"); + return -ENOMEM; + } + + ch->error_notifier = va + args->offset; + ch->error_notifier_va = va; + memset(ch->error_notifier, 0, sizeof(struct nvgpu_notification)); + + /* set channel notifiers pointer */ + nvgpu_mutex_acquire(&ch->error_notifier_mutex); + ch->error_notifier_ref = dmabuf; + nvgpu_mutex_release(&ch->error_notifier_mutex); + + return 0; +} + +struct channel_gk20a *gk20a_get_channel_from_file(int fd) +{ + struct channel_priv *priv; + struct file *f = fget(fd); + + if (!f) + return NULL; + + if (f->f_op != &gk20a_channel_ops) { + fput(f); + return NULL; + } + + priv = (struct channel_priv *)f->private_data; + fput(f); + return priv->c; +} + +int gk20a_channel_release(struct inode *inode, struct file *filp) +{ + struct channel_priv *priv = filp->private_data; + struct channel_gk20a *ch = priv->c; + struct gk20a *g = priv->g; + + int err; + + err = gk20a_busy(g); + if (err) { + gk20a_err(dev_from_gk20a(g), "failed to release a channel!"); + goto channel_release; + } + + trace_gk20a_channel_release(dev_name(g->dev)); + + gk20a_channel_close(ch); + gk20a_idle(g); + +channel_release: + gk20a_put(g); + nvgpu_kfree(g, filp->private_data); + filp->private_data = NULL; + return 0; +} + +/* note: runlist_id -1 is synonym for the ENGINE_GR_GK20A runlist id */ +static int __gk20a_channel_open(struct gk20a *g, + struct file *filp, s32 runlist_id) +{ + int err; + struct channel_gk20a *ch; + struct channel_priv *priv; + + gk20a_dbg_fn(""); + + g = gk20a_get(g); + if (!g) + return -ENODEV; + + trace_gk20a_channel_open(dev_name(g->dev)); + + priv = nvgpu_kzalloc(g, 
sizeof(*priv)); + if (!priv) { + err = -ENOMEM; + goto free_ref; + } + + err = gk20a_busy(g); + if (err) { + gk20a_err(dev_from_gk20a(g), "failed to power on, %d", err); + goto fail_busy; + } + /* All the user space channel should be non privilege */ + ch = gk20a_open_new_channel(g, runlist_id, false); + gk20a_idle(g); + if (!ch) { + gk20a_err(dev_from_gk20a(g), + "failed to get f"); + err = -ENOMEM; + goto fail_busy; + } + + gk20a_channel_trace_sched_param( + trace_gk20a_channel_sched_defaults, ch); + + priv->g = g; + priv->c = ch; + + filp->private_data = priv; + return 0; + +fail_busy: + nvgpu_kfree(g, priv); +free_ref: + gk20a_put(g); + return err; +} + +int gk20a_channel_open(struct inode *inode, struct file *filp) +{ + struct gk20a *g = container_of(inode->i_cdev, + struct gk20a, channel.cdev); + int ret; + + gk20a_dbg_fn("start"); + ret = __gk20a_channel_open(g, filp, -1); + + gk20a_dbg_fn("end"); + return ret; +} + +int gk20a_channel_open_ioctl(struct gk20a *g, + struct nvgpu_channel_open_args *args) +{ + int err; + int fd; + struct file *file; + char name[64]; + s32 runlist_id = args->in.runlist_id; + + err = get_unused_fd_flags(O_RDWR); + if (err < 0) + return err; + fd = err; + + snprintf(name, sizeof(name), "nvhost-%s-fd%d", + dev_name(g->dev), fd); + + file = anon_inode_getfile(name, g->channel.cdev.ops, NULL, O_RDWR); + if (IS_ERR(file)) { + err = PTR_ERR(file); + goto clean_up; + } + + err = __gk20a_channel_open(g, file, runlist_id); + if (err) + goto clean_up_file; + + fd_install(fd, file); + args->out.channel_fd = fd; + return 0; + +clean_up_file: + fput(file); +clean_up: + put_unused_fd(fd); + return err; +} + +int nvgpu_channel_ioctl_alloc_gpfifo(struct channel_gk20a *c, + struct nvgpu_alloc_gpfifo_ex_args *args) +{ + return gk20a_channel_alloc_gpfifo(c, args->num_entries, + args->num_inflight_jobs, + args->flags); +} + + +static int gk20a_channel_wait_semaphore(struct channel_gk20a *ch, + ulong id, u32 offset, + u32 payload, long timeout) +{ + struct device *dev = ch->g->dev; + struct dma_buf *dmabuf; + void *data; + u32 *semaphore; + int ret = 0; + long remain; + + /* do not wait if channel has timed out */ + if (ch->has_timedout) + return -ETIMEDOUT; + + dmabuf = dma_buf_get(id); + if (IS_ERR(dmabuf)) { + gk20a_err(dev, "invalid notifier nvmap handle 0x%lx", id); + return -EINVAL; + } + + data = dma_buf_kmap(dmabuf, offset >> PAGE_SHIFT); + if (!data) { + gk20a_err(dev, "failed to map notifier memory"); + ret = -EINVAL; + goto cleanup_put; + } + + semaphore = data + (offset & ~PAGE_MASK); + + remain = wait_event_interruptible_timeout( + ch->semaphore_wq, + *semaphore == payload || ch->has_timedout, + timeout); + + if (remain == 0 && *semaphore != payload) + ret = -ETIMEDOUT; + else if (remain < 0) + ret = remain; + + dma_buf_kunmap(dmabuf, offset >> PAGE_SHIFT, data); +cleanup_put: + dma_buf_put(dmabuf); + return ret; +} + +static int gk20a_channel_wait(struct channel_gk20a *ch, + struct nvgpu_wait_args *args) +{ + struct device *d = dev_from_gk20a(ch->g); + struct dma_buf *dmabuf; + struct notification *notif; + struct timespec tv; + u64 jiffies; + ulong id; + u32 offset; + unsigned long timeout; + int remain, ret = 0; + u64 end; + + gk20a_dbg_fn(""); + + if (ch->has_timedout) + return -ETIMEDOUT; + + if (args->timeout == NVGPU_NO_TIMEOUT) + timeout = MAX_SCHEDULE_TIMEOUT; + else + timeout = (u32)msecs_to_jiffies(args->timeout); + + switch (args->type) { + case NVGPU_WAIT_TYPE_NOTIFIER: + id = args->condition.notifier.dmabuf_fd; + offset = 
args->condition.notifier.offset; + end = offset + sizeof(struct notification); + + dmabuf = dma_buf_get(id); + if (IS_ERR(dmabuf)) { + gk20a_err(d, "invalid notifier nvmap handle 0x%lx", + id); + return -EINVAL; + } + + if (end > dmabuf->size || end < sizeof(struct notification)) { + dma_buf_put(dmabuf); + gk20a_err(d, "invalid notifier offset\n"); + return -EINVAL; + } + + notif = dma_buf_vmap(dmabuf); + if (!notif) { + gk20a_err(d, "failed to map notifier memory"); + return -ENOMEM; + } + + notif = (struct notification *)((uintptr_t)notif + offset); + + /* user should set status pending before + * calling this ioctl */ + remain = wait_event_interruptible_timeout( + ch->notifier_wq, + notif->status == 0 || ch->has_timedout, + timeout); + + if (remain == 0 && notif->status != 0) { + ret = -ETIMEDOUT; + goto notif_clean_up; + } else if (remain < 0) { + ret = -EINTR; + goto notif_clean_up; + } + + /* TBD: fill in correct information */ + jiffies = get_jiffies_64(); + jiffies_to_timespec(jiffies, &tv); + notif->timestamp.nanoseconds[0] = tv.tv_nsec; + notif->timestamp.nanoseconds[1] = tv.tv_sec; + notif->info32 = 0xDEADBEEF; /* should be object name */ + notif->info16 = ch->hw_chid; /* should be method offset */ + +notif_clean_up: + dma_buf_vunmap(dmabuf, notif); + return ret; + + case NVGPU_WAIT_TYPE_SEMAPHORE: + ret = gk20a_channel_wait_semaphore(ch, + args->condition.semaphore.dmabuf_fd, + args->condition.semaphore.offset, + args->condition.semaphore.payload, + timeout); + + break; + + default: + ret = -EINVAL; + break; + } + + return ret; +} + +static unsigned int gk20a_event_id_poll(struct file *filep, poll_table *wait) +{ + unsigned int mask = 0; + struct gk20a_event_id_data *event_id_data = filep->private_data; + struct gk20a *g = event_id_data->g; + u32 event_id = event_id_data->event_id; + + gk20a_dbg(gpu_dbg_fn | gpu_dbg_info, ""); + + poll_wait(filep, &event_id_data->event_id_wq, wait); + + nvgpu_mutex_acquire(&event_id_data->lock); + + if (event_id_data->is_tsg) { + struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; + + if (event_id_data->event_posted) { + gk20a_dbg_info( + "found pending event_id=%d on TSG=%d\n", + event_id, tsg->tsgid); + mask = (POLLPRI | POLLIN); + event_id_data->event_posted = false; + } + } else { + struct channel_gk20a *ch = g->fifo.channel + + event_id_data->id; + + if (event_id_data->event_posted) { + gk20a_dbg_info( + "found pending event_id=%d on chid=%d\n", + event_id, ch->hw_chid); + mask = (POLLPRI | POLLIN); + event_id_data->event_posted = false; + } + } + + nvgpu_mutex_release(&event_id_data->lock); + + return mask; +} + +static int gk20a_event_id_release(struct inode *inode, struct file *filp) +{ + struct gk20a_event_id_data *event_id_data = filp->private_data; + struct gk20a *g = event_id_data->g; + + if (event_id_data->is_tsg) { + struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; + + nvgpu_mutex_acquire(&tsg->event_id_list_lock); + list_del_init(&event_id_data->event_id_node); + nvgpu_mutex_release(&tsg->event_id_list_lock); + } else { + struct channel_gk20a *ch = g->fifo.channel + event_id_data->id; + + nvgpu_mutex_acquire(&ch->event_id_list_lock); + list_del_init(&event_id_data->event_id_node); + nvgpu_mutex_release(&ch->event_id_list_lock); + } + + nvgpu_mutex_destroy(&event_id_data->lock); + gk20a_put(g); + nvgpu_kfree(g, event_id_data); + filp->private_data = NULL; + + return 0; +} + +const struct file_operations gk20a_event_id_ops = { + .owner = THIS_MODULE, + .poll = gk20a_event_id_poll, + .release = gk20a_event_id_release, 
+}; + +static int gk20a_channel_get_event_data_from_id(struct channel_gk20a *ch, + u32 event_id, + struct gk20a_event_id_data **event_id_data) +{ + struct gk20a_event_id_data *local_event_id_data; + bool event_found = false; + + nvgpu_mutex_acquire(&ch->event_id_list_lock); + list_for_each_entry(local_event_id_data, &ch->event_id_list, + event_id_node) { + if (local_event_id_data->event_id == event_id) { + event_found = true; + break; + } + } + nvgpu_mutex_release(&ch->event_id_list_lock); + + if (event_found) { + *event_id_data = local_event_id_data; + return 0; + } else { + return -1; + } +} + +void gk20a_channel_event_id_post_event(struct channel_gk20a *ch, + u32 event_id) +{ + struct gk20a_event_id_data *event_id_data; + int err = 0; + + err = gk20a_channel_get_event_data_from_id(ch, event_id, + &event_id_data); + if (err) + return; + + nvgpu_mutex_acquire(&event_id_data->lock); + + gk20a_dbg_info( + "posting event for event_id=%d on ch=%d\n", + event_id, ch->hw_chid); + event_id_data->event_posted = true; + + wake_up_interruptible_all(&event_id_data->event_id_wq); + + nvgpu_mutex_release(&event_id_data->lock); +} + +static int gk20a_channel_event_id_enable(struct channel_gk20a *ch, + int event_id, + int *fd) +{ + struct gk20a *g; + int err = 0; + int local_fd; + struct file *file; + char name[64]; + struct gk20a_event_id_data *event_id_data; + + g = gk20a_get(ch->g); + if (!g) + return -ENODEV; + + err = gk20a_channel_get_event_data_from_id(ch, + event_id, &event_id_data); + if (err == 0) { + /* We already have event enabled */ + err = -EINVAL; + goto free_ref; + } + + err = get_unused_fd_flags(O_RDWR); + if (err < 0) + goto free_ref; + local_fd = err; + + snprintf(name, sizeof(name), "nvgpu-event%d-fd%d", + event_id, local_fd); + file = anon_inode_getfile(name, &gk20a_event_id_ops, + NULL, O_RDWR); + if (IS_ERR(file)) { + err = PTR_ERR(file); + goto clean_up; + } + + event_id_data = nvgpu_kzalloc(ch->g, sizeof(*event_id_data)); + if (!event_id_data) { + err = -ENOMEM; + goto clean_up_file; + } + event_id_data->g = g; + event_id_data->id = ch->hw_chid; + event_id_data->is_tsg = false; + event_id_data->event_id = event_id; + + init_waitqueue_head(&event_id_data->event_id_wq); + err = nvgpu_mutex_init(&event_id_data->lock); + if (err) + goto clean_up_free; + INIT_LIST_HEAD(&event_id_data->event_id_node); + + nvgpu_mutex_acquire(&ch->event_id_list_lock); + list_add_tail(&event_id_data->event_id_node, &ch->event_id_list); + nvgpu_mutex_release(&ch->event_id_list_lock); + + fd_install(local_fd, file); + file->private_data = event_id_data; + + *fd = local_fd; + + return 0; + +clean_up_free: + kfree(event_id_data); +clean_up_file: + fput(file); +clean_up: + put_unused_fd(local_fd); +free_ref: + gk20a_put(g); + return err; +} + +static int gk20a_channel_event_id_ctrl(struct channel_gk20a *ch, + struct nvgpu_event_id_ctrl_args *args) +{ + int err = 0; + int fd = -1; + + if (args->event_id >= NVGPU_IOCTL_CHANNEL_EVENT_ID_MAX) + return -EINVAL; + + if (gk20a_is_channel_marked_as_tsg(ch)) + return -EINVAL; + + switch (args->cmd) { + case NVGPU_IOCTL_CHANNEL_EVENT_ID_CMD_ENABLE: + err = gk20a_channel_event_id_enable(ch, args->event_id, &fd); + if (!err) + args->event_fd = fd; + break; + + default: + gk20a_err(dev_from_gk20a(ch->g), + "unrecognized channel event id cmd: 0x%x", + args->cmd); + err = -EINVAL; + break; + } + + return err; +} + +static int gk20a_channel_zcull_bind(struct channel_gk20a *ch, + struct nvgpu_zcull_bind_args *args) +{ + struct gk20a *g = ch->g; + struct gr_gk20a *gr = 
&g->gr; + + gk20a_dbg_fn(""); + + return g->ops.gr.bind_ctxsw_zcull(g, gr, ch, + args->gpu_va, args->mode); +} + +static int gk20a_ioctl_channel_submit_gpfifo( + struct channel_gk20a *ch, + struct nvgpu_submit_gpfifo_args *args) +{ + struct gk20a_fence *fence_out; + struct fifo_profile_gk20a *profile = NULL; + + int ret = 0; + gk20a_dbg_fn(""); + +#ifdef CONFIG_DEBUG_FS + profile = gk20a_fifo_profile_acquire(ch->g); + + if (profile) + profile->timestamp[PROFILE_IOCTL_ENTRY] = sched_clock(); +#endif + if (ch->has_timedout) + return -ETIMEDOUT; + ret = gk20a_submit_channel_gpfifo(ch, NULL, args, args->num_entries, + args->flags, &args->fence, + &fence_out, false, profile); + + if (ret) + goto clean_up; + + /* Convert fence_out to something we can pass back to user space. */ + if (args->flags & NVGPU_SUBMIT_GPFIFO_FLAGS_FENCE_GET) { + if (args->flags & NVGPU_SUBMIT_GPFIFO_FLAGS_SYNC_FENCE) { + int fd = gk20a_fence_install_fd(fence_out); + if (fd < 0) + ret = fd; + else + args->fence.id = fd; + } else { + args->fence.id = fence_out->syncpt_id; + args->fence.value = fence_out->syncpt_value; + } + } + gk20a_fence_put(fence_out); +#ifdef CONFIG_DEBUG_FS + if (profile) { + profile->timestamp[PROFILE_IOCTL_EXIT] = sched_clock(); + gk20a_fifo_profile_release(ch->g, profile); + } +#endif +clean_up: + return ret; +} + +long gk20a_channel_ioctl(struct file *filp, + unsigned int cmd, unsigned long arg) +{ + struct channel_priv *priv = filp->private_data; + struct channel_gk20a *ch = priv->c; + struct device *dev = ch->g->dev; + u8 buf[NVGPU_IOCTL_CHANNEL_MAX_ARG_SIZE] = {0}; + int err = 0; + + gk20a_dbg_fn("start %d", _IOC_NR(cmd)); + + if ((_IOC_TYPE(cmd) != NVGPU_IOCTL_MAGIC) || + (_IOC_NR(cmd) == 0) || + (_IOC_NR(cmd) > NVGPU_IOCTL_CHANNEL_LAST) || + (_IOC_SIZE(cmd) > NVGPU_IOCTL_CHANNEL_MAX_ARG_SIZE)) + return -EINVAL; + + if (_IOC_DIR(cmd) & _IOC_WRITE) { + if (copy_from_user(buf, (void __user *)arg, _IOC_SIZE(cmd))) + return -EFAULT; + } + + /* take a ref or return timeout if channel refs can't be taken */ + ch = gk20a_channel_get(ch); + if (!ch) + return -ETIMEDOUT; + + /* protect our sanity for threaded userspace - most of the channel is + * not thread safe */ + nvgpu_mutex_acquire(&ch->ioctl_lock); + + /* this ioctl call keeps a ref to the file which keeps a ref to the + * channel */ + + switch (cmd) { + case NVGPU_IOCTL_CHANNEL_OPEN: + err = gk20a_channel_open_ioctl(ch->g, + (struct nvgpu_channel_open_args *)buf); + break; + case NVGPU_IOCTL_CHANNEL_SET_NVMAP_FD: + break; + case NVGPU_IOCTL_CHANNEL_ALLOC_OBJ_CTX: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.gr.alloc_obj_ctx(ch, + (struct nvgpu_alloc_obj_ctx_args *)buf); + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_ALLOC_GPFIFO_EX: + { + struct nvgpu_alloc_gpfifo_ex_args *alloc_gpfifo_ex_args = + (struct nvgpu_alloc_gpfifo_ex_args *)buf; + + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + + if (!is_power_of_2(alloc_gpfifo_ex_args->num_entries)) { + err = -EINVAL; + gk20a_idle(ch->g); + break; + } + err = gk20a_channel_alloc_gpfifo(ch, + alloc_gpfifo_ex_args->num_entries, + alloc_gpfifo_ex_args->num_inflight_jobs, + alloc_gpfifo_ex_args->flags); + gk20a_idle(ch->g); + break; + } + case NVGPU_IOCTL_CHANNEL_ALLOC_GPFIFO: + { + struct nvgpu_alloc_gpfifo_args *alloc_gpfifo_args = + (struct nvgpu_alloc_gpfifo_args *)buf; + + err = 
gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + + /* + * Kernel can insert one extra gpfifo entry before user + * submitted gpfifos and another one after, for internal usage. + * Triple the requested size. + */ + err = gk20a_channel_alloc_gpfifo(ch, + alloc_gpfifo_args->num_entries * 3, + 0, + alloc_gpfifo_args->flags); + gk20a_idle(ch->g); + break; + } + case NVGPU_IOCTL_CHANNEL_SUBMIT_GPFIFO: + err = gk20a_ioctl_channel_submit_gpfifo(ch, + (struct nvgpu_submit_gpfifo_args *)buf); + break; + case NVGPU_IOCTL_CHANNEL_WAIT: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + + /* waiting is thread-safe, not dropping this mutex could + * deadlock in certain conditions */ + nvgpu_mutex_release(&ch->ioctl_lock); + + err = gk20a_channel_wait(ch, + (struct nvgpu_wait_args *)buf); + + nvgpu_mutex_acquire(&ch->ioctl_lock); + + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_ZCULL_BIND: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_channel_zcull_bind(ch, + (struct nvgpu_zcull_bind_args *)buf); + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_SET_ERROR_NOTIFIER: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_init_error_notifier(ch, + (struct nvgpu_set_error_notifier *)buf); + gk20a_idle(ch->g); + break; +#ifdef CONFIG_GK20A_CYCLE_STATS + case NVGPU_IOCTL_CHANNEL_CYCLE_STATS: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_channel_cycle_stats(ch, + (struct nvgpu_cycle_stats_args *)buf); + gk20a_idle(ch->g); + break; +#endif + case NVGPU_IOCTL_CHANNEL_SET_TIMEOUT: + { + u32 timeout = + (u32)((struct nvgpu_set_timeout_args *)buf)->timeout; + gk20a_dbg(gpu_dbg_gpu_dbg, "setting timeout (%d ms) for chid %d", + timeout, ch->hw_chid); + ch->timeout_ms_max = timeout; + gk20a_channel_trace_sched_param( + trace_gk20a_channel_set_timeout, ch); + break; + } + case NVGPU_IOCTL_CHANNEL_SET_TIMEOUT_EX: + { + u32 timeout = + (u32)((struct nvgpu_set_timeout_args *)buf)->timeout; + bool timeout_debug_dump = !((u32) + ((struct nvgpu_set_timeout_ex_args *)buf)->flags & + (1 << NVGPU_TIMEOUT_FLAG_DISABLE_DUMP)); + gk20a_dbg(gpu_dbg_gpu_dbg, "setting timeout (%d ms) for chid %d", + timeout, ch->hw_chid); + ch->timeout_ms_max = timeout; + ch->timeout_debug_dump = timeout_debug_dump; + gk20a_channel_trace_sched_param( + trace_gk20a_channel_set_timeout, ch); + break; + } + case NVGPU_IOCTL_CHANNEL_GET_TIMEDOUT: + ((struct nvgpu_get_param_args *)buf)->value = + ch->has_timedout; + break; + case NVGPU_IOCTL_CHANNEL_SET_PRIORITY: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.fifo.channel_set_priority(ch, + ((struct nvgpu_set_priority_args *)buf)->priority); + + gk20a_idle(ch->g); + gk20a_channel_trace_sched_param( + trace_gk20a_channel_set_priority, ch); + break; + case NVGPU_IOCTL_CHANNEL_ENABLE: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + if (ch->g->ops.fifo.enable_channel) + ch->g->ops.fifo.enable_channel(ch); + else + err = -ENOSYS; + 
gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_DISABLE: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + if (ch->g->ops.fifo.disable_channel) + ch->g->ops.fifo.disable_channel(ch); + else + err = -ENOSYS; + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_PREEMPT: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_fifo_preempt(ch->g, ch); + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_FORCE_RESET: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.fifo.force_reset_ch(ch, + NVGPU_CHANNEL_RESETCHANNEL_VERIF_ERROR, true); + gk20a_idle(ch->g); + break; + case NVGPU_IOCTL_CHANNEL_EVENT_ID_CTRL: + err = gk20a_channel_event_id_ctrl(ch, + (struct nvgpu_event_id_ctrl_args *)buf); + break; +#ifdef CONFIG_GK20A_CYCLE_STATS + case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_channel_cycle_stats_snapshot(ch, + (struct nvgpu_cycle_stats_snapshot_args *)buf); + gk20a_idle(ch->g); + break; +#endif + case NVGPU_IOCTL_CHANNEL_WDT: + err = gk20a_channel_set_wdt_status(ch, + (struct nvgpu_channel_wdt_args *)buf); + break; + case NVGPU_IOCTL_CHANNEL_SET_RUNLIST_INTERLEAVE: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = gk20a_channel_set_runlist_interleave(ch, + ((struct nvgpu_runlist_interleave_args *)buf)->level); + + gk20a_idle(ch->g); + gk20a_channel_trace_sched_param( + trace_gk20a_channel_set_runlist_interleave, ch); + break; + case NVGPU_IOCTL_CHANNEL_SET_TIMESLICE: + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.fifo.channel_set_timeslice(ch, + ((struct nvgpu_timeslice_args *)buf)->timeslice_us); + + gk20a_idle(ch->g); + gk20a_channel_trace_sched_param( + trace_gk20a_channel_set_timeslice, ch); + break; + case NVGPU_IOCTL_CHANNEL_SET_PREEMPTION_MODE: + if (ch->g->ops.gr.set_preemption_mode) { + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.gr.set_preemption_mode(ch, + ((struct nvgpu_preemption_mode_args *)buf)->graphics_preempt_mode, + ((struct nvgpu_preemption_mode_args *)buf)->compute_preempt_mode); + gk20a_idle(ch->g); + } else { + err = -EINVAL; + } + break; + case NVGPU_IOCTL_CHANNEL_SET_BOOSTED_CTX: + if (ch->g->ops.gr.set_boosted_ctx) { + bool boost = + ((struct nvgpu_boosted_ctx_args *)buf)->boost; + + err = gk20a_busy(ch->g); + if (err) { + dev_err(dev, + "%s: failed to host gk20a for ioctl cmd: 0x%x", + __func__, cmd); + break; + } + err = ch->g->ops.gr.set_boosted_ctx(ch, boost); + gk20a_idle(ch->g); + } else { + err = -EINVAL; + } + break; + default: + dev_dbg(dev, "unrecognized ioctl cmd: 0x%x", cmd); + err = -ENOTTY; + break; + } + + if ((err == 0) && (_IOC_DIR(cmd) & _IOC_READ)) + err = copy_to_user((void __user *)arg, buf, _IOC_SIZE(cmd)); + + nvgpu_mutex_release(&ch->ioctl_lock); + + gk20a_channel_put(ch); + + gk20a_dbg_fn("end"); + + return err; +} diff --git a/drivers/gpu/nvgpu/common/linux/ioctl_channel.h 
b/drivers/gpu/nvgpu/common/linux/ioctl_channel.h new file mode 100644 index 00000000..f57739e2 --- /dev/null +++ b/drivers/gpu/nvgpu/common/linux/ioctl_channel.h @@ -0,0 +1,21 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. + * + * This program is free software; you can redistribute it and/or modify it + * under the terms and conditions of the GNU General Public License, + * version 2, as published by the Free Software Foundation. + * + * This program is distributed in the hope it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for + * more details. + */ +#ifndef __NVGPU_IOCTL_CHANNEL_H__ +#define __NVGPU_IOCTL_CHANNEL_H__ + +int gk20a_channel_open(struct inode *inode, struct file *filp); +int gk20a_channel_release(struct inode *inode, struct file *filp); +long gk20a_channel_ioctl(struct file *filp, + unsigned int cmd, unsigned long arg); + +#endif diff --git a/drivers/gpu/nvgpu/gk20a/cde_gk20a.c b/drivers/gpu/nvgpu/gk20a/cde_gk20a.c index 42850588..926e21ef 100644 --- a/drivers/gpu/nvgpu/gk20a/cde_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/cde_gk20a.c @@ -1224,8 +1224,7 @@ static int gk20a_cde_load(struct gk20a_cde_ctx *cde_ctx) } /* allocate gpfifo (1024 should be more than enough) */ - err = gk20a_alloc_channel_gpfifo(ch, - &(struct nvgpu_alloc_gpfifo_ex_args){1024, 0, 0, {}}); + err = gk20a_channel_alloc_gpfifo(ch, 1024, 0, 0); if (err) { gk20a_warn(cde_ctx->dev, "cde: unable to allocate gpfifo"); goto err_alloc_gpfifo; diff --git a/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c b/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c index 48f0cf8d..cce7a769 100644 --- a/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/ce2_gk20a.c @@ -471,8 +471,7 @@ u32 gk20a_ce_create_context_with_cb(struct device *dev, } /* allocate gpfifo (1024 should be more than enough) */ - err = gk20a_alloc_channel_gpfifo(ce_ctx->ch, - &(struct nvgpu_alloc_gpfifo_ex_args){1024, 0, 0, {}}); + err = gk20a_channel_alloc_gpfifo(ce_ctx->ch, 1024, 0, 0); if (err) { gk20a_err(ce_ctx->dev, "ce: unable to allocate gpfifo"); goto end; diff --git a/drivers/gpu/nvgpu/gk20a/channel_gk20a.c b/drivers/gpu/nvgpu/gk20a/channel_gk20a.c index cd49b4a9..b7306369 100644 --- a/drivers/gpu/nvgpu/gk20a/channel_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/channel_gk20a.c @@ -16,15 +16,10 @@ * along with this program. If not, see . */ -#include #include #include -#include /* need for nvmap.h*/ #include #include -#include -#include -#include #include #include @@ -40,8 +35,6 @@ #include -#define NVMAP_HANDLE_PARAM_SIZE 1 - /* * Although channels do have pointers back to the gk20a struct that they were * created under in cases where the driver is killed that pointer can be bad. 
@@ -55,7 +48,6 @@ struct channel_priv { struct channel_gk20a *c; }; -static struct channel_gk20a *allocate_channel(struct fifo_gk20a *f); static void free_channel(struct fifo_gk20a *f, struct channel_gk20a *c); static void gk20a_channel_dump_ref_actions(struct channel_gk20a *c); @@ -76,7 +68,6 @@ static struct channel_gk20a_job *channel_gk20a_joblist_peek( static int channel_gk20a_update_runlist(struct channel_gk20a *c, bool add); -static void gk20a_free_error_notifiers(struct channel_gk20a *ch); static u32 gk20a_get_channel_watchdog_timeout(struct channel_gk20a *ch); @@ -323,171 +314,6 @@ void gk20a_disable_channel(struct channel_gk20a *ch) channel_gk20a_update_runlist(ch, false); } -#if defined(CONFIG_GK20A_CYCLE_STATS) - -static void gk20a_free_cycle_stats_buffer(struct channel_gk20a *ch) -{ - /* disable existing cyclestats buffer */ - nvgpu_mutex_acquire(&ch->cyclestate.cyclestate_buffer_mutex); - if (ch->cyclestate.cyclestate_buffer_handler) { - dma_buf_vunmap(ch->cyclestate.cyclestate_buffer_handler, - ch->cyclestate.cyclestate_buffer); - dma_buf_put(ch->cyclestate.cyclestate_buffer_handler); - ch->cyclestate.cyclestate_buffer_handler = NULL; - ch->cyclestate.cyclestate_buffer = NULL; - ch->cyclestate.cyclestate_buffer_size = 0; - } - nvgpu_mutex_release(&ch->cyclestate.cyclestate_buffer_mutex); -} - -static int gk20a_channel_cycle_stats(struct channel_gk20a *ch, - struct nvgpu_cycle_stats_args *args) -{ - struct dma_buf *dmabuf; - void *virtual_address; - - /* is it allowed to handle calls for current GPU? */ - if (0 == (ch->g->gpu_characteristics.flags & - NVGPU_GPU_FLAGS_SUPPORT_CYCLE_STATS)) - return -ENOSYS; - - if (args->dmabuf_fd && !ch->cyclestate.cyclestate_buffer_handler) { - - /* set up new cyclestats buffer */ - dmabuf = dma_buf_get(args->dmabuf_fd); - if (IS_ERR(dmabuf)) - return PTR_ERR(dmabuf); - virtual_address = dma_buf_vmap(dmabuf); - if (!virtual_address) - return -ENOMEM; - - ch->cyclestate.cyclestate_buffer_handler = dmabuf; - ch->cyclestate.cyclestate_buffer = virtual_address; - ch->cyclestate.cyclestate_buffer_size = dmabuf->size; - return 0; - - } else if (!args->dmabuf_fd && - ch->cyclestate.cyclestate_buffer_handler) { - gk20a_free_cycle_stats_buffer(ch); - return 0; - - } else if (!args->dmabuf_fd && - !ch->cyclestate.cyclestate_buffer_handler) { - /* no requst from GL */ - return 0; - - } else { - pr_err("channel already has cyclestats buffer\n"); - return -EINVAL; - } -} - - -static int gk20a_flush_cycle_stats_snapshot(struct channel_gk20a *ch) -{ - int ret; - - nvgpu_mutex_acquire(&ch->cs_client_mutex); - if (ch->cs_client) - ret = gr_gk20a_css_flush(ch, ch->cs_client); - else - ret = -EBADF; - nvgpu_mutex_release(&ch->cs_client_mutex); - - return ret; -} - -static int gk20a_attach_cycle_stats_snapshot(struct channel_gk20a *ch, - u32 dmabuf_fd, - u32 perfmon_id_count, - u32 *perfmon_id_start) -{ - int ret; - - nvgpu_mutex_acquire(&ch->cs_client_mutex); - if (ch->cs_client) { - ret = -EEXIST; - } else { - ret = gr_gk20a_css_attach(ch, - dmabuf_fd, - perfmon_id_count, - perfmon_id_start, - &ch->cs_client); - } - nvgpu_mutex_release(&ch->cs_client_mutex); - - return ret; -} - -static int gk20a_free_cycle_stats_snapshot(struct channel_gk20a *ch) -{ - int ret; - - nvgpu_mutex_acquire(&ch->cs_client_mutex); - if (ch->cs_client) { - ret = gr_gk20a_css_detach(ch, ch->cs_client); - ch->cs_client = NULL; - } else { - ret = 0; - } - nvgpu_mutex_release(&ch->cs_client_mutex); - - return ret; -} - -static int gk20a_channel_cycle_stats_snapshot(struct channel_gk20a 
*ch, - struct nvgpu_cycle_stats_snapshot_args *args) -{ - int ret; - - /* is it allowed to handle calls for current GPU? */ - if (0 == (ch->g->gpu_characteristics.flags & - NVGPU_GPU_FLAGS_SUPPORT_CYCLE_STATS_SNAPSHOT)) - return -ENOSYS; - - if (!args->dmabuf_fd) - return -EINVAL; - - /* handle the command (most frequent cases first) */ - switch (args->cmd) { - case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_FLUSH: - ret = gk20a_flush_cycle_stats_snapshot(ch); - args->extra = 0; - break; - - case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_ATTACH: - ret = gk20a_attach_cycle_stats_snapshot(ch, - args->dmabuf_fd, - args->extra, - &args->extra); - break; - - case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT_CMD_DETACH: - ret = gk20a_free_cycle_stats_snapshot(ch); - args->extra = 0; - break; - - default: - pr_err("cyclestats: unknown command %u\n", args->cmd); - ret = -EINVAL; - break; - } - - return ret; -} -#endif - -static int gk20a_channel_set_wdt_status(struct channel_gk20a *ch, - struct nvgpu_channel_wdt_args *args) -{ - if (args->wdt_status == NVGPU_IOCTL_CHANNEL_DISABLE_WDT) - ch->wdt_enabled = false; - else if (args->wdt_status == NVGPU_IOCTL_CHANNEL_ENABLE_WDT) - ch->wdt_enabled = true; - - return 0; -} - int gk20a_channel_set_runlist_interleave(struct channel_gk20a *ch, u32 level) { @@ -516,54 +342,6 @@ int gk20a_channel_set_runlist_interleave(struct channel_gk20a *ch, return ret ? ret : g->ops.fifo.update_runlist(g, ch->runlist_id, ~0, true, true); } -static int gk20a_init_error_notifier(struct channel_gk20a *ch, - struct nvgpu_set_error_notifier *args) -{ - struct device *dev = dev_from_gk20a(ch->g); - struct dma_buf *dmabuf; - void *va; - u64 end = args->offset + sizeof(struct nvgpu_notification); - - if (!args->mem) { - pr_err("gk20a_init_error_notifier: invalid memory handle\n"); - return -EINVAL; - } - - dmabuf = dma_buf_get(args->mem); - - gk20a_free_error_notifiers(ch); - - if (IS_ERR(dmabuf)) { - pr_err("Invalid handle: %d\n", args->mem); - return -EINVAL; - } - - if (end > dmabuf->size || end < sizeof(struct nvgpu_notification)) { - dma_buf_put(dmabuf); - gk20a_err(dev, "gk20a_init_error_notifier: invalid offset\n"); - return -EINVAL; - } - - /* map handle */ - va = dma_buf_vmap(dmabuf); - if (!va) { - dma_buf_put(dmabuf); - pr_err("Cannot map notifier handle\n"); - return -ENOMEM; - } - - ch->error_notifier = va + args->offset; - ch->error_notifier_va = va; - memset(ch->error_notifier, 0, sizeof(struct nvgpu_notification)); - - /* set channel notifiers pointer */ - nvgpu_mutex_acquire(&ch->error_notifier_mutex); - ch->error_notifier_ref = dmabuf; - nvgpu_mutex_release(&ch->error_notifier_mutex); - - return 0; -} - /** * gk20a_set_error_notifier_locked() * Should be called with ch->error_notifier_mutex held @@ -595,7 +373,7 @@ void gk20a_set_error_notifier(struct channel_gk20a *ch, __u32 error) nvgpu_mutex_release(&ch->error_notifier_mutex); } -static void gk20a_free_error_notifiers(struct channel_gk20a *ch) +void gk20a_channel_free_error_notifiers(struct channel_gk20a *ch) { nvgpu_mutex_acquire(&ch->error_notifier_mutex); if (ch->error_notifier_ref) { @@ -628,6 +406,40 @@ static void gk20a_wait_until_counter_is_N( } } +#if defined(CONFIG_GK20A_CYCLE_STATS) +void gk20a_channel_free_cycle_stats_buffer(struct channel_gk20a *ch) +{ + /* disable existing cyclestats buffer */ + nvgpu_mutex_acquire(&ch->cyclestate.cyclestate_buffer_mutex); + if (ch->cyclestate.cyclestate_buffer_handler) { + dma_buf_vunmap(ch->cyclestate.cyclestate_buffer_handler, + 
ch->cyclestate.cyclestate_buffer); + dma_buf_put(ch->cyclestate.cyclestate_buffer_handler); + ch->cyclestate.cyclestate_buffer_handler = NULL; + ch->cyclestate.cyclestate_buffer = NULL; + ch->cyclestate.cyclestate_buffer_size = 0; + } + nvgpu_mutex_release(&ch->cyclestate.cyclestate_buffer_mutex); +} + +int gk20a_channel_free_cycle_stats_snapshot(struct channel_gk20a *ch) +{ + int ret; + + nvgpu_mutex_acquire(&ch->cs_client_mutex); + if (ch->cs_client) { + ret = gr_gk20a_css_detach(ch, ch->cs_client); + ch->cs_client = NULL; + } else { + ret = 0; + } + nvgpu_mutex_release(&ch->cs_client_mutex); + + return ret; +} + +#endif + /* call ONLY when no references to the channel exist: after the last put */ static void gk20a_free_channel(struct channel_gk20a *ch, bool force) { @@ -700,7 +512,7 @@ static void gk20a_free_channel(struct channel_gk20a *ch, bool force) gk20a_dbg_info("freeing bound channel context, timeout=%ld", timeout); - gk20a_free_error_notifiers(ch); + gk20a_channel_free_error_notifiers(ch); if (g->ops.fecs_trace.unbind_channel && !ch->vpr) g->ops.fecs_trace.unbind_channel(g, ch); @@ -715,8 +527,8 @@ static void gk20a_free_channel(struct channel_gk20a *ch, bool force) memset(&ch->gpfifo, 0, sizeof(struct gpfifo_desc)); #if defined(CONFIG_GK20A_CYCLE_STATS) - gk20a_free_cycle_stats_buffer(ch); - gk20a_free_cycle_stats_snapshot(ch); + gk20a_channel_free_cycle_stats_buffer(ch); + gk20a_channel_free_cycle_stats_snapshot(ch); #endif channel_gk20a_free_priv_cmdbuf(ch); @@ -930,50 +742,6 @@ void __gk20a_channel_kill(struct channel_gk20a *ch) gk20a_free_channel(ch, true); } -struct channel_gk20a *gk20a_get_channel_from_file(int fd) -{ - struct channel_priv *priv; - struct file *f = fget(fd); - - if (!f) - return NULL; - - if (f->f_op != &gk20a_channel_ops) { - fput(f); - return NULL; - } - - priv = (struct channel_priv *)f->private_data; - fput(f); - return priv->c; -} - -int gk20a_channel_release(struct inode *inode, struct file *filp) -{ - struct channel_priv *priv = filp->private_data; - struct channel_gk20a *ch = priv->c; - struct gk20a *g = priv->g; - - int err; - - err = gk20a_busy(g); - if (err) { - gk20a_err(dev_from_gk20a(g), "failed to release a channel!"); - goto channel_release; - } - - trace_gk20a_channel_release(g->name); - - gk20a_channel_close(ch); - gk20a_idle(g); - -channel_release: - gk20a_put(g); - nvgpu_kfree(g, filp->private_data); - filp->private_data = NULL; - return 0; -} - static void gk20a_channel_update_runcb_fn(struct work_struct *work) { struct channel_gk20a *ch = @@ -1100,109 +868,6 @@ struct channel_gk20a *gk20a_open_new_channel(struct gk20a *g, return ch; } -/* note: runlist_id -1 is synonym for the ENGINE_GR_GK20A runlist id */ -static int __gk20a_channel_open(struct gk20a *g, struct file *filp, s32 runlist_id) -{ - int err; - struct channel_gk20a *ch; - struct channel_priv *priv; - - gk20a_dbg_fn(""); - - g = gk20a_get(g); - if (!g) - return -ENODEV; - - trace_gk20a_channel_open(g->name); - - priv = nvgpu_kzalloc(g, sizeof(*priv)); - if (!priv) { - err = -ENOMEM; - goto free_ref; - } - - err = gk20a_busy(g); - if (err) { - gk20a_err(dev_from_gk20a(g), "failed to power on, %d", err); - goto fail_busy; - } - /* All the user space channel should be non privilege */ - ch = gk20a_open_new_channel(g, runlist_id, false); - gk20a_idle(g); - if (!ch) { - gk20a_err(dev_from_gk20a(g), - "failed to get f"); - err = -ENOMEM; - goto fail_busy; - } - - gk20a_channel_trace_sched_param( - trace_gk20a_channel_sched_defaults, ch); - - priv->g = g; - priv->c = ch; - - 
filp->private_data = priv; - return 0; - -fail_busy: - nvgpu_kfree(g, priv); -free_ref: - gk20a_put(g); - return err; -} - -int gk20a_channel_open(struct inode *inode, struct file *filp) -{ - struct gk20a *g = container_of(inode->i_cdev, - struct gk20a, channel.cdev); - int ret; - - gk20a_dbg_fn("start"); - ret = __gk20a_channel_open(g, filp, -1); - - gk20a_dbg_fn("end"); - return ret; -} - -int gk20a_channel_open_ioctl(struct gk20a *g, - struct nvgpu_channel_open_args *args) -{ - int err; - int fd; - struct file *file; - char name[64]; - s32 runlist_id = args->in.runlist_id; - - err = get_unused_fd_flags(O_RDWR); - if (err < 0) - return err; - fd = err; - - snprintf(name, sizeof(name), "nvhost-%s-fd%d", - g->name, fd); - - file = anon_inode_getfile(name, g->channel.cdev.ops, NULL, O_RDWR); - if (IS_ERR(file)) { - err = PTR_ERR(file); - goto clean_up; - } - - err = __gk20a_channel_open(g, file, runlist_id); - if (err) - goto clean_up_file; - - fd_install(fd, file); - args->out.channel_fd = fd; - return 0; - -clean_up_file: - fput(file); -clean_up: - put_unused_fd(fd); - return err; -} - /* allocate private cmd buffer. used for inserting commands before/after user submitted buffers. */ static int channel_gk20a_alloc_priv_cmdbuf(struct channel_gk20a *c) @@ -1542,8 +1207,10 @@ static void channel_gk20a_free_prealloc_resources(struct channel_gk20a *c) c->joblist.pre_alloc.enabled = false; } -int gk20a_alloc_channel_gpfifo(struct channel_gk20a *c, - struct nvgpu_alloc_gpfifo_ex_args *args) +int gk20a_channel_alloc_gpfifo(struct channel_gk20a *c, + unsigned int num_entries, + unsigned int num_inflight_jobs, + u32 flags) { struct gk20a *g = c->g; struct device *d = dev_from_gk20a(g); @@ -1553,12 +1220,12 @@ int gk20a_alloc_channel_gpfifo(struct channel_gk20a *c, int err = 0; unsigned long acquire_timeout; - gpfifo_size = args->num_entries; + gpfifo_size = num_entries; - if (args->flags & NVGPU_ALLOC_GPFIFO_EX_FLAGS_VPR_ENABLED) + if (flags & NVGPU_ALLOC_GPFIFO_EX_FLAGS_VPR_ENABLED) c->vpr = true; - if (args->flags & NVGPU_ALLOC_GPFIFO_EX_FLAGS_DETERMINISTIC) + if (flags & NVGPU_ALLOC_GPFIFO_EX_FLAGS_DETERMINISTIC) c->deterministic = true; /* an address space needs to have been bound at this point. 
*/ @@ -1625,15 +1292,15 @@ int gk20a_alloc_channel_gpfifo(struct channel_gk20a *c, err = g->ops.fifo.setup_ramfc(c, c->gpfifo.mem.gpu_va, c->gpfifo.entry_num, - acquire_timeout, args->flags); + acquire_timeout, flags); if (err) goto clean_up_sync; /* TBD: setup engine contexts */ - if (args->num_inflight_jobs) { + if (num_inflight_jobs) { err = channel_gk20a_prealloc_resources(c, - args->num_inflight_jobs); + num_inflight_jobs); if (err) goto clean_up_sync; } @@ -1654,7 +1321,7 @@ int gk20a_alloc_channel_gpfifo(struct channel_gk20a *c, clean_up_priv_cmd: channel_gk20a_free_priv_cmdbuf(c); clean_up_prealloc: - if (args->num_inflight_jobs) + if (num_inflight_jobs) channel_gk20a_free_prealloc_resources(c); clean_up_sync: if (c->sync) { @@ -3033,419 +2700,39 @@ fail_1: return err; } -static int gk20a_channel_wait_semaphore(struct channel_gk20a *ch, - ulong id, u32 offset, - u32 payload, long timeout) +/* in this context the "channel" is the host1x channel which + * maps to *all* gk20a channels */ +int gk20a_channel_suspend(struct gk20a *g) { - struct device *dev = ch->g->dev; - struct dma_buf *dmabuf; - void *data; - u32 *semaphore; - int ret = 0; - long remain; + struct fifo_gk20a *f = &g->fifo; + u32 chid; + bool channels_in_use = false; + u32 active_runlist_ids = 0; - /* do not wait if channel has timed out */ - if (ch->has_timedout) - return -ETIMEDOUT; + gk20a_dbg_fn(""); - dmabuf = dma_buf_get(id); - if (IS_ERR(dmabuf)) { - gk20a_err(dev, "invalid notifier nvmap handle 0x%lx", id); - return -EINVAL; - } + for (chid = 0; chid < f->num_channels; chid++) { + struct channel_gk20a *ch = &f->channel[chid]; + if (gk20a_channel_get(ch)) { + gk20a_dbg_info("suspend channel %d", chid); + /* disable channel */ + gk20a_disable_channel_tsg(g, ch); + /* preempt the channel */ + gk20a_fifo_preempt(g, ch); + /* wait for channel update notifiers */ + if (ch->update_fn) + cancel_work_sync(&ch->update_fn_work); - data = dma_buf_kmap(dmabuf, offset >> PAGE_SHIFT); - if (!data) { - gk20a_err(dev, "failed to map notifier memory"); - ret = -EINVAL; - goto cleanup_put; - } + channels_in_use = true; - semaphore = data + (offset & ~PAGE_MASK); + active_runlist_ids |= BIT(ch->runlist_id); - remain = wait_event_interruptible_timeout( - ch->semaphore_wq, - *semaphore == payload || ch->has_timedout, - timeout); + gk20a_channel_put(ch); + } + } - if (remain == 0 && *semaphore != payload) - ret = -ETIMEDOUT; - else if (remain < 0) - ret = remain; - - dma_buf_kunmap(dmabuf, offset >> PAGE_SHIFT, data); -cleanup_put: - dma_buf_put(dmabuf); - return ret; -} - -static int gk20a_channel_wait(struct channel_gk20a *ch, - struct nvgpu_wait_args *args) -{ - struct device *d = dev_from_gk20a(ch->g); - struct dma_buf *dmabuf; - struct notification *notif; - struct timespec tv; - u64 jiffies; - ulong id; - u32 offset; - unsigned long timeout; - int remain, ret = 0; - u64 end; - - gk20a_dbg_fn(""); - - if (ch->has_timedout) - return -ETIMEDOUT; - - if (args->timeout == NVGPU_NO_TIMEOUT) - timeout = MAX_SCHEDULE_TIMEOUT; - else - timeout = (u32)msecs_to_jiffies(args->timeout); - - switch (args->type) { - case NVGPU_WAIT_TYPE_NOTIFIER: - id = args->condition.notifier.dmabuf_fd; - offset = args->condition.notifier.offset; - end = offset + sizeof(struct notification); - - dmabuf = dma_buf_get(id); - if (IS_ERR(dmabuf)) { - gk20a_err(d, "invalid notifier nvmap handle 0x%lx", - id); - return -EINVAL; - } - - if (end > dmabuf->size || end < sizeof(struct notification)) { - dma_buf_put(dmabuf); - gk20a_err(d, "invalid notifier offset\n"); 
- return -EINVAL; - } - - notif = dma_buf_vmap(dmabuf); - if (!notif) { - gk20a_err(d, "failed to map notifier memory"); - return -ENOMEM; - } - - notif = (struct notification *)((uintptr_t)notif + offset); - - /* user should set status pending before - * calling this ioctl */ - remain = wait_event_interruptible_timeout( - ch->notifier_wq, - notif->status == 0 || ch->has_timedout, - timeout); - - if (remain == 0 && notif->status != 0) { - ret = -ETIMEDOUT; - goto notif_clean_up; - } else if (remain < 0) { - ret = -EINTR; - goto notif_clean_up; - } - - /* TBD: fill in correct information */ - jiffies = get_jiffies_64(); - jiffies_to_timespec(jiffies, &tv); - notif->timestamp.nanoseconds[0] = tv.tv_nsec; - notif->timestamp.nanoseconds[1] = tv.tv_sec; - notif->info32 = 0xDEADBEEF; /* should be object name */ - notif->info16 = ch->hw_chid; /* should be method offset */ - -notif_clean_up: - dma_buf_vunmap(dmabuf, notif); - return ret; - - case NVGPU_WAIT_TYPE_SEMAPHORE: - ret = gk20a_channel_wait_semaphore(ch, - args->condition.semaphore.dmabuf_fd, - args->condition.semaphore.offset, - args->condition.semaphore.payload, - timeout); - - break; - - default: - ret = -EINVAL; - break; - } - - return ret; -} - -static unsigned int gk20a_event_id_poll(struct file *filep, poll_table *wait) -{ - unsigned int mask = 0; - struct gk20a_event_id_data *event_id_data = filep->private_data; - struct gk20a *g = event_id_data->g; - u32 event_id = event_id_data->event_id; - - gk20a_dbg(gpu_dbg_fn | gpu_dbg_info, ""); - - poll_wait(filep, &event_id_data->event_id_wq, wait); - - nvgpu_mutex_acquire(&event_id_data->lock); - - if (event_id_data->is_tsg) { - struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; - - if (event_id_data->event_posted) { - gk20a_dbg_info( - "found pending event_id=%d on TSG=%d\n", - event_id, tsg->tsgid); - mask = (POLLPRI | POLLIN); - event_id_data->event_posted = false; - } - } else { - struct channel_gk20a *ch = g->fifo.channel - + event_id_data->id; - - if (event_id_data->event_posted) { - gk20a_dbg_info( - "found pending event_id=%d on chid=%d\n", - event_id, ch->hw_chid); - mask = (POLLPRI | POLLIN); - event_id_data->event_posted = false; - } - } - - nvgpu_mutex_release(&event_id_data->lock); - - return mask; -} - -static int gk20a_event_id_release(struct inode *inode, struct file *filp) -{ - struct gk20a_event_id_data *event_id_data = filp->private_data; - struct gk20a *g = event_id_data->g; - - if (event_id_data->is_tsg) { - struct tsg_gk20a *tsg = g->fifo.tsg + event_id_data->id; - - nvgpu_mutex_acquire(&tsg->event_id_list_lock); - list_del_init(&event_id_data->event_id_node); - nvgpu_mutex_release(&tsg->event_id_list_lock); - } else { - struct channel_gk20a *ch = g->fifo.channel + event_id_data->id; - - nvgpu_mutex_acquire(&ch->event_id_list_lock); - list_del_init(&event_id_data->event_id_node); - nvgpu_mutex_release(&ch->event_id_list_lock); - } - - nvgpu_mutex_destroy(&event_id_data->lock); - gk20a_put(g); - nvgpu_kfree(g, event_id_data); - filp->private_data = NULL; - - return 0; -} - -const struct file_operations gk20a_event_id_ops = { - .owner = THIS_MODULE, - .poll = gk20a_event_id_poll, - .release = gk20a_event_id_release, -}; - -static int gk20a_channel_get_event_data_from_id(struct channel_gk20a *ch, - u32 event_id, - struct gk20a_event_id_data **event_id_data) -{ - struct gk20a_event_id_data *local_event_id_data; - bool event_found = false; - - nvgpu_mutex_acquire(&ch->event_id_list_lock); - list_for_each_entry(local_event_id_data, &ch->event_id_list, - 
event_id_node) { - if (local_event_id_data->event_id == event_id) { - event_found = true; - break; - } - } - nvgpu_mutex_release(&ch->event_id_list_lock); - - if (event_found) { - *event_id_data = local_event_id_data; - return 0; - } else { - return -1; - } -} - -void gk20a_channel_event_id_post_event(struct channel_gk20a *ch, - u32 event_id) -{ - struct gk20a_event_id_data *event_id_data; - int err = 0; - - err = gk20a_channel_get_event_data_from_id(ch, event_id, - &event_id_data); - if (err) - return; - - nvgpu_mutex_acquire(&event_id_data->lock); - - gk20a_dbg_info( - "posting event for event_id=%d on ch=%d\n", - event_id, ch->hw_chid); - event_id_data->event_posted = true; - - wake_up_interruptible_all(&event_id_data->event_id_wq); - - nvgpu_mutex_release(&event_id_data->lock); -} - -static int gk20a_channel_event_id_enable(struct channel_gk20a *ch, - int event_id, - int *fd) -{ - struct gk20a *g; - int err = 0; - int local_fd; - struct file *file; - char name[64]; - struct gk20a_event_id_data *event_id_data; - - g = gk20a_get(ch->g); - if (!g) - return -ENODEV; - - err = gk20a_channel_get_event_data_from_id(ch, - event_id, &event_id_data); - if (err == 0) { - /* We already have event enabled */ - err = -EINVAL; - goto free_ref; - } - - err = get_unused_fd_flags(O_RDWR); - if (err < 0) - goto free_ref; - local_fd = err; - - snprintf(name, sizeof(name), "nvgpu-event%d-fd%d", - event_id, local_fd); - file = anon_inode_getfile(name, &gk20a_event_id_ops, - NULL, O_RDWR); - if (IS_ERR(file)) { - err = PTR_ERR(file); - goto clean_up; - } - - event_id_data = nvgpu_kzalloc(ch->g, sizeof(*event_id_data)); - if (!event_id_data) { - err = -ENOMEM; - goto clean_up_file; - } - event_id_data->g = g; - event_id_data->id = ch->hw_chid; - event_id_data->is_tsg = false; - event_id_data->event_id = event_id; - - init_waitqueue_head(&event_id_data->event_id_wq); - err = nvgpu_mutex_init(&event_id_data->lock); - if (err) - goto clean_up_free; - INIT_LIST_HEAD(&event_id_data->event_id_node); - - nvgpu_mutex_acquire(&ch->event_id_list_lock); - list_add_tail(&event_id_data->event_id_node, &ch->event_id_list); - nvgpu_mutex_release(&ch->event_id_list_lock); - - fd_install(local_fd, file); - file->private_data = event_id_data; - - *fd = local_fd; - - return 0; - -clean_up_free: - kfree(event_id_data); -clean_up_file: - fput(file); -clean_up: - put_unused_fd(local_fd); -free_ref: - gk20a_put(g); - return err; -} - -static int gk20a_channel_event_id_ctrl(struct channel_gk20a *ch, - struct nvgpu_event_id_ctrl_args *args) -{ - int err = 0; - int fd = -1; - - if (args->event_id >= NVGPU_IOCTL_CHANNEL_EVENT_ID_MAX) - return -EINVAL; - - if (gk20a_is_channel_marked_as_tsg(ch)) - return -EINVAL; - - switch (args->cmd) { - case NVGPU_IOCTL_CHANNEL_EVENT_ID_CMD_ENABLE: - err = gk20a_channel_event_id_enable(ch, args->event_id, &fd); - if (!err) - args->event_fd = fd; - break; - - default: - gk20a_err(dev_from_gk20a(ch->g), - "unrecognized channel event id cmd: 0x%x", - args->cmd); - err = -EINVAL; - break; - } - - return err; -} - -static int gk20a_channel_zcull_bind(struct channel_gk20a *ch, - struct nvgpu_zcull_bind_args *args) -{ - struct gk20a *g = ch->g; - struct gr_gk20a *gr = &g->gr; - - gk20a_dbg_fn(""); - - return g->ops.gr.bind_ctxsw_zcull(g, gr, ch, - args->gpu_va, args->mode); -} - -/* in this context the "channel" is the host1x channel which - * maps to *all* gk20a channels */ -int gk20a_channel_suspend(struct gk20a *g) -{ - struct fifo_gk20a *f = &g->fifo; - u32 chid; - bool channels_in_use = false; - u32 
-	u32 active_runlist_ids = 0;
-
-	gk20a_dbg_fn("");
-
-	for (chid = 0; chid < f->num_channels; chid++) {
-		struct channel_gk20a *ch = &f->channel[chid];
-		if (gk20a_channel_get(ch)) {
-			gk20a_dbg_info("suspend channel %d", chid);
-			/* disable channel */
-			gk20a_disable_channel_tsg(g, ch);
-			/* preempt the channel */
-			gk20a_fifo_preempt(g, ch);
-			/* wait for channel update notifiers */
-			if (ch->update_fn)
-				cancel_work_sync(&ch->update_fn_work);
-
-			channels_in_use = true;
-
-			active_runlist_ids |= BIT(ch->runlist_id);
-
-			gk20a_channel_put(ch);
-		}
-	}
-
-	if (channels_in_use) {
-		gk20a_fifo_update_runlist_ids(g, active_runlist_ids, ~0, false, true);
+	if (channels_in_use) {
+		gk20a_fifo_update_runlist_ids(g, active_runlist_ids, ~0, false, true);
 
 		for (chid = 0; chid < f->num_channels; chid++) {
 			if (gk20a_channel_get(&f->channel[chid])) {
@@ -3533,421 +2820,3 @@ void gk20a_channel_semaphore_wakeup(struct gk20a *g, bool post_events)
 		}
 	}
 }
-
-static int gk20a_ioctl_channel_submit_gpfifo(
-	struct channel_gk20a *ch,
-	struct nvgpu_submit_gpfifo_args *args)
-{
-	struct gk20a_fence *fence_out;
-	struct fifo_profile_gk20a *profile = NULL;
-
-	int ret = 0;
-	gk20a_dbg_fn("");
-
-#ifdef CONFIG_DEBUG_FS
-	profile = gk20a_fifo_profile_acquire(ch->g);
-
-	if (profile)
-		profile->timestamp[PROFILE_IOCTL_ENTRY] = sched_clock();
-#endif
-	if (ch->has_timedout)
-		return -ETIMEDOUT;
-	ret = gk20a_submit_channel_gpfifo(ch, NULL, args, args->num_entries,
-					args->flags, &args->fence,
-					&fence_out, false, profile);
-
-	if (ret)
-		goto clean_up;
-
-	/* Convert fence_out to something we can pass back to user space. */
-	if (args->flags & NVGPU_SUBMIT_GPFIFO_FLAGS_FENCE_GET) {
-		if (args->flags & NVGPU_SUBMIT_GPFIFO_FLAGS_SYNC_FENCE) {
-			int fd = gk20a_fence_install_fd(fence_out);
-			if (fd < 0)
-				ret = fd;
-			else
-				args->fence.id = fd;
-		} else {
-			args->fence.id = fence_out->syncpt_id;
-			args->fence.value = fence_out->syncpt_value;
-		}
-	}
-	gk20a_fence_put(fence_out);
-#ifdef CONFIG_DEBUG_FS
-	if (profile) {
-		profile->timestamp[PROFILE_IOCTL_EXIT] = sched_clock();
-		gk20a_fifo_profile_release(ch->g, profile);
-	}
-#endif
-clean_up:
-	return ret;
-}
-
-long gk20a_channel_ioctl(struct file *filp,
-	unsigned int cmd, unsigned long arg)
-{
-	struct channel_priv *priv = filp->private_data;
-	struct channel_gk20a *ch = priv->c;
-	struct gk20a *g = ch->g;
-	struct device *dev = g->dev;
-	u8 buf[NVGPU_IOCTL_CHANNEL_MAX_ARG_SIZE] = {0};
-	int err = 0;
-
-	gk20a_dbg_fn("start %d", _IOC_NR(cmd));
-
-	if ((_IOC_TYPE(cmd) != NVGPU_IOCTL_MAGIC) ||
-		(_IOC_NR(cmd) == 0) ||
-		(_IOC_NR(cmd) > NVGPU_IOCTL_CHANNEL_LAST) ||
-		(_IOC_SIZE(cmd) > NVGPU_IOCTL_CHANNEL_MAX_ARG_SIZE))
-		return -EINVAL;
-
-	if (_IOC_DIR(cmd) & _IOC_WRITE) {
-		if (copy_from_user(buf, (void __user *)arg, _IOC_SIZE(cmd)))
-			return -EFAULT;
-	}
-
-	/* take a ref or return timeout if channel refs can't be taken */
-	ch = gk20a_channel_get(ch);
-	if (!ch)
-		return -ETIMEDOUT;
-
-	/* protect our sanity for threaded userspace - most of the channel is
-	 * not thread safe */
-	nvgpu_mutex_acquire(&ch->ioctl_lock);
-
-	/* this ioctl call keeps a ref to the file which keeps a ref to the
-	 * channel */
-
-	switch (cmd) {
-	case NVGPU_IOCTL_CHANNEL_OPEN:
-		err = gk20a_channel_open_ioctl(ch->g,
-			(struct nvgpu_channel_open_args *)buf);
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_NVMAP_FD:
-		break;
-	case NVGPU_IOCTL_CHANNEL_ALLOC_OBJ_CTX:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = ch->g->ops.gr.alloc_obj_ctx(ch,
-				(struct nvgpu_alloc_obj_ctx_args *)buf);
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_ALLOC_GPFIFO_EX:
-	{
-		struct nvgpu_alloc_gpfifo_ex_args *alloc_gpfifo_ex_args =
-			(struct nvgpu_alloc_gpfifo_ex_args *)buf;
-
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-
-		if (!is_power_of_2(alloc_gpfifo_ex_args->num_entries)) {
-			err = -EINVAL;
-			gk20a_idle(g);
-			break;
-		}
-		err = gk20a_alloc_channel_gpfifo(ch, alloc_gpfifo_ex_args);
-		gk20a_idle(g);
-		break;
-	}
-	case NVGPU_IOCTL_CHANNEL_ALLOC_GPFIFO:
-	{
-		struct nvgpu_alloc_gpfifo_ex_args alloc_gpfifo_ex_args;
-		struct nvgpu_alloc_gpfifo_args *alloc_gpfifo_args =
-			(struct nvgpu_alloc_gpfifo_args *)buf;
-
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-
-		/* prepare new args structure */
-		memset(&alloc_gpfifo_ex_args, 0,
-				sizeof(struct nvgpu_alloc_gpfifo_ex_args));
-		/*
-		 * Kernel can insert one extra gpfifo entry before user
-		 * submitted gpfifos and another one after, for internal usage.
-		 * Triple the requested size.
-		 */
-		alloc_gpfifo_ex_args.num_entries = roundup_pow_of_two(
-				alloc_gpfifo_args->num_entries * 3);
-		alloc_gpfifo_ex_args.flags = alloc_gpfifo_args->flags;
-
-		err = gk20a_alloc_channel_gpfifo(ch, &alloc_gpfifo_ex_args);
-		gk20a_idle(g);
-		break;
-	}
-	case NVGPU_IOCTL_CHANNEL_SUBMIT_GPFIFO:
-		err = gk20a_ioctl_channel_submit_gpfifo(ch,
-				(struct nvgpu_submit_gpfifo_args *)buf);
-		break;
-	case NVGPU_IOCTL_CHANNEL_WAIT:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-
-		/* waiting is thread-safe, not dropping this mutex could
-		 * deadlock in certain conditions */
-		nvgpu_mutex_release(&ch->ioctl_lock);
-
-		err = gk20a_channel_wait(ch,
-				(struct nvgpu_wait_args *)buf);
-
-		nvgpu_mutex_acquire(&ch->ioctl_lock);
-
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_ZCULL_BIND:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_channel_zcull_bind(ch,
-				(struct nvgpu_zcull_bind_args *)buf);
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_ERROR_NOTIFIER:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_init_error_notifier(ch,
-				(struct nvgpu_set_error_notifier *)buf);
-		gk20a_idle(g);
-		break;
-#ifdef CONFIG_GK20A_CYCLE_STATS
-	case NVGPU_IOCTL_CHANNEL_CYCLE_STATS:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_channel_cycle_stats(ch,
-				(struct nvgpu_cycle_stats_args *)buf);
-		gk20a_idle(g);
-		break;
-#endif
-	case NVGPU_IOCTL_CHANNEL_SET_TIMEOUT:
-	{
-		u32 timeout =
-			(u32)((struct nvgpu_set_timeout_args *)buf)->timeout;
-		gk20a_dbg(gpu_dbg_gpu_dbg, "setting timeout (%d ms) for chid %d",
-			timeout, ch->hw_chid);
-		ch->timeout_ms_max = timeout;
-		gk20a_channel_trace_sched_param(
-			trace_gk20a_channel_set_timeout, ch);
-		break;
-	}
-	case NVGPU_IOCTL_CHANNEL_SET_TIMEOUT_EX:
-	{
-		u32 timeout =
-			(u32)((struct nvgpu_set_timeout_args *)buf)->timeout;
-		bool timeout_debug_dump = !((u32)
-			((struct nvgpu_set_timeout_ex_args *)buf)->flags &
-			(1 << NVGPU_TIMEOUT_FLAG_DISABLE_DUMP));
-		gk20a_dbg(gpu_dbg_gpu_dbg, "setting timeout (%d ms) for chid %d",
-			timeout, ch->hw_chid);
-		ch->timeout_ms_max = timeout;
-		ch->timeout_debug_dump = timeout_debug_dump;
-		gk20a_channel_trace_sched_param(
-			trace_gk20a_channel_set_timeout, ch);
-		break;
-	}
-	case NVGPU_IOCTL_CHANNEL_GET_TIMEDOUT:
-		((struct nvgpu_get_param_args *)buf)->value =
-			ch->has_timedout;
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_PRIORITY:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = ch->g->ops.fifo.channel_set_priority(ch,
-			((struct nvgpu_set_priority_args *)buf)->priority);
-
-		gk20a_idle(g);
-		gk20a_channel_trace_sched_param(
-			trace_gk20a_channel_set_priority, ch);
-		break;
-	case NVGPU_IOCTL_CHANNEL_ENABLE:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		if (ch->g->ops.fifo.enable_channel)
-			ch->g->ops.fifo.enable_channel(ch);
-		else
-			err = -ENOSYS;
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_DISABLE:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		if (ch->g->ops.fifo.disable_channel)
-			ch->g->ops.fifo.disable_channel(ch);
-		else
-			err = -ENOSYS;
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_PREEMPT:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_fifo_preempt(ch->g, ch);
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_FORCE_RESET:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = ch->g->ops.fifo.force_reset_ch(ch,
-			NVGPU_CHANNEL_RESETCHANNEL_VERIF_ERROR, true);
-		gk20a_idle(g);
-		break;
-	case NVGPU_IOCTL_CHANNEL_EVENT_ID_CTRL:
-		err = gk20a_channel_event_id_ctrl(ch,
-			(struct nvgpu_event_id_ctrl_args *)buf);
-		break;
-#ifdef CONFIG_GK20A_CYCLE_STATS
-	case NVGPU_IOCTL_CHANNEL_CYCLE_STATS_SNAPSHOT:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_channel_cycle_stats_snapshot(ch,
-			(struct nvgpu_cycle_stats_snapshot_args *)buf);
-		gk20a_idle(g);
-		break;
-#endif
-	case NVGPU_IOCTL_CHANNEL_WDT:
-		err = gk20a_channel_set_wdt_status(ch,
-			(struct nvgpu_channel_wdt_args *)buf);
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_RUNLIST_INTERLEAVE:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = gk20a_channel_set_runlist_interleave(ch,
-			((struct nvgpu_runlist_interleave_args *)buf)->level);
-
-		gk20a_idle(g);
-		gk20a_channel_trace_sched_param(
-			trace_gk20a_channel_set_runlist_interleave, ch);
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_TIMESLICE:
-		err = gk20a_busy(g);
-		if (err) {
-			dev_err(dev,
-				"%s: failed to host gk20a for ioctl cmd: 0x%x",
-				__func__, cmd);
-			break;
-		}
-		err = ch->g->ops.fifo.channel_set_timeslice(ch,
-			((struct nvgpu_timeslice_args *)buf)->timeslice_us);
-
-		gk20a_idle(g);
-		gk20a_channel_trace_sched_param(
-			trace_gk20a_channel_set_timeslice, ch);
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_PREEMPTION_MODE:
-		if (ch->g->ops.gr.set_preemption_mode) {
-			err = gk20a_busy(g);
-			if (err) {
-				dev_err(dev,
-					"%s: failed to host gk20a for ioctl cmd: 0x%x",
-					__func__, cmd);
-				break;
-			}
-			err = ch->g->ops.gr.set_preemption_mode(ch,
-				((struct nvgpu_preemption_mode_args *)buf)->graphics_preempt_mode,
-				((struct nvgpu_preemption_mode_args *)buf)->compute_preempt_mode);
-			gk20a_idle(g);
-		} else {
-			err = -EINVAL;
-		}
-		break;
-	case NVGPU_IOCTL_CHANNEL_SET_BOOSTED_CTX:
-		if (ch->g->ops.gr.set_boosted_ctx) {
-			bool boost =
-				((struct nvgpu_boosted_ctx_args *)buf)->boost;
-
-			err = gk20a_busy(g);
-			if (err) {
-				dev_err(dev,
-					"%s: failed to host gk20a for ioctl cmd: 0x%x",
-					__func__, cmd);
-				break;
-			}
-			err = ch->g->ops.gr.set_boosted_ctx(ch, boost);
-			gk20a_idle(g);
-		} else {
-			err = -EINVAL;
-		}
-		break;
-	default:
-		dev_dbg(dev, "unrecognized ioctl cmd: 0x%x", cmd);
-		err = -ENOTTY;
-		break;
-	}
-
-	if ((err == 0) && (_IOC_DIR(cmd) & _IOC_READ))
-		err = copy_to_user((void __user *)arg, buf, _IOC_SIZE(cmd));
-
-	nvgpu_mutex_release(&ch->ioctl_lock);
-
-	gk20a_channel_put(ch);
-
-	gk20a_dbg_fn("end");
-
-	return err;
-}
diff --git a/drivers/gpu/nvgpu/gk20a/channel_gk20a.h b/drivers/gpu/nvgpu/gk20a/channel_gk20a.h
index 37b1d945..bcfdadec 100644
--- a/drivers/gpu/nvgpu/gk20a/channel_gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/channel_gk20a.h
@@ -18,13 +18,8 @@
 #ifndef CHANNEL_GK20A_H
 #define CHANNEL_GK20A_H
 
-#include
-#include
-#include
-#include
 #include
 #include
-#include
 #include
 #include
@@ -359,8 +354,13 @@ int gk20a_submit_channel_gpfifo(struct channel_gk20a *c,
 				bool force_need_sync_fence,
 				struct fifo_profile_gk20a *profile);
 
-int gk20a_alloc_channel_gpfifo(struct channel_gk20a *c,
-		struct nvgpu_alloc_gpfifo_ex_args *args);
+int gk20a_channel_alloc_gpfifo(struct channel_gk20a *c,
+		unsigned int num_entries,
+		unsigned int num_inflight_jobs,
+		u32 flags);
+void gk20a_channel_free_error_notifiers(struct channel_gk20a *ch);
+void gk20a_channel_free_cycle_stats_buffer(struct channel_gk20a *ch);
+int gk20a_channel_free_cycle_stats_snapshot(struct channel_gk20a *ch);
 
 void gk20a_channel_timeout_restart_all_channels(struct gk20a *g);
diff --git a/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c b/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
index 1c3ba9c2..2f6a85a5 100644
--- a/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
@@ -22,6 +22,8 @@
 #include
 #include
 #include
+#include
+#include
 #include
 #include
diff --git a/drivers/gpu/nvgpu/gk20a/sched_gk20a.c b/drivers/gpu/nvgpu/gk20a/sched_gk20a.c
index 49a09e99..a58de920 100644
--- a/drivers/gpu/nvgpu/gk20a/sched_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/sched_gk20a.c
@@ -21,6 +21,8 @@
 #include
 #include
 #include
+#include
+#include
 #include
 #include
diff --git a/drivers/gpu/nvgpu/gp106/xve_gp106.c b/drivers/gpu/nvgpu/gp106/xve_gp106.c
index ecc6de60..64d60794 100644
--- a/drivers/gpu/nvgpu/gp106/xve_gp106.c
+++ b/drivers/gpu/nvgpu/gp106/xve_gp106.c
@@ -17,6 +17,7 @@
 #include
 #include
 #include
+#include
 #include "gk20a/gk20a.h"
 #include "gm206/bios_gm206.h"
--
cgit v1.2.2