From 57fb527a7e33384341fc18f1f918d5a8225057f5 Mon Sep 17 00:00:00 2001 From: Peter Daifuku Date: Fri, 6 Oct 2017 16:27:14 -0700 Subject: gpu: nvgpu: vgpu: flatten out vgpu hal Instead of calling the native HAL init function then adding multiple layers of modification for VGPU, flatten out the sequence so that all entry points are set statically and visible in a single file. JIRA ESRM-30 Change-Id: Ie424abb48bce5038874851d399baac5e4bb7d27c Signed-off-by: Peter Daifuku Reviewed-on: https://git-master.nvidia.com/r/1574616 Reviewed-by: mobile promotions Tested-by: mobile promotions --- drivers/gpu/nvgpu/Makefile.nvgpu | 4 +- drivers/gpu/nvgpu/gm20b/hal_gm20b.c | 2 +- drivers/gpu/nvgpu/gm20b/hal_gm20b.h | 3 +- drivers/gpu/nvgpu/gp10b/hal_gp10b.c | 2 +- drivers/gpu/nvgpu/gp10b/hal_gp10b.h | 3 +- drivers/gpu/nvgpu/vgpu/ce2_vgpu.c | 7 +- drivers/gpu/nvgpu/vgpu/css_vgpu.c | 22 +- drivers/gpu/nvgpu/vgpu/css_vgpu.h | 40 ++ drivers/gpu/nvgpu/vgpu/dbg_vgpu.c | 29 +- drivers/gpu/nvgpu/vgpu/dbg_vgpu.h | 47 ++ drivers/gpu/nvgpu/vgpu/debug_vgpu.c | 33 -- drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.c | 41 +- drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.h | 23 +- drivers/gpu/nvgpu/vgpu/fifo_vgpu.c | 61 +-- drivers/gpu/nvgpu/vgpu/fifo_vgpu.h | 65 +++ drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.c | 9 +- drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.h | 4 +- drivers/gpu/nvgpu/vgpu/gm20b/vgpu_hal_gm20b.c | 579 ++++++++++++++++++++++- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_fifo_gp10b.h | 30 -- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.c | 21 +- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.h | 19 +- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_hal_gp10b.c | 624 ++++++++++++++++++++++++- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.c | 15 +- drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.h | 19 +- drivers/gpu/nvgpu/vgpu/gr_vgpu.c | 69 +-- drivers/gpu/nvgpu/vgpu/gr_vgpu.h | 44 ++ drivers/gpu/nvgpu/vgpu/ltc_vgpu.c | 17 +- drivers/gpu/nvgpu/vgpu/ltc_vgpu.h | 33 ++ drivers/gpu/nvgpu/vgpu/mm_vgpu.c | 33 +- drivers/gpu/nvgpu/vgpu/mm_vgpu.h | 56 +++ drivers/gpu/nvgpu/vgpu/tsg_vgpu.c | 17 +- drivers/gpu/nvgpu/vgpu/vgpu.c | 23 +- drivers/gpu/nvgpu/vgpu/vgpu.h | 40 +- 33 files changed, 1630 insertions(+), 404 deletions(-) create mode 100644 drivers/gpu/nvgpu/vgpu/css_vgpu.h create mode 100644 drivers/gpu/nvgpu/vgpu/dbg_vgpu.h delete mode 100644 drivers/gpu/nvgpu/vgpu/debug_vgpu.c create mode 100644 drivers/gpu/nvgpu/vgpu/fifo_vgpu.h delete mode 100644 drivers/gpu/nvgpu/vgpu/gp10b/vgpu_fifo_gp10b.h create mode 100644 drivers/gpu/nvgpu/vgpu/ltc_vgpu.h create mode 100644 drivers/gpu/nvgpu/vgpu/mm_vgpu.h diff --git a/drivers/gpu/nvgpu/Makefile.nvgpu b/drivers/gpu/nvgpu/Makefile.nvgpu index fa774566..9ba6f49a 100644 --- a/drivers/gpu/nvgpu/Makefile.nvgpu +++ b/drivers/gpu/nvgpu/Makefile.nvgpu @@ -153,7 +153,6 @@ nvgpu-$(CONFIG_TEGRA_GR_VIRTUALIZATION) += \ vgpu/fifo_vgpu.o \ vgpu/ce2_vgpu.o \ vgpu/mm_vgpu.o \ - vgpu/debug_vgpu.o \ vgpu/vgpu.o \ vgpu/dbg_vgpu.o \ vgpu/fecs_trace_vgpu.o \ @@ -245,8 +244,7 @@ nvgpu-$(CONFIG_TEGRA_GK20A) += common/linux/platform_gp10b_tegra.o nvgpu-$(CONFIG_TEGRA_GR_VIRTUALIZATION) += \ vgpu/gp10b/vgpu_hal_gp10b.o \ vgpu/gp10b/vgpu_gr_gp10b.o \ - vgpu/gp10b/vgpu_mm_gp10b.o \ - vgpu/gp10b/vgpu_fifo_gp10b.o + vgpu/gp10b/vgpu_mm_gp10b.o endif ifeq ($(CONFIG_ARCH_TEGRA_19x_SOC),y) diff --git a/drivers/gpu/nvgpu/gm20b/hal_gm20b.c b/drivers/gpu/nvgpu/gm20b/hal_gm20b.c index 76c87c00..39d05978 100644 --- a/drivers/gpu/nvgpu/gm20b/hal_gm20b.c +++ b/drivers/gpu/nvgpu/gm20b/hal_gm20b.c @@ -71,7 +71,7 @@ #define PRIV_SECURITY_DISABLE 0x01 -static 
int gm20b_get_litter_value(struct gk20a *g, int value) +int gm20b_get_litter_value(struct gk20a *g, int value) { int ret = EINVAL; switch (value) { diff --git a/drivers/gpu/nvgpu/gm20b/hal_gm20b.h b/drivers/gpu/nvgpu/gm20b/hal_gm20b.h index 1e149ce2..22eae182 100644 --- a/drivers/gpu/nvgpu/gm20b/hal_gm20b.h +++ b/drivers/gpu/nvgpu/gm20b/hal_gm20b.h @@ -1,7 +1,7 @@ /* * GM20B Graphics * - * Copyright (c) 2014, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2014-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -27,4 +27,5 @@ struct gk20a; int gm20b_init_hal(struct gk20a *g); +int gm20b_get_litter_value(struct gk20a *g, int value); #endif diff --git a/drivers/gpu/nvgpu/gp10b/hal_gp10b.c b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c index f298f26c..61284225 100644 --- a/drivers/gpu/nvgpu/gp10b/hal_gp10b.c +++ b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c @@ -80,7 +80,7 @@ #include #include -static int gp10b_get_litter_value(struct gk20a *g, int value) +int gp10b_get_litter_value(struct gk20a *g, int value) { int ret = EINVAL; switch (value) { diff --git a/drivers/gpu/nvgpu/gp10b/hal_gp10b.h b/drivers/gpu/nvgpu/gp10b/hal_gp10b.h index f2924809..cf3c295d 100644 --- a/drivers/gpu/nvgpu/gp10b/hal_gp10b.h +++ b/drivers/gpu/nvgpu/gp10b/hal_gp10b.h @@ -1,7 +1,7 @@ /* * GP10B Tegra HAL interface * - * Copyright (c) 2014, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2014-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -27,4 +27,5 @@ struct gk20a; int gp10b_init_hal(struct gk20a *gops); +int gp10b_get_litter_value(struct gk20a *g, int value); #endif diff --git a/drivers/gpu/nvgpu/vgpu/ce2_vgpu.c b/drivers/gpu/nvgpu/vgpu/ce2_vgpu.c index e53a3c18..bd225f0c 100644 --- a/drivers/gpu/nvgpu/vgpu/ce2_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/ce2_vgpu.c @@ -43,14 +43,9 @@ int vgpu_ce2_nonstall_isr(struct gk20a *g, return 0; } -static u32 vgpu_ce_get_num_pce(struct gk20a *g) +u32 vgpu_ce_get_num_pce(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); return priv->constants.num_pce; } - -void vgpu_init_ce2_ops(struct gpu_ops *gops) -{ - gops->ce2.get_num_pce = vgpu_ce_get_num_pce; -} diff --git a/drivers/gpu/nvgpu/vgpu/css_vgpu.c b/drivers/gpu/nvgpu/vgpu/css_vgpu.c index 0b3c6a25..bcb01fac 100644 --- a/drivers/gpu/nvgpu/vgpu/css_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/css_vgpu.c @@ -29,6 +29,7 @@ #include "gk20a/platform_gk20a.h" #include "gk20a/css_gr_gk20a.h" #include "vgpu.h" +#include "css_vgpu.h" static struct tegra_hv_ivm_cookie *css_cookie; @@ -93,7 +94,7 @@ fail: return err; } -static void vgpu_css_release_snapshot_buffer(struct gr_gk20a *gr) +void vgpu_css_release_snapshot_buffer(struct gr_gk20a *gr) { struct gk20a_cs_snapshot *data = gr->cs_data; @@ -108,7 +109,7 @@ static void vgpu_css_release_snapshot_buffer(struct gr_gk20a *gr) gk20a_dbg_info("cyclestats(vgpu): buffer for snapshots released\n"); } -static int vgpu_css_flush_snapshots(struct channel_gk20a *ch, +int vgpu_css_flush_snapshots(struct channel_gk20a *ch, u32 *pending, bool *hw_overflow) { struct gk20a *g = ch->g; @@ -164,7 +165,7 @@ static int vgpu_css_attach(struct channel_gk20a *ch, return err; } -static int vgpu_css_detach(struct channel_gk20a *ch, +int vgpu_css_detach(struct channel_gk20a *ch, struct 
gk20a_cs_snapshot_client *cs_client) { struct gk20a *g = ch->g; @@ -190,7 +191,7 @@ static int vgpu_css_detach(struct channel_gk20a *ch, return err; } -static int vgpu_css_enable_snapshot_buffer(struct channel_gk20a *ch, +int vgpu_css_enable_snapshot_buffer(struct channel_gk20a *ch, struct gk20a_cs_snapshot_client *cs_client) { int ret; @@ -202,17 +203,4 @@ static int vgpu_css_enable_snapshot_buffer(struct channel_gk20a *ch, ret = vgpu_css_init_snapshot_buffer(&ch->g->gr); return ret; } - -void vgpu_init_css_ops(struct gpu_ops *gops) -{ - gops->css.enable_snapshot = vgpu_css_enable_snapshot_buffer; - gops->css.disable_snapshot = vgpu_css_release_snapshot_buffer; - gops->css.check_data_available = vgpu_css_flush_snapshots; - gops->css.detach_snapshot = vgpu_css_detach; - - /* Following entries are not used when virtual, NULL them */ - gops->css.set_handled_snapshots = NULL; - gops->css.allocate_perfmon_ids = NULL; - gops->css.release_perfmon_ids = NULL; -} #endif /* CONFIG_GK20A_CYCLE_STATS */ diff --git a/drivers/gpu/nvgpu/vgpu/css_vgpu.h b/drivers/gpu/nvgpu/vgpu/css_vgpu.h new file mode 100644 index 00000000..b61c9862 --- /dev/null +++ b/drivers/gpu/nvgpu/vgpu/css_vgpu.h @@ -0,0 +1,40 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER + * DEALINGS IN THE SOFTWARE. 
+ */ + +#ifndef _CSS_VGPU_H_ +#define _CSS_VGPU_H_ + +#include + +struct gr_gk20a; +struct channel_gk20a; +struct gk20a_cs_snapshot_client; + +void vgpu_css_release_snapshot_buffer(struct gr_gk20a *gr); +int vgpu_css_flush_snapshots(struct channel_gk20a *ch, + u32 *pending, bool *hw_overflow); +int vgpu_css_detach(struct channel_gk20a *ch, + struct gk20a_cs_snapshot_client *cs_client); +int vgpu_css_enable_snapshot_buffer(struct channel_gk20a *ch, + struct gk20a_cs_snapshot_client *cs_client); + +#endif diff --git a/drivers/gpu/nvgpu/vgpu/dbg_vgpu.c b/drivers/gpu/nvgpu/vgpu/dbg_vgpu.c index 416b8903..6e8ab561 100644 --- a/drivers/gpu/nvgpu/vgpu/dbg_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/dbg_vgpu.c @@ -27,10 +27,11 @@ #include "gk20a/channel_gk20a.h" #include "gk20a/dbg_gpu_gk20a.h" #include "vgpu.h" +#include "dbg_vgpu.h" #include -static int vgpu_exec_regops(struct dbg_session_gk20a *dbg_s, +int vgpu_exec_regops(struct dbg_session_gk20a *dbg_s, struct nvgpu_dbg_gpu_reg_op *ops, u64 num_ops) { @@ -76,7 +77,7 @@ fail: return err; } -static int vgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, __u32 mode) +int vgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, __u32 mode) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_set_powergate_params *p = &msg.params.set_powergate; @@ -124,7 +125,7 @@ static int vgpu_sendrecv_prof_cmd(struct dbg_session_gk20a *dbg_s, u32 mode) return err; } -static bool vgpu_check_and_set_global_reservation( +bool vgpu_check_and_set_global_reservation( struct dbg_session_gk20a *dbg_s, struct dbg_profiler_object_data *prof_obj) { @@ -144,7 +145,7 @@ static bool vgpu_check_and_set_global_reservation( return false; } -static bool vgpu_check_and_set_context_reservation( +bool vgpu_check_and_set_context_reservation( struct dbg_session_gk20a *dbg_s, struct dbg_profiler_object_data *prof_obj) { @@ -167,7 +168,7 @@ static bool vgpu_check_and_set_context_reservation( return false; } -static void vgpu_release_profiler_reservation( +void vgpu_release_profiler_reservation( struct dbg_session_gk20a *dbg_s, struct dbg_profiler_object_data *prof_obj) { @@ -205,26 +206,12 @@ static int vgpu_sendrecv_perfbuf_cmd(struct gk20a *g, u64 offset, u32 size) return err; } -static int vgpu_perfbuffer_enable(struct gk20a *g, u64 offset, u32 size) +int vgpu_perfbuffer_enable(struct gk20a *g, u64 offset, u32 size) { return vgpu_sendrecv_perfbuf_cmd(g, offset, size); } -static int vgpu_perfbuffer_disable(struct gk20a *g) +int vgpu_perfbuffer_disable(struct gk20a *g) { return vgpu_sendrecv_perfbuf_cmd(g, 0, 0); } - -void vgpu_init_dbg_session_ops(struct gpu_ops *gops) -{ - gops->dbg_session_ops.exec_reg_ops = vgpu_exec_regops; - gops->dbg_session_ops.dbg_set_powergate = vgpu_dbg_set_powergate; - gops->dbg_session_ops.check_and_set_global_reservation = - vgpu_check_and_set_global_reservation; - gops->dbg_session_ops.check_and_set_context_reservation = - vgpu_check_and_set_context_reservation; - gops->dbg_session_ops.release_profiler_reservation = - vgpu_release_profiler_reservation; - gops->dbg_session_ops.perfbuffer_enable = vgpu_perfbuffer_enable; - gops->dbg_session_ops.perfbuffer_disable = vgpu_perfbuffer_disable; -} diff --git a/drivers/gpu/nvgpu/vgpu/dbg_vgpu.h b/drivers/gpu/nvgpu/vgpu/dbg_vgpu.h new file mode 100644 index 00000000..fcdea931 --- /dev/null +++ b/drivers/gpu/nvgpu/vgpu/dbg_vgpu.h @@ -0,0 +1,47 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. 
+ * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER + * DEALINGS IN THE SOFTWARE. + */ + +#ifndef _DBG_VGPU_H_ +#define _DBG_VGPU_H_ + +struct dbg_session_gk20a; +struct nvgpu_dbg_gpu_reg_op; +struct dbg_profiler_object_data; +struct gk20a; + +int vgpu_exec_regops(struct dbg_session_gk20a *dbg_s, + struct nvgpu_dbg_gpu_reg_op *ops, + u64 num_ops); +int vgpu_dbg_set_powergate(struct dbg_session_gk20a *dbg_s, __u32 mode); +bool vgpu_check_and_set_global_reservation( + struct dbg_session_gk20a *dbg_s, + struct dbg_profiler_object_data *prof_obj); +bool vgpu_check_and_set_context_reservation( + struct dbg_session_gk20a *dbg_s, + struct dbg_profiler_object_data *prof_obj); + +void vgpu_release_profiler_reservation( + struct dbg_session_gk20a *dbg_s, + struct dbg_profiler_object_data *prof_obj); +int vgpu_perfbuffer_enable(struct gk20a *g, u64 offset, u32 size); +int vgpu_perfbuffer_disable(struct gk20a *g); +#endif diff --git a/drivers/gpu/nvgpu/vgpu/debug_vgpu.c b/drivers/gpu/nvgpu/vgpu/debug_vgpu.c deleted file mode 100644 index cb858c22..00000000 --- a/drivers/gpu/nvgpu/vgpu/debug_vgpu.c +++ /dev/null @@ -1,33 +0,0 @@ -/* - * Copyright (C) 2015 NVIDIA Corporation. All rights reserved. - * - * Permission is hereby granted, free of charge, to any person obtaining a - * copy of this software and associated documentation files (the "Software"), - * to deal in the Software without restriction, including without limitation - * the rights to use, copy, modify, merge, publish, distribute, sublicense, - * and/or sell copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following conditions: - * - * The above copyright notice and this permission notice shall be included in - * all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR - * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, - * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL - * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER - * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER - * DEALINGS IN THE SOFTWARE. 
- */ - -#include "vgpu/vgpu.h" - -static void vgpu_debug_show_dump(struct gk20a *g, struct gk20a_debug_output *o) -{ - /* debug dump not supported */ -} - -void vgpu_init_debug_ops(struct gpu_ops *gops) -{ - gops->debug.show_dump = vgpu_debug_show_dump; -} diff --git a/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.c b/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.c index 84de9d0b..762cc10a 100644 --- a/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.c @@ -41,7 +41,7 @@ struct vgpu_fecs_trace { void *buf; }; -static int vgpu_fecs_trace_init(struct gk20a *g) +int vgpu_fecs_trace_init(struct gk20a *g) { struct device *dev = dev_from_gk20a(g); struct device_node *np = dev->of_node; @@ -102,7 +102,7 @@ fail: return err; } -static int vgpu_fecs_trace_deinit(struct gk20a *g) +int vgpu_fecs_trace_deinit(struct gk20a *g) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; @@ -112,7 +112,7 @@ static int vgpu_fecs_trace_deinit(struct gk20a *g) return 0; } -static int vgpu_fecs_trace_enable(struct gk20a *g) +int vgpu_fecs_trace_enable(struct gk20a *g) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; struct tegra_vgpu_cmd_msg msg = { @@ -128,7 +128,7 @@ static int vgpu_fecs_trace_enable(struct gk20a *g) return err; } -static int vgpu_fecs_trace_disable(struct gk20a *g) +int vgpu_fecs_trace_disable(struct gk20a *g) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; struct tegra_vgpu_cmd_msg msg = { @@ -144,14 +144,14 @@ static int vgpu_fecs_trace_disable(struct gk20a *g) return err; } -static bool vpgpu_fecs_trace_is_enabled(struct gk20a *g) +bool vgpu_fecs_trace_is_enabled(struct gk20a *g) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; return (vcst && vcst->enabled); } -static int vgpu_fecs_trace_poll(struct gk20a *g) +int vgpu_fecs_trace_poll(struct gk20a *g) { struct tegra_vgpu_cmd_msg msg = { .cmd = TEGRA_VGPU_CMD_FECS_TRACE_POLL, @@ -165,7 +165,7 @@ static int vgpu_fecs_trace_poll(struct gk20a *g) return err; } -static int vgpu_alloc_user_buffer(struct gk20a *g, void **buf, size_t *size) +int vgpu_alloc_user_buffer(struct gk20a *g, void **buf, size_t *size) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; @@ -174,12 +174,12 @@ static int vgpu_alloc_user_buffer(struct gk20a *g, void **buf, size_t *size) return 0; } -static int vgpu_free_user_buffer(struct gk20a *g) +int vgpu_free_user_buffer(struct gk20a *g) { return 0; } -static int vgpu_mmap_user_buffer(struct gk20a *g, struct vm_area_struct *vma) +int vgpu_mmap_user_buffer(struct gk20a *g, struct vm_area_struct *vma) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; unsigned long size = vcst->cookie->size; @@ -194,7 +194,7 @@ static int vgpu_mmap_user_buffer(struct gk20a *g, struct vm_area_struct *vma) vma->vm_page_prot); } -static int vgpu_fecs_trace_max_entries(struct gk20a *g, +int vgpu_fecs_trace_max_entries(struct gk20a *g, struct nvgpu_ctxsw_trace_filter *filter) { struct vgpu_fecs_trace *vcst = (struct vgpu_fecs_trace *)g->fecs_trace; @@ -206,7 +206,7 @@ static int vgpu_fecs_trace_max_entries(struct gk20a *g, #error "FECS trace filter size mismatch!" 
#endif -static int vgpu_fecs_trace_set_filter(struct gk20a *g, +int vgpu_fecs_trace_set_filter(struct gk20a *g, struct nvgpu_ctxsw_trace_filter *filter) { struct tegra_vgpu_cmd_msg msg = { @@ -223,25 +223,6 @@ static int vgpu_fecs_trace_set_filter(struct gk20a *g, return err; } -void vgpu_init_fecs_trace_ops(struct gpu_ops *ops) -{ - ops->fecs_trace.init = vgpu_fecs_trace_init; - ops->fecs_trace.deinit = vgpu_fecs_trace_deinit; - ops->fecs_trace.enable = vgpu_fecs_trace_enable; - ops->fecs_trace.disable = vgpu_fecs_trace_disable; - ops->fecs_trace.is_enabled = vpgpu_fecs_trace_is_enabled; - ops->fecs_trace.reset = NULL; - ops->fecs_trace.flush = NULL; - ops->fecs_trace.poll = vgpu_fecs_trace_poll; - ops->fecs_trace.bind_channel = NULL; - ops->fecs_trace.unbind_channel = NULL; - ops->fecs_trace.max_entries = vgpu_fecs_trace_max_entries; - ops->fecs_trace.alloc_user_buffer = vgpu_alloc_user_buffer; - ops->fecs_trace.free_user_buffer = vgpu_free_user_buffer; - ops->fecs_trace.mmap_user_buffer = vgpu_mmap_user_buffer; - ops->fecs_trace.set_filter = vgpu_fecs_trace_set_filter; -} - void vgpu_fecs_trace_data_update(struct gk20a *g) { gk20a_ctxsw_trace_wake_up(g, 0); diff --git a/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.h b/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.h index d20de773..392b344c 100644 --- a/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.h +++ b/drivers/gpu/nvgpu/vgpu/fecs_trace_vgpu.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2016-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -23,8 +23,25 @@ #ifndef __FECS_TRACE_VGPU_H #define __FECS_TRACE_VGPU_H -struct gpu_ops; -void vgpu_init_fecs_trace_ops(struct gpu_ops *ops); +#include + +struct gk20a; +struct vm_area_struct; +struct nvgpu_ctxsw_trace_filter; + void vgpu_fecs_trace_data_update(struct gk20a *g); +int vgpu_fecs_trace_init(struct gk20a *g); +int vgpu_fecs_trace_deinit(struct gk20a *g); +int vgpu_fecs_trace_enable(struct gk20a *g); +int vgpu_fecs_trace_disable(struct gk20a *g); +bool vgpu_fecs_trace_is_enabled(struct gk20a *g); +int vgpu_fecs_trace_poll(struct gk20a *g); +int vgpu_alloc_user_buffer(struct gk20a *g, void **buf, size_t *size); +int vgpu_free_user_buffer(struct gk20a *g); +int vgpu_mmap_user_buffer(struct gk20a *g, struct vm_area_struct *vma); +int vgpu_fecs_trace_max_entries(struct gk20a *g, + struct nvgpu_ctxsw_trace_filter *filter); +int vgpu_fecs_trace_set_filter(struct gk20a *g, + struct nvgpu_ctxsw_trace_filter *filter); #endif /* __FECS_TRACE_VGPU_H */ diff --git a/drivers/gpu/nvgpu/vgpu/fifo_vgpu.c b/drivers/gpu/nvgpu/vgpu/fifo_vgpu.c index 73a67d91..582894b9 100644 --- a/drivers/gpu/nvgpu/vgpu/fifo_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/fifo_vgpu.c @@ -32,12 +32,13 @@ #include #include "vgpu/vgpu.h" +#include "vgpu/fifo_vgpu.h" #include "gk20a/ctxsw_trace_gk20a.h" #include #include -static void vgpu_channel_bind(struct channel_gk20a *ch) +void vgpu_channel_bind(struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_config_params *p = @@ -56,7 +57,7 @@ static void vgpu_channel_bind(struct channel_gk20a *ch) nvgpu_atomic_set(&ch->bound, true); } -static void vgpu_channel_unbind(struct channel_gk20a *ch) +void vgpu_channel_unbind(struct channel_gk20a *ch) { gk20a_dbg_fn(""); @@ -76,7 +77,7 @@ static void vgpu_channel_unbind(struct channel_gk20a *ch) } -static int 
vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch) +int vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_hwctx_params *p = &msg.params.channel_hwctx; @@ -99,7 +100,7 @@ static int vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch) return 0; } -static void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch) +void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_hwctx_params *p = &msg.params.channel_hwctx; @@ -114,7 +115,7 @@ static void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch) WARN_ON(err || msg.ret); } -static void vgpu_channel_enable(struct channel_gk20a *ch) +void vgpu_channel_enable(struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_config_params *p = @@ -130,7 +131,7 @@ static void vgpu_channel_enable(struct channel_gk20a *ch) WARN_ON(err || msg.ret); } -static void vgpu_channel_disable(struct channel_gk20a *ch) +void vgpu_channel_disable(struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_config_params *p = @@ -146,7 +147,7 @@ static void vgpu_channel_disable(struct channel_gk20a *ch) WARN_ON(err || msg.ret); } -static int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base, +int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base, u32 gpfifo_entries, unsigned long acquire_timeout, u32 flags) { @@ -170,7 +171,7 @@ static int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base, return (err || msg.ret) ? -ENOMEM : 0; } -static int vgpu_fifo_init_engine_info(struct fifo_gk20a *f) +int vgpu_fifo_init_engine_info(struct fifo_gk20a *f) { struct vgpu_priv_data *priv = vgpu_get_priv_data(f->g); struct tegra_vgpu_engines_info *engines = &priv->constants.engines_info; @@ -377,7 +378,7 @@ clean_up: return err; } -static int vgpu_init_fifo_setup_hw(struct gk20a *g) +int vgpu_init_fifo_setup_hw(struct gk20a *g) { gk20a_dbg_fn(""); @@ -440,7 +441,7 @@ int vgpu_init_fifo_support(struct gk20a *g) return err; } -static int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid) +int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid) { struct fifo_gk20a *f = &g->fifo; struct channel_gk20a *ch = &f->channel[chid]; @@ -468,7 +469,7 @@ static int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid) return err; } -static int vgpu_fifo_preempt_tsg(struct gk20a *g, u32 tsgid) +int vgpu_fifo_preempt_tsg(struct gk20a *g, u32 tsgid) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_tsg_preempt_params *p = @@ -579,7 +580,7 @@ static int vgpu_fifo_update_runlist_locked(struct gk20a *g, u32 runlist_id, special cases below: runlist->active_channels will NOT be changed. (chid == ~0 && !add) means remove all active channels from runlist. (chid == ~0 && add) means restore all active channels on runlist. 
*/ -static int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id, +int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id, u32 chid, bool add, bool wait_for_finish) { struct fifo_runlist_info_gk20a *runlist = NULL; @@ -599,14 +600,14 @@ static int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id, return ret; } -static int vgpu_fifo_wait_engine_idle(struct gk20a *g) +int vgpu_fifo_wait_engine_idle(struct gk20a *g) { gk20a_dbg_fn(""); return 0; } -static int vgpu_channel_set_priority(struct channel_gk20a *ch, u32 priority) +int vgpu_channel_set_priority(struct channel_gk20a *ch, u32 priority) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_priority_params *p = @@ -646,7 +647,7 @@ static int vgpu_fifo_tsg_set_runlist_interleave(struct gk20a *g, return err ? err : msg.ret; } -static int vgpu_fifo_set_runlist_interleave(struct gk20a *g, +int vgpu_fifo_set_runlist_interleave(struct gk20a *g, u32 id, bool is_tsg, u32 runlist_id, @@ -674,7 +675,7 @@ static int vgpu_fifo_set_runlist_interleave(struct gk20a *g, return err ? err : msg.ret; } -static int vgpu_channel_set_timeslice(struct channel_gk20a *ch, u32 timeslice) +int vgpu_channel_set_timeslice(struct channel_gk20a *ch, u32 timeslice) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_channel_timeslice_params *p = @@ -695,7 +696,7 @@ static int vgpu_channel_set_timeslice(struct channel_gk20a *ch, u32 timeslice) return err; } -static int vgpu_fifo_force_reset_ch(struct channel_gk20a *ch, +int vgpu_fifo_force_reset_ch(struct channel_gk20a *ch, u32 err_code, bool verbose) { struct tsg_gk20a *tsg = NULL; @@ -818,29 +819,3 @@ u32 vgpu_fifo_default_timeslice_us(struct gk20a *g) return priv->constants.default_timeslice_us; } - -void vgpu_init_fifo_ops(struct gpu_ops *gops) -{ - gops->fifo.init_fifo_setup_hw = vgpu_init_fifo_setup_hw; - gops->fifo.bind_channel = vgpu_channel_bind; - gops->fifo.unbind_channel = vgpu_channel_unbind; - gops->fifo.enable_channel = vgpu_channel_enable; - gops->fifo.disable_channel = vgpu_channel_disable; - gops->fifo.alloc_inst = vgpu_channel_alloc_inst; - gops->fifo.free_inst = vgpu_channel_free_inst; - gops->fifo.setup_ramfc = vgpu_channel_setup_ramfc; - gops->fifo.preempt_channel = vgpu_fifo_preempt_channel; - gops->fifo.preempt_tsg = vgpu_fifo_preempt_tsg; - gops->fifo.enable_tsg = gk20a_enable_tsg; - gops->fifo.disable_tsg = gk20a_disable_tsg; - /* Not supported yet for vgpu */ - gops->fifo.tsg_verify_channel_status = NULL; - gops->fifo.update_runlist = vgpu_fifo_update_runlist; - gops->fifo.wait_engine_idle = vgpu_fifo_wait_engine_idle; - gops->fifo.channel_set_priority = vgpu_channel_set_priority; - gops->fifo.set_runlist_interleave = vgpu_fifo_set_runlist_interleave; - gops->fifo.channel_set_timeslice = vgpu_channel_set_timeslice; - gops->fifo.force_reset_ch = vgpu_fifo_force_reset_ch; - gops->fifo.init_engine_info = vgpu_fifo_init_engine_info; - gops->fifo.default_timeslice_us = vgpu_fifo_default_timeslice_us; -} diff --git a/drivers/gpu/nvgpu/vgpu/fifo_vgpu.h b/drivers/gpu/nvgpu/vgpu/fifo_vgpu.h new file mode 100644 index 00000000..c5a51f97 --- /dev/null +++ b/drivers/gpu/nvgpu/vgpu/fifo_vgpu.h @@ -0,0 +1,65 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. 
+ * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER + * DEALINGS IN THE SOFTWARE. + */ + +#ifndef _FIFO_VGPU_H_ +#define _FIFO_VGPU_H_ + +#include + +struct gk20a; +struct channel_gk20a; +struct fifo_gk20a; +struct tsg_gk20a; + +int vgpu_init_fifo_setup_hw(struct gk20a *g); +void vgpu_channel_bind(struct channel_gk20a *ch); +void vgpu_channel_unbind(struct channel_gk20a *ch); +int vgpu_channel_alloc_inst(struct gk20a *g, struct channel_gk20a *ch); +void vgpu_channel_free_inst(struct gk20a *g, struct channel_gk20a *ch); +void vgpu_channel_enable(struct channel_gk20a *ch); +void vgpu_channel_disable(struct channel_gk20a *ch); +int vgpu_channel_setup_ramfc(struct channel_gk20a *ch, u64 gpfifo_base, + u32 gpfifo_entries, + unsigned long acquire_timeout, u32 flags); +int vgpu_fifo_init_engine_info(struct fifo_gk20a *f); +int vgpu_fifo_preempt_channel(struct gk20a *g, u32 chid); +int vgpu_fifo_preempt_tsg(struct gk20a *g, u32 tsgid); +int vgpu_fifo_update_runlist(struct gk20a *g, u32 runlist_id, + u32 chid, bool add, bool wait_for_finish); +int vgpu_fifo_wait_engine_idle(struct gk20a *g); +int vgpu_channel_set_priority(struct channel_gk20a *ch, u32 priority); +int vgpu_fifo_set_runlist_interleave(struct gk20a *g, + u32 id, + bool is_tsg, + u32 runlist_id, + u32 new_level); +int vgpu_channel_set_timeslice(struct channel_gk20a *ch, u32 timeslice); +int vgpu_fifo_force_reset_ch(struct channel_gk20a *ch, + u32 err_code, bool verbose); +u32 vgpu_fifo_default_timeslice_us(struct gk20a *g); +int vgpu_tsg_open(struct tsg_gk20a *tsg); +int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg, + struct channel_gk20a *ch); +int vgpu_tsg_unbind_channel(struct channel_gk20a *ch); +int vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice); + +#endif diff --git a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.c b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.c index 0acafa8e..06962a86 100644 --- a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.c +++ b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015-2016, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. 
* * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -23,7 +23,7 @@ #include "gk20a/gk20a.h" #include "vgpu_gr_gm20b.h" -static int vgpu_gm20b_init_fs_state(struct gk20a *g) +int vgpu_gm20b_init_fs_state(struct gk20a *g) { struct gr_gk20a *gr = &g->gr; u32 tpc_index, gpc_index; @@ -44,8 +44,3 @@ static int vgpu_gm20b_init_fs_state(struct gk20a *g) gr->no_of_sm = sm_id; return 0; } - -void vgpu_gm20b_init_gr_ops(struct gpu_ops *gops) -{ - gops->gr.init_fs_state = vgpu_gm20b_init_fs_state; -} diff --git a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.h b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.h index dda0de7b..993a8f3d 100644 --- a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.h +++ b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_gr_gm20b.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -25,6 +25,6 @@ #include "gk20a/gk20a.h" -void vgpu_gm20b_init_gr_ops(struct gpu_ops *gops); +int vgpu_gm20b_init_fs_state(struct gk20a *g); #endif diff --git a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_hal_gm20b.c b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_hal_gm20b.c index 348510df..618c80f8 100644 --- a/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_hal_gm20b.c +++ b/drivers/gpu/nvgpu/vgpu/gm20b/vgpu_hal_gm20b.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -22,17 +22,582 @@ #include "gm20b/hal_gm20b.h" #include "vgpu/vgpu.h" +#include "vgpu/fifo_vgpu.h" +#include "vgpu/gr_vgpu.h" +#include "vgpu/ltc_vgpu.h" +#include "vgpu/mm_vgpu.h" +#include "vgpu/dbg_vgpu.h" +#include "vgpu/fecs_trace_vgpu.h" +#include "vgpu/css_vgpu.h" #include "vgpu_gr_gm20b.h" +#include "gk20a/bus_gk20a.h" +#include "gk20a/flcn_gk20a.h" +#include "gk20a/mc_gk20a.h" +#include "gk20a/fb_gk20a.h" + +#include "gm20b/gr_gm20b.h" +#include "gm20b/fifo_gm20b.h" +#include "gm20b/acr_gm20b.h" +#include "gm20b/pmu_gm20b.h" +#include "gm20b/fb_gm20b.h" +#include "gm20b/bus_gm20b.h" +#include "gm20b/cde_gm20b.h" +#include "gm20b/regops_gm20b.h" +#include "gm20b/clk_gm20b.h" +#include "gm20b/therm_gm20b.h" +#include "gm20b/mm_gm20b.h" +#include "gm20b/gr_ctx_gm20b.h" +#include "gm20b/gm20b_gating_reglist.h" +#include "gm20b/ltc_gm20b.h" + +#include + +#include +#include +#include +#include + +static const struct gpu_ops vgpu_gm20b_ops = { + .ltc = { + .determine_L2_size_bytes = vgpu_determine_L2_size_bytes, + .set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry, + .set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry, + .init_cbc = gm20b_ltc_init_cbc, + .init_fs_state = vgpu_ltc_init_fs_state, + .init_comptags = vgpu_ltc_init_comptags, + .cbc_ctrl = NULL, + .isr = gm20b_ltc_isr, + .cbc_fix_config = gm20b_ltc_cbc_fix_config, + .flush = gm20b_flush_ltc, + .set_enabled = gm20b_ltc_set_enabled, + }, + .ce2 = { + .isr_stall = gk20a_ce2_isr, + .isr_nonstall = gk20a_ce2_nonstall_isr, + .get_num_pce = vgpu_ce_get_num_pce, + }, + .gr = { + .init_gpc_mmu = gr_gm20b_init_gpc_mmu, + .bundle_cb_defaults = gr_gm20b_bundle_cb_defaults, + .cb_size_default = gr_gm20b_cb_size_default, + 
.calc_global_ctx_buffer_size = + gr_gm20b_calc_global_ctx_buffer_size, + .commit_global_attrib_cb = gr_gm20b_commit_global_attrib_cb, + .commit_global_bundle_cb = gr_gm20b_commit_global_bundle_cb, + .commit_global_cb_manager = gr_gm20b_commit_global_cb_manager, + .commit_global_pagepool = gr_gm20b_commit_global_pagepool, + .handle_sw_method = gr_gm20b_handle_sw_method, + .set_alpha_circular_buffer_size = + gr_gm20b_set_alpha_circular_buffer_size, + .set_circular_buffer_size = gr_gm20b_set_circular_buffer_size, + .enable_hww_exceptions = gr_gk20a_enable_hww_exceptions, + .is_valid_class = gr_gm20b_is_valid_class, + .is_valid_gfx_class = gr_gm20b_is_valid_gfx_class, + .is_valid_compute_class = gr_gm20b_is_valid_compute_class, + .get_sm_dsm_perf_regs = gr_gm20b_get_sm_dsm_perf_regs, + .get_sm_dsm_perf_ctrl_regs = gr_gm20b_get_sm_dsm_perf_ctrl_regs, + .init_fs_state = vgpu_gm20b_init_fs_state, + .set_hww_esr_report_mask = gr_gm20b_set_hww_esr_report_mask, + .falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments, + .load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode, + .set_gpc_tpc_mask = gr_gm20b_set_gpc_tpc_mask, + .get_gpc_tpc_mask = vgpu_gr_get_gpc_tpc_mask, + .free_channel_ctx = vgpu_gr_free_channel_ctx, + .alloc_obj_ctx = vgpu_gr_alloc_obj_ctx, + .bind_ctxsw_zcull = vgpu_gr_bind_ctxsw_zcull, + .get_zcull_info = vgpu_gr_get_zcull_info, + .is_tpc_addr = gr_gm20b_is_tpc_addr, + .get_tpc_num = gr_gm20b_get_tpc_num, + .detect_sm_arch = vgpu_gr_detect_sm_arch, + .add_zbc_color = gr_gk20a_add_zbc_color, + .add_zbc_depth = gr_gk20a_add_zbc_depth, + .zbc_set_table = vgpu_gr_add_zbc, + .zbc_query_table = vgpu_gr_query_zbc, + .pmu_save_zbc = gk20a_pmu_save_zbc, + .add_zbc = gr_gk20a_add_zbc, + .pagepool_default_size = gr_gm20b_pagepool_default_size, + .init_ctx_state = vgpu_gr_init_ctx_state, + .alloc_gr_ctx = vgpu_gr_alloc_gr_ctx, + .free_gr_ctx = vgpu_gr_free_gr_ctx, + .update_ctxsw_preemption_mode = + gr_gm20b_update_ctxsw_preemption_mode, + .dump_gr_regs = NULL, + .update_pc_sampling = gr_gm20b_update_pc_sampling, + .get_fbp_en_mask = vgpu_gr_get_fbp_en_mask, + .get_max_ltc_per_fbp = vgpu_gr_get_max_ltc_per_fbp, + .get_max_lts_per_ltc = vgpu_gr_get_max_lts_per_ltc, + .get_rop_l2_en_mask = vgpu_gr_rop_l2_en_mask, + .get_max_fbps_count = vgpu_gr_get_max_fbps_count, + .init_sm_dsm_reg_info = gr_gm20b_init_sm_dsm_reg_info, + .wait_empty = gr_gk20a_wait_idle, + .init_cyclestats = gr_gm20b_init_cyclestats, + .set_sm_debug_mode = vgpu_gr_set_sm_debug_mode, + .enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs, + .bpt_reg_info = gr_gm20b_bpt_reg_info, + .get_access_map = gr_gm20b_get_access_map, + .handle_fecs_error = gk20a_gr_handle_fecs_error, + .handle_sm_exception = gr_gk20a_handle_sm_exception, + .handle_tex_exception = gr_gk20a_handle_tex_exception, + .enable_gpc_exceptions = gk20a_gr_enable_gpc_exceptions, + .enable_exceptions = gk20a_gr_enable_exceptions, + .get_lrf_tex_ltc_dram_override = NULL, + .update_smpc_ctxsw_mode = vgpu_gr_update_smpc_ctxsw_mode, + .update_hwpm_ctxsw_mode = vgpu_gr_update_hwpm_ctxsw_mode, + .record_sm_error_state = gm20b_gr_record_sm_error_state, + .update_sm_error_state = gm20b_gr_update_sm_error_state, + .clear_sm_error_state = vgpu_gr_clear_sm_error_state, + .suspend_contexts = vgpu_gr_suspend_contexts, + .resume_contexts = vgpu_gr_resume_contexts, + .get_preemption_mode_flags = gr_gm20b_get_preemption_mode_flags, + .fuse_override = gm20b_gr_fuse_override, + .init_sm_id_table = gr_gk20a_init_sm_id_table, + .load_smid_config = gr_gm20b_load_smid_config, + 
.program_sm_id_numbering = gr_gm20b_program_sm_id_numbering, + .is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr, + .is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr, + .split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr, + .split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr, + .setup_rop_mapping = gr_gk20a_setup_rop_mapping, + .program_zcull_mapping = gr_gk20a_program_zcull_mapping, + .commit_global_timeslice = gr_gk20a_commit_global_timeslice, + .commit_inst = vgpu_gr_commit_inst, + .write_zcull_ptr = gr_gk20a_write_zcull_ptr, + .write_pm_ptr = gr_gk20a_write_pm_ptr, + .init_elcg_mode = gr_gk20a_init_elcg_mode, + .load_tpc_mask = gr_gm20b_load_tpc_mask, + .inval_icache = gr_gk20a_inval_icache, + .trigger_suspend = gr_gk20a_trigger_suspend, + .wait_for_pause = gr_gk20a_wait_for_pause, + .resume_from_pause = gr_gk20a_resume_from_pause, + .clear_sm_errors = gr_gk20a_clear_sm_errors, + .tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions, + .get_esr_sm_sel = gk20a_gr_get_esr_sm_sel, + .sm_debugger_attached = gk20a_gr_sm_debugger_attached, + .suspend_single_sm = gk20a_gr_suspend_single_sm, + .suspend_all_sms = gk20a_gr_suspend_all_sms, + .resume_single_sm = gk20a_gr_resume_single_sm, + .resume_all_sms = gk20a_gr_resume_all_sms, + .get_sm_hww_warp_esr = gk20a_gr_get_sm_hww_warp_esr, + .get_sm_hww_global_esr = gk20a_gr_get_sm_hww_global_esr, + .get_sm_no_lock_down_hww_global_esr_mask = + gk20a_gr_get_sm_no_lock_down_hww_global_esr_mask, + .lock_down_sm = gk20a_gr_lock_down_sm, + .wait_for_sm_lock_down = gk20a_gr_wait_for_sm_lock_down, + .clear_sm_hww = gm20b_gr_clear_sm_hww, + .init_ovr_sm_dsm_perf = gk20a_gr_init_ovr_sm_dsm_perf, + .get_ovr_perf_regs = gk20a_gr_get_ovr_perf_regs, + .disable_rd_coalesce = gm20a_gr_disable_rd_coalesce, + .init_ctxsw_hdr_data = gk20a_gr_init_ctxsw_hdr_data, + .set_boosted_ctx = NULL, + .update_boosted_ctx = NULL, + }, + .fb = { + .reset = fb_gk20a_reset, + .init_hw = gk20a_fb_init_hw, + .init_fs_state = fb_gm20b_init_fs_state, + .set_mmu_page_size = gm20b_fb_set_mmu_page_size, + .set_use_full_comp_tag_line = + gm20b_fb_set_use_full_comp_tag_line, + .compression_page_size = gm20b_fb_compression_page_size, + .compressible_page_size = gm20b_fb_compressible_page_size, + .vpr_info_fetch = gm20b_fb_vpr_info_fetch, + .dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info, + .read_wpr_info = gm20b_fb_read_wpr_info, + .is_debug_mode_enabled = NULL, + .set_debug_mode = vgpu_mm_mmu_set_debug_mode, + .tlb_invalidate = vgpu_mm_tlb_invalidate, + }, + .clock_gating = { + .slcg_bus_load_gating_prod = + gm20b_slcg_bus_load_gating_prod, + .slcg_ce2_load_gating_prod = + gm20b_slcg_ce2_load_gating_prod, + .slcg_chiplet_load_gating_prod = + gm20b_slcg_chiplet_load_gating_prod, + .slcg_ctxsw_firmware_load_gating_prod = + gm20b_slcg_ctxsw_firmware_load_gating_prod, + .slcg_fb_load_gating_prod = + gm20b_slcg_fb_load_gating_prod, + .slcg_fifo_load_gating_prod = + gm20b_slcg_fifo_load_gating_prod, + .slcg_gr_load_gating_prod = + gr_gm20b_slcg_gr_load_gating_prod, + .slcg_ltc_load_gating_prod = + ltc_gm20b_slcg_ltc_load_gating_prod, + .slcg_perf_load_gating_prod = + gm20b_slcg_perf_load_gating_prod, + .slcg_priring_load_gating_prod = + gm20b_slcg_priring_load_gating_prod, + .slcg_pmu_load_gating_prod = + gm20b_slcg_pmu_load_gating_prod, + .slcg_therm_load_gating_prod = + gm20b_slcg_therm_load_gating_prod, + .slcg_xbar_load_gating_prod = + gm20b_slcg_xbar_load_gating_prod, + .blcg_bus_load_gating_prod = + gm20b_blcg_bus_load_gating_prod, + .blcg_ctxsw_firmware_load_gating_prod 
= + gm20b_blcg_ctxsw_firmware_load_gating_prod, + .blcg_fb_load_gating_prod = + gm20b_blcg_fb_load_gating_prod, + .blcg_fifo_load_gating_prod = + gm20b_blcg_fifo_load_gating_prod, + .blcg_gr_load_gating_prod = + gm20b_blcg_gr_load_gating_prod, + .blcg_ltc_load_gating_prod = + gm20b_blcg_ltc_load_gating_prod, + .blcg_pwr_csb_load_gating_prod = + gm20b_blcg_pwr_csb_load_gating_prod, + .blcg_xbar_load_gating_prod = + gm20b_blcg_xbar_load_gating_prod, + .blcg_pmu_load_gating_prod = + gm20b_blcg_pmu_load_gating_prod, + .pg_gr_load_gating_prod = + gr_gm20b_pg_gr_load_gating_prod, + }, + .fifo = { + .init_fifo_setup_hw = vgpu_init_fifo_setup_hw, + .bind_channel = vgpu_channel_bind, + .unbind_channel = vgpu_channel_unbind, + .disable_channel = vgpu_channel_disable, + .enable_channel = vgpu_channel_enable, + .alloc_inst = vgpu_channel_alloc_inst, + .free_inst = vgpu_channel_free_inst, + .setup_ramfc = vgpu_channel_setup_ramfc, + .channel_set_priority = vgpu_channel_set_priority, + .channel_set_timeslice = vgpu_channel_set_timeslice, + .default_timeslice_us = vgpu_fifo_default_timeslice_us, + .setup_userd = gk20a_fifo_setup_userd, + .userd_gp_get = gk20a_fifo_userd_gp_get, + .userd_gp_put = gk20a_fifo_userd_gp_put, + .userd_pb_get = gk20a_fifo_userd_pb_get, + .pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val, + .preempt_channel = vgpu_fifo_preempt_channel, + .preempt_tsg = vgpu_fifo_preempt_tsg, + .enable_tsg = gk20a_enable_tsg, + .disable_tsg = gk20a_disable_tsg, + .tsg_verify_channel_status = NULL, + .tsg_verify_status_ctx_reload = gm20b_fifo_tsg_verify_status_ctx_reload, + .update_runlist = vgpu_fifo_update_runlist, + .trigger_mmu_fault = gm20b_fifo_trigger_mmu_fault, + .get_mmu_fault_info = gk20a_fifo_get_mmu_fault_info, + .wait_engine_idle = vgpu_fifo_wait_engine_idle, + .get_num_fifos = gm20b_fifo_get_num_fifos, + .get_pbdma_signature = gk20a_fifo_get_pbdma_signature, + .set_runlist_interleave = vgpu_fifo_set_runlist_interleave, + .tsg_set_timeslice = vgpu_tsg_set_timeslice, + .tsg_open = vgpu_tsg_open, + .force_reset_ch = vgpu_fifo_force_reset_ch, + .engine_enum_from_type = gk20a_fifo_engine_enum_from_type, + .device_info_data_parse = gm20b_device_info_data_parse, + .eng_runlist_base_size = fifo_eng_runlist_base__size_1_v, + .init_engine_info = vgpu_fifo_init_engine_info, + .runlist_entry_size = ram_rl_entry_size_v, + .get_tsg_runlist_entry = gk20a_get_tsg_runlist_entry, + .get_ch_runlist_entry = gk20a_get_ch_runlist_entry, + .is_fault_engine_subid_gpc = gk20a_is_fault_engine_subid_gpc, + .dump_pbdma_status = gk20a_dump_pbdma_status, + .dump_eng_status = gk20a_dump_eng_status, + .dump_channel_status_ramfc = gk20a_dump_channel_status_ramfc, + .intr_0_error_mask = gk20a_fifo_intr_0_error_mask, + .is_preempt_pending = gk20a_fifo_is_preempt_pending, + .init_pbdma_intr_descs = gm20b_fifo_init_pbdma_intr_descs, + .reset_enable_hw = gk20a_init_fifo_reset_enable_hw, + .teardown_ch_tsg = gk20a_fifo_teardown_ch_tsg, + .handle_sched_error = gk20a_fifo_handle_sched_error, + .handle_pbdma_intr_0 = gk20a_fifo_handle_pbdma_intr_0, + .handle_pbdma_intr_1 = gk20a_fifo_handle_pbdma_intr_1, + .tsg_bind_channel = vgpu_tsg_bind_channel, + .tsg_unbind_channel = vgpu_tsg_unbind_channel, +#ifdef CONFIG_TEGRA_GK20A_NVHOST + .alloc_syncpt_buf = gk20a_fifo_alloc_syncpt_buf, + .free_syncpt_buf = gk20a_fifo_free_syncpt_buf, + .add_syncpt_wait_cmd = gk20a_fifo_add_syncpt_wait_cmd, + .get_syncpt_wait_cmd_size = gk20a_fifo_get_syncpt_wait_cmd_size, + .add_syncpt_incr_cmd = gk20a_fifo_add_syncpt_incr_cmd, + 
.get_syncpt_incr_cmd_size = gk20a_fifo_get_syncpt_incr_cmd_size, +#endif + }, + .gr_ctx = { + .get_netlist_name = gr_gm20b_get_netlist_name, + .is_fw_defined = gr_gm20b_is_firmware_defined, + }, + .mm = { + .support_sparse = gm20b_mm_support_sparse, + .gmmu_map = vgpu_locked_gmmu_map, + .gmmu_unmap = vgpu_locked_gmmu_unmap, + .vm_bind_channel = vgpu_vm_bind_channel, + .fb_flush = vgpu_mm_fb_flush, + .l2_invalidate = vgpu_mm_l2_invalidate, + .l2_flush = vgpu_mm_l2_flush, + .cbc_clean = gk20a_mm_cbc_clean, + .set_big_page_size = gm20b_mm_set_big_page_size, + .get_big_page_sizes = gm20b_mm_get_big_page_sizes, + .get_default_big_page_size = gm20b_mm_get_default_big_page_size, + .gpu_phys_addr = gm20b_gpu_phys_addr, + .get_iommu_bit = gk20a_mm_get_iommu_bit, + .get_mmu_levels = gk20a_mm_get_mmu_levels, + .init_pdb = gk20a_mm_init_pdb, + .init_mm_setup_hw = NULL, + .is_bar1_supported = gm20b_mm_is_bar1_supported, + .init_inst_block = gk20a_init_inst_block, + .mmu_fault_pending = gk20a_fifo_mmu_fault_pending, + }, + .therm = { + .init_therm_setup_hw = gm20b_init_therm_setup_hw, + .elcg_init_idle_filters = gk20a_elcg_init_idle_filters, + }, + .pmu = { + .pmu_setup_elpg = gm20b_pmu_setup_elpg, + .pmu_get_queue_head = pwr_pmu_queue_head_r, + .pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v, + .pmu_get_queue_tail = pwr_pmu_queue_tail_r, + .pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v, + .pmu_queue_head = gk20a_pmu_queue_head, + .pmu_queue_tail = gk20a_pmu_queue_tail, + .pmu_msgq_tail = gk20a_pmu_msgq_tail, + .pmu_mutex_size = pwr_pmu_mutex__size_1_v, + .pmu_mutex_acquire = gk20a_pmu_mutex_acquire, + .pmu_mutex_release = gk20a_pmu_mutex_release, + .write_dmatrfbase = gm20b_write_dmatrfbase, + .pmu_elpg_statistics = gk20a_pmu_elpg_statistics, + .pmu_pg_init_param = NULL, + .pmu_pg_supported_engines_list = gk20a_pmu_pg_engines_list, + .pmu_pg_engines_feature_list = gk20a_pmu_pg_feature_list, + .pmu_is_lpwr_feature_supported = NULL, + .pmu_lpwr_enable_pg = NULL, + .pmu_lpwr_disable_pg = NULL, + .pmu_pg_param_post_init = NULL, + .dump_secure_fuses = pmu_dump_security_fuses_gm20b, + .reset_engine = gk20a_pmu_engine_reset, + .is_engine_in_reset = gk20a_pmu_is_engine_in_reset, + }, + .clk = { + .init_clk_support = gm20b_init_clk_support, + .suspend_clk_support = gm20b_suspend_clk_support, +#ifdef CONFIG_DEBUG_FS + .init_debugfs = gm20b_clk_init_debugfs, +#endif + .get_voltage = gm20b_clk_get_voltage, + .get_gpcclk_clock_counter = gm20b_clk_get_gpcclk_clock_counter, + .pll_reg_write = gm20b_clk_pll_reg_write, + .get_pll_debug_data = gm20b_clk_get_pll_debug_data, + }, + .regops = { + .get_global_whitelist_ranges = + gm20b_get_global_whitelist_ranges, + .get_global_whitelist_ranges_count = + gm20b_get_global_whitelist_ranges_count, + .get_context_whitelist_ranges = + gm20b_get_context_whitelist_ranges, + .get_context_whitelist_ranges_count = + gm20b_get_context_whitelist_ranges_count, + .get_runcontrol_whitelist = gm20b_get_runcontrol_whitelist, + .get_runcontrol_whitelist_count = + gm20b_get_runcontrol_whitelist_count, + .get_runcontrol_whitelist_ranges = + gm20b_get_runcontrol_whitelist_ranges, + .get_runcontrol_whitelist_ranges_count = + gm20b_get_runcontrol_whitelist_ranges_count, + .get_qctl_whitelist = gm20b_get_qctl_whitelist, + .get_qctl_whitelist_count = gm20b_get_qctl_whitelist_count, + .get_qctl_whitelist_ranges = gm20b_get_qctl_whitelist_ranges, + .get_qctl_whitelist_ranges_count = + gm20b_get_qctl_whitelist_ranges_count, + .apply_smpc_war = gm20b_apply_smpc_war, + }, + .mc = { + 
.intr_enable = mc_gk20a_intr_enable, + .intr_unit_config = mc_gk20a_intr_unit_config, + .isr_stall = mc_gk20a_isr_stall, + .intr_stall = mc_gk20a_intr_stall, + .intr_stall_pause = mc_gk20a_intr_stall_pause, + .intr_stall_resume = mc_gk20a_intr_stall_resume, + .intr_nonstall = mc_gk20a_intr_nonstall, + .intr_nonstall_pause = mc_gk20a_intr_nonstall_pause, + .intr_nonstall_resume = mc_gk20a_intr_nonstall_resume, + .enable = gk20a_mc_enable, + .disable = gk20a_mc_disable, + .reset = gk20a_mc_reset, + .boot_0 = gk20a_mc_boot_0, + .is_intr1_pending = mc_gk20a_is_intr1_pending, + }, + .debug = { + .show_dump = NULL, + }, + .dbg_session_ops = { + .exec_reg_ops = vgpu_exec_regops, + .dbg_set_powergate = vgpu_dbg_set_powergate, + .check_and_set_global_reservation = + vgpu_check_and_set_global_reservation, + .check_and_set_context_reservation = + vgpu_check_and_set_context_reservation, + .release_profiler_reservation = + vgpu_release_profiler_reservation, + .perfbuffer_enable = vgpu_perfbuffer_enable, + .perfbuffer_disable = vgpu_perfbuffer_disable, + }, + .cde = { + .get_program_numbers = gm20b_cde_get_program_numbers, + }, + .bus = { + .init_hw = gk20a_bus_init_hw, + .isr = gk20a_bus_isr, + .read_ptimer = vgpu_read_ptimer, + .get_timestamps_zipper = vgpu_get_timestamps_zipper, + .bar1_bind = gm20b_bus_bar1_bind, + }, +#if defined(CONFIG_GK20A_CYCLE_STATS) + .css = { + .enable_snapshot = vgpu_css_enable_snapshot_buffer, + .disable_snapshot = vgpu_css_release_snapshot_buffer, + .check_data_available = vgpu_css_flush_snapshots, + .detach_snapshot = vgpu_css_detach, + .set_handled_snapshots = NULL, + .allocate_perfmon_ids = NULL, + .release_perfmon_ids = NULL, + }, +#endif + .falcon = { + .falcon_hal_sw_init = gk20a_falcon_hal_sw_init, + }, + .priv_ring = { + .isr = gk20a_priv_ring_isr, + }, + .chip_init_gpu_characteristics = vgpu_init_gpu_characteristics, + .get_litter_value = gm20b_get_litter_value, +}; + int vgpu_gm20b_init_hal(struct gk20a *g) { - int err; + struct gpu_ops *gops = &g->ops; + struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics; + u32 val; + + gops->ltc = vgpu_gm20b_ops.ltc; + gops->ce2 = vgpu_gm20b_ops.ce2; + gops->gr = vgpu_gm20b_ops.gr; + gops->fb = vgpu_gm20b_ops.fb; + gops->clock_gating = vgpu_gm20b_ops.clock_gating; + gops->fifo = vgpu_gm20b_ops.fifo; + gops->gr_ctx = vgpu_gm20b_ops.gr_ctx; + gops->mm = vgpu_gm20b_ops.mm; + gops->therm = vgpu_gm20b_ops.therm; + gops->pmu = vgpu_gm20b_ops.pmu; + /* + * clk must be assigned member by member + * since some clk ops are assigned during probe prior to HAL init + */ + gops->clk.init_clk_support = vgpu_gm20b_ops.clk.init_clk_support; + gops->clk.suspend_clk_support = vgpu_gm20b_ops.clk.suspend_clk_support; + gops->clk.get_voltage = vgpu_gm20b_ops.clk.get_voltage; + gops->clk.get_gpcclk_clock_counter = + vgpu_gm20b_ops.clk.get_gpcclk_clock_counter; + gops->clk.pll_reg_write = vgpu_gm20b_ops.clk.pll_reg_write; + gops->clk.get_pll_debug_data = vgpu_gm20b_ops.clk.get_pll_debug_data; + + gops->regops = vgpu_gm20b_ops.regops; + gops->mc = vgpu_gm20b_ops.mc; + gops->dbg_session_ops = vgpu_gm20b_ops.dbg_session_ops; + gops->debug = vgpu_gm20b_ops.debug; + gops->cde = vgpu_gm20b_ops.cde; + gops->bus = vgpu_gm20b_ops.bus; +#if defined(CONFIG_GK20A_CYCLE_STATS) + gops->css = vgpu_gm20b_ops.css; +#endif + gops->falcon = vgpu_gm20b_ops.falcon; + + gops->priv_ring = vgpu_gm20b_ops.priv_ring; + + /* Lone functions */ + gops->chip_init_gpu_characteristics = + vgpu_gm20b_ops.chip_init_gpu_characteristics; + gops->get_litter_value = 
vgpu_gm20b_ops.get_litter_value; + + __nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false); + __nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false); + +#ifdef CONFIG_TEGRA_ACR + if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + } else { + val = gk20a_readl(g, fuse_opt_priv_sec_en_r()); + if (!val) { + gk20a_dbg_info("priv security is disabled in HW"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + } else { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + } + } +#else + if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) { + gk20a_dbg_info("running ASIM with PRIV security disabled"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + } else { + val = gk20a_readl(g, fuse_opt_priv_sec_en_r()); + if (!val) { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + } else { + gk20a_dbg_info("priv security is not supported but enabled"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + return -EPERM; + } + } +#endif + + /* priv security dependent ops */ + if (nvgpu_is_enabled(g, NVGPU_SEC_PRIVSECURITY)) { + /* Add in ops from gm20b acr */ + gops->pmu.is_pmu_supported = gm20b_is_pmu_supported; + gops->pmu.prepare_ucode = prepare_ucode_blob; + gops->pmu.pmu_setup_hw_and_bootstrap = gm20b_bootstrap_hs_flcn; + gops->pmu.is_lazy_bootstrap = gm20b_is_lazy_bootstrap; + gops->pmu.is_priv_load = gm20b_is_priv_load; + gops->pmu.get_wpr = gm20b_wpr_info; + gops->pmu.alloc_blob_space = gm20b_alloc_blob_space; + gops->pmu.pmu_populate_loader_cfg = + gm20b_pmu_populate_loader_cfg; + gops->pmu.flcn_populate_bl_dmem_desc = + gm20b_flcn_populate_bl_dmem_desc; + gops->pmu.falcon_wait_for_halt = pmu_wait_for_halt; + gops->pmu.falcon_clear_halt_interrupt_status = + clear_halt_interrupt_status; + gops->pmu.init_falcon_setup_hw = gm20b_init_pmu_setup_hw1; + + gops->pmu.init_wpr_region = gm20b_pmu_init_acr; + gops->pmu.load_lsfalcon_ucode = gm20b_load_falcon_ucode; + + gops->gr.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode; + } else { + /* Inherit from gk20a */ + gops->pmu.is_pmu_supported = gk20a_is_pmu_supported; + gops->pmu.prepare_ucode = nvgpu_pmu_prepare_ns_ucode_blob; + gops->pmu.pmu_setup_hw_and_bootstrap = gk20a_init_pmu_setup_hw1; + gops->pmu.pmu_nsbootstrap = pmu_bootstrap; + + gops->pmu.load_lsfalcon_ucode = NULL; + gops->pmu.init_wpr_region = NULL; + + gops->gr.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode; + } + + __nvgpu_set_enabled(g, NVGPU_PMU_FECS_BOOTSTRAP_DONE, false); + g->pmu_lsf_pmu_wpr_init_done = 0; + g->bootstrap_owner = LSF_BOOTSTRAP_OWNER_DEFAULT; + + gm20b_init_uncompressed_kind_map(); + gm20b_init_kind_attr(); + + g->name = "gm20b"; - err = gm20b_init_hal(g); - if (err) - return err; - vgpu_init_hal_common(g); - vgpu_gm20b_init_gr_ops(&g->ops); + c->twod_class = FERMI_TWOD_A; + c->threed_class = MAXWELL_B; + c->compute_class = MAXWELL_COMPUTE_B; + c->gpfifo_class = MAXWELL_CHANNEL_GPFIFO_A; + c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B; + c->dma_copy_class = MAXWELL_DMA_COPY_A; return 0; } diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_fifo_gp10b.h b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_fifo_gp10b.h deleted file mode 100644 index 8dd016aa..00000000 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_fifo_gp10b.h +++ /dev/null @@ -1,30 +0,0 @@ -/* - * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. 
- * - * Permission is hereby granted, free of charge, to any person obtaining a - * copy of this software and associated documentation files (the "Software"), - * to deal in the Software without restriction, including without limitation - * the rights to use, copy, modify, merge, publish, distribute, sublicense, - * and/or sell copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following conditions: - * - * The above copyright notice and this permission notice shall be included in - * all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR - * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, - * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL - * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER - * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER - * DEALINGS IN THE SOFTWARE. - */ - -#ifndef __VGPU_FIFO_GP10B_H__ -#define __VGPU_FIFO_GP10B_H__ - -#include "gk20a/gk20a.h" - -void vgpu_gp10b_init_fifo_ops(struct gpu_ops *gops); - -#endif diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.c b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.c index ec2fcd8e..fa6109ad 100644 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.c +++ b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.c @@ -31,7 +31,7 @@ #include -static void vgpu_gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm, +void vgpu_gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm, struct gr_ctx_desc *gr_ctx) { struct tegra_vgpu_cmd_msg msg = {0}; @@ -59,7 +59,7 @@ static void vgpu_gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm, nvgpu_kfree(g, gr_ctx); } -static int vgpu_gr_gp10b_alloc_gr_ctx(struct gk20a *g, +int vgpu_gr_gp10b_alloc_gr_ctx(struct gk20a *g, struct gr_ctx_desc **__gr_ctx, struct vm_gk20a *vm, u32 class, @@ -115,7 +115,7 @@ fail: return err; } -static int vgpu_gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g, +int vgpu_gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g, struct gr_ctx_desc *gr_ctx, struct vm_gk20a *vm, u32 class, u32 graphics_preempt_mode, @@ -267,7 +267,7 @@ fail: return err; } -static int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch, +int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch, u32 graphics_preempt_mode, u32 compute_preempt_mode) { @@ -316,7 +316,7 @@ static int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch, return err; } -static int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g) +int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); int err; @@ -334,14 +334,3 @@ static int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g) return 0; } - -void vgpu_gp10b_init_gr_ops(struct gpu_ops *gops) -{ - vgpu_gm20b_init_gr_ops(gops); - gops->gr.alloc_gr_ctx = vgpu_gr_gp10b_alloc_gr_ctx; - gops->gr.free_gr_ctx = vgpu_gr_gp10b_free_gr_ctx; - gops->gr.init_ctx_state = vgpu_gr_gp10b_init_ctx_state; - gops->gr.set_preemption_mode = vgpu_gr_gp10b_set_preemption_mode; - gops->gr.set_ctxsw_preemption_mode = - vgpu_gr_gp10b_set_ctxsw_preemption_mode; -} diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.h b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.h index 9505749e..baf5a8e9 100644 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.h +++ b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_gr_gp10b.h @@ -1,5 +1,5 @@ /* - * 
Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -25,6 +25,21 @@ #include "gk20a/gk20a.h" -void vgpu_gp10b_init_gr_ops(struct gpu_ops *gops); +void vgpu_gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm, + struct gr_ctx_desc *gr_ctx); +int vgpu_gr_gp10b_alloc_gr_ctx(struct gk20a *g, + struct gr_ctx_desc **__gr_ctx, + struct vm_gk20a *vm, + u32 class, + u32 flags); +int vgpu_gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g, + struct gr_ctx_desc *gr_ctx, + struct vm_gk20a *vm, u32 class, + u32 graphics_preempt_mode, + u32 compute_preempt_mode); +int vgpu_gr_gp10b_set_preemption_mode(struct channel_gk20a *ch, + u32 graphics_preempt_mode, + u32 compute_preempt_mode); +int vgpu_gr_gp10b_init_ctx_state(struct gk20a *g); #endif diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_hal_gp10b.c b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_hal_gp10b.c index 8a367f94..aae74e3f 100644 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_hal_gp10b.c +++ b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_hal_gp10b.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -21,24 +21,626 @@ */ #include "vgpu/vgpu.h" +#include "vgpu/fifo_vgpu.h" +#include "vgpu/gr_vgpu.h" +#include "vgpu/ltc_vgpu.h" +#include "vgpu/mm_vgpu.h" +#include "vgpu/dbg_vgpu.h" +#include "vgpu/fecs_trace_vgpu.h" +#include "vgpu/css_vgpu.h" +#include "gp10b/gp10b.h" #include "gp10b/hal_gp10b.h" +#include "vgpu/gm20b/vgpu_gr_gm20b.h" #include "vgpu_gr_gp10b.h" -#include "vgpu_fifo_gp10b.h" #include "vgpu_mm_gp10b.h" +#include "gk20a/bus_gk20a.h" +#include "gk20a/pramin_gk20a.h" +#include "gk20a/flcn_gk20a.h" +#include "gk20a/mc_gk20a.h" +#include "gk20a/fb_gk20a.h" + +#include "gp10b/mc_gp10b.h" +#include "gp10b/ltc_gp10b.h" +#include "gp10b/mm_gp10b.h" +#include "gp10b/ce_gp10b.h" +#include "gp10b/fb_gp10b.h" +#include "gp10b/pmu_gp10b.h" +#include "gp10b/gr_ctx_gp10b.h" +#include "gp10b/fifo_gp10b.h" +#include "gp10b/gp10b_gating_reglist.h" +#include "gp10b/regops_gp10b.h" +#include "gp10b/cde_gp10b.h" +#include "gp10b/therm_gp10b.h" +#include "gp10b/priv_ring_gp10b.h" + +#include "gm20b/ltc_gm20b.h" +#include "gm20b/gr_gm20b.h" +#include "gm20b/fifo_gm20b.h" +#include "gm20b/acr_gm20b.h" +#include "gm20b/pmu_gm20b.h" +#include "gm20b/fb_gm20b.h" +#include "gm20b/mm_gm20b.h" + +#include + +#include +#include +#include +#include +#include +#include + +static const struct gpu_ops vgpu_gp10b_ops = { + .ltc = { + .determine_L2_size_bytes = vgpu_determine_L2_size_bytes, + .set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry, + .set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry, + .init_cbc = gm20b_ltc_init_cbc, + .init_fs_state = vgpu_ltc_init_fs_state, + .init_comptags = vgpu_ltc_init_comptags, + .cbc_ctrl = NULL, + .isr = gp10b_ltc_isr, + .cbc_fix_config = gm20b_ltc_cbc_fix_config, + .flush = gm20b_flush_ltc, + .set_enabled = gp10b_ltc_set_enabled, + }, + .ce2 = { + .isr_stall = gp10b_ce_isr, + .isr_nonstall = gp10b_ce_nonstall_isr, + .get_num_pce = vgpu_ce_get_num_pce, + }, + .gr = { + .init_gpc_mmu = gr_gm20b_init_gpc_mmu, + .bundle_cb_defaults = gr_gm20b_bundle_cb_defaults, + 
.cb_size_default = gr_gp10b_cb_size_default, + .calc_global_ctx_buffer_size = + gr_gp10b_calc_global_ctx_buffer_size, + .commit_global_attrib_cb = gr_gp10b_commit_global_attrib_cb, + .commit_global_bundle_cb = gr_gp10b_commit_global_bundle_cb, + .commit_global_cb_manager = gr_gp10b_commit_global_cb_manager, + .commit_global_pagepool = gr_gp10b_commit_global_pagepool, + .handle_sw_method = gr_gp10b_handle_sw_method, + .set_alpha_circular_buffer_size = + gr_gp10b_set_alpha_circular_buffer_size, + .set_circular_buffer_size = gr_gp10b_set_circular_buffer_size, + .enable_hww_exceptions = gr_gk20a_enable_hww_exceptions, + .is_valid_class = gr_gp10b_is_valid_class, + .is_valid_gfx_class = gr_gp10b_is_valid_gfx_class, + .is_valid_compute_class = gr_gp10b_is_valid_compute_class, + .get_sm_dsm_perf_regs = gr_gm20b_get_sm_dsm_perf_regs, + .get_sm_dsm_perf_ctrl_regs = gr_gm20b_get_sm_dsm_perf_ctrl_regs, + .init_fs_state = vgpu_gm20b_init_fs_state, + .set_hww_esr_report_mask = gr_gm20b_set_hww_esr_report_mask, + .falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments, + .load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode, + .set_gpc_tpc_mask = gr_gp10b_set_gpc_tpc_mask, + .get_gpc_tpc_mask = vgpu_gr_get_gpc_tpc_mask, + .free_channel_ctx = vgpu_gr_free_channel_ctx, + .alloc_obj_ctx = vgpu_gr_alloc_obj_ctx, + .bind_ctxsw_zcull = vgpu_gr_bind_ctxsw_zcull, + .get_zcull_info = vgpu_gr_get_zcull_info, + .is_tpc_addr = gr_gm20b_is_tpc_addr, + .get_tpc_num = gr_gm20b_get_tpc_num, + .detect_sm_arch = vgpu_gr_detect_sm_arch, + .add_zbc_color = gr_gp10b_add_zbc_color, + .add_zbc_depth = gr_gp10b_add_zbc_depth, + .zbc_set_table = vgpu_gr_add_zbc, + .zbc_query_table = vgpu_gr_query_zbc, + .pmu_save_zbc = gk20a_pmu_save_zbc, + .add_zbc = gr_gk20a_add_zbc, + .pagepool_default_size = gr_gp10b_pagepool_default_size, + .init_ctx_state = vgpu_gr_gp10b_init_ctx_state, + .alloc_gr_ctx = vgpu_gr_gp10b_alloc_gr_ctx, + .free_gr_ctx = vgpu_gr_gp10b_free_gr_ctx, + .update_ctxsw_preemption_mode = + gr_gp10b_update_ctxsw_preemption_mode, + .dump_gr_regs = NULL, + .update_pc_sampling = gr_gm20b_update_pc_sampling, + .get_fbp_en_mask = vgpu_gr_get_fbp_en_mask, + .get_max_ltc_per_fbp = vgpu_gr_get_max_ltc_per_fbp, + .get_max_lts_per_ltc = vgpu_gr_get_max_lts_per_ltc, + .get_rop_l2_en_mask = vgpu_gr_rop_l2_en_mask, + .get_max_fbps_count = vgpu_gr_get_max_fbps_count, + .init_sm_dsm_reg_info = gr_gm20b_init_sm_dsm_reg_info, + .wait_empty = gr_gp10b_wait_empty, + .init_cyclestats = gr_gp10b_init_cyclestats, + .set_sm_debug_mode = vgpu_gr_set_sm_debug_mode, + .enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs, + .bpt_reg_info = gr_gm20b_bpt_reg_info, + .get_access_map = gr_gp10b_get_access_map, + .handle_fecs_error = gr_gp10b_handle_fecs_error, + .handle_sm_exception = gr_gp10b_handle_sm_exception, + .handle_tex_exception = gr_gp10b_handle_tex_exception, + .enable_gpc_exceptions = gk20a_gr_enable_gpc_exceptions, + .enable_exceptions = gk20a_gr_enable_exceptions, + .get_lrf_tex_ltc_dram_override = get_ecc_override_val, + .update_smpc_ctxsw_mode = vgpu_gr_update_smpc_ctxsw_mode, + .update_hwpm_ctxsw_mode = vgpu_gr_update_hwpm_ctxsw_mode, + .record_sm_error_state = gm20b_gr_record_sm_error_state, + .update_sm_error_state = gm20b_gr_update_sm_error_state, + .clear_sm_error_state = vgpu_gr_clear_sm_error_state, + .suspend_contexts = vgpu_gr_suspend_contexts, + .resume_contexts = vgpu_gr_resume_contexts, + .get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags, + .fuse_override = gp10b_gr_fuse_override, + .init_sm_id_table = 
gr_gk20a_init_sm_id_table, + .load_smid_config = gr_gp10b_load_smid_config, + .program_sm_id_numbering = gr_gm20b_program_sm_id_numbering, + .is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr, + .is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr, + .split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr, + .split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr, + .setup_rop_mapping = gr_gk20a_setup_rop_mapping, + .program_zcull_mapping = gr_gk20a_program_zcull_mapping, + .commit_global_timeslice = gr_gk20a_commit_global_timeslice, + .commit_inst = vgpu_gr_commit_inst, + .write_zcull_ptr = gr_gk20a_write_zcull_ptr, + .write_pm_ptr = gr_gk20a_write_pm_ptr, + .init_elcg_mode = gr_gk20a_init_elcg_mode, + .load_tpc_mask = gr_gm20b_load_tpc_mask, + .inval_icache = gr_gk20a_inval_icache, + .trigger_suspend = gr_gk20a_trigger_suspend, + .wait_for_pause = gr_gk20a_wait_for_pause, + .resume_from_pause = gr_gk20a_resume_from_pause, + .clear_sm_errors = gr_gk20a_clear_sm_errors, + .tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions, + .get_esr_sm_sel = gk20a_gr_get_esr_sm_sel, + .sm_debugger_attached = gk20a_gr_sm_debugger_attached, + .suspend_single_sm = gk20a_gr_suspend_single_sm, + .suspend_all_sms = gk20a_gr_suspend_all_sms, + .resume_single_sm = gk20a_gr_resume_single_sm, + .resume_all_sms = gk20a_gr_resume_all_sms, + .get_sm_hww_warp_esr = gp10b_gr_get_sm_hww_warp_esr, + .get_sm_hww_global_esr = gk20a_gr_get_sm_hww_global_esr, + .get_sm_no_lock_down_hww_global_esr_mask = + gk20a_gr_get_sm_no_lock_down_hww_global_esr_mask, + .lock_down_sm = gk20a_gr_lock_down_sm, + .wait_for_sm_lock_down = gk20a_gr_wait_for_sm_lock_down, + .clear_sm_hww = gm20b_gr_clear_sm_hww, + .init_ovr_sm_dsm_perf = gk20a_gr_init_ovr_sm_dsm_perf, + .get_ovr_perf_regs = gk20a_gr_get_ovr_perf_regs, + .disable_rd_coalesce = gm20a_gr_disable_rd_coalesce, + .set_boosted_ctx = NULL, + .set_preemption_mode = vgpu_gr_gp10b_set_preemption_mode, + .set_czf_bypass = gr_gp10b_set_czf_bypass, + .pre_process_sm_exception = gr_gp10b_pre_process_sm_exception, + .set_preemption_buffer_va = gr_gp10b_set_preemption_buffer_va, + .init_preemption_state = gr_gp10b_init_preemption_state, + .update_boosted_ctx = NULL, + .set_bes_crop_debug3 = gr_gp10b_set_bes_crop_debug3, + .create_gr_sysfs = gr_gp10b_create_sysfs, + .set_ctxsw_preemption_mode = + vgpu_gr_gp10b_set_ctxsw_preemption_mode, + .init_ctxsw_hdr_data = gr_gp10b_init_ctxsw_hdr_data, + }, + .fb = { + .reset = fb_gk20a_reset, + .init_hw = gk20a_fb_init_hw, + .init_fs_state = fb_gm20b_init_fs_state, + .set_mmu_page_size = gm20b_fb_set_mmu_page_size, + .set_use_full_comp_tag_line = + gm20b_fb_set_use_full_comp_tag_line, + .compression_page_size = gp10b_fb_compression_page_size, + .compressible_page_size = gp10b_fb_compressible_page_size, + .vpr_info_fetch = gm20b_fb_vpr_info_fetch, + .dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info, + .read_wpr_info = gm20b_fb_read_wpr_info, + .is_debug_mode_enabled = NULL, + .set_debug_mode = vgpu_mm_mmu_set_debug_mode, + .tlb_invalidate = vgpu_mm_tlb_invalidate, + }, + .clock_gating = { + .slcg_bus_load_gating_prod = + gp10b_slcg_bus_load_gating_prod, + .slcg_ce2_load_gating_prod = + gp10b_slcg_ce2_load_gating_prod, + .slcg_chiplet_load_gating_prod = + gp10b_slcg_chiplet_load_gating_prod, + .slcg_ctxsw_firmware_load_gating_prod = + gp10b_slcg_ctxsw_firmware_load_gating_prod, + .slcg_fb_load_gating_prod = + gp10b_slcg_fb_load_gating_prod, + .slcg_fifo_load_gating_prod = + gp10b_slcg_fifo_load_gating_prod, + .slcg_gr_load_gating_prod = + 
gr_gp10b_slcg_gr_load_gating_prod, + .slcg_ltc_load_gating_prod = + ltc_gp10b_slcg_ltc_load_gating_prod, + .slcg_perf_load_gating_prod = + gp10b_slcg_perf_load_gating_prod, + .slcg_priring_load_gating_prod = + gp10b_slcg_priring_load_gating_prod, + .slcg_pmu_load_gating_prod = + gp10b_slcg_pmu_load_gating_prod, + .slcg_therm_load_gating_prod = + gp10b_slcg_therm_load_gating_prod, + .slcg_xbar_load_gating_prod = + gp10b_slcg_xbar_load_gating_prod, + .blcg_bus_load_gating_prod = + gp10b_blcg_bus_load_gating_prod, + .blcg_ce_load_gating_prod = + gp10b_blcg_ce_load_gating_prod, + .blcg_ctxsw_firmware_load_gating_prod = + gp10b_blcg_ctxsw_firmware_load_gating_prod, + .blcg_fb_load_gating_prod = + gp10b_blcg_fb_load_gating_prod, + .blcg_fifo_load_gating_prod = + gp10b_blcg_fifo_load_gating_prod, + .blcg_gr_load_gating_prod = + gp10b_blcg_gr_load_gating_prod, + .blcg_ltc_load_gating_prod = + gp10b_blcg_ltc_load_gating_prod, + .blcg_pwr_csb_load_gating_prod = + gp10b_blcg_pwr_csb_load_gating_prod, + .blcg_pmu_load_gating_prod = + gp10b_blcg_pmu_load_gating_prod, + .blcg_xbar_load_gating_prod = + gp10b_blcg_xbar_load_gating_prod, + .pg_gr_load_gating_prod = + gr_gp10b_pg_gr_load_gating_prod, + }, + .fifo = { + .init_fifo_setup_hw = vgpu_init_fifo_setup_hw, + .bind_channel = vgpu_channel_bind, + .unbind_channel = vgpu_channel_unbind, + .disable_channel = vgpu_channel_disable, + .enable_channel = vgpu_channel_enable, + .alloc_inst = vgpu_channel_alloc_inst, + .free_inst = vgpu_channel_free_inst, + .setup_ramfc = vgpu_channel_setup_ramfc, + .channel_set_priority = vgpu_channel_set_priority, + .channel_set_timeslice = vgpu_channel_set_timeslice, + .default_timeslice_us = vgpu_fifo_default_timeslice_us, + .setup_userd = gk20a_fifo_setup_userd, + .userd_gp_get = gk20a_fifo_userd_gp_get, + .userd_gp_put = gk20a_fifo_userd_gp_put, + .userd_pb_get = gk20a_fifo_userd_pb_get, + .pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val, + .preempt_channel = vgpu_fifo_preempt_channel, + .preempt_tsg = vgpu_fifo_preempt_tsg, + .enable_tsg = gk20a_enable_tsg, + .disable_tsg = gk20a_disable_tsg, + .tsg_verify_channel_status = NULL, + .tsg_verify_status_ctx_reload = gm20b_fifo_tsg_verify_status_ctx_reload, + .reschedule_runlist = NULL, + .update_runlist = vgpu_fifo_update_runlist, + .trigger_mmu_fault = gm20b_fifo_trigger_mmu_fault, + .get_mmu_fault_info = gp10b_fifo_get_mmu_fault_info, + .wait_engine_idle = vgpu_fifo_wait_engine_idle, + .get_num_fifos = gm20b_fifo_get_num_fifos, + .get_pbdma_signature = gp10b_fifo_get_pbdma_signature, + .set_runlist_interleave = vgpu_fifo_set_runlist_interleave, + .tsg_set_timeslice = vgpu_tsg_set_timeslice, + .tsg_open = vgpu_tsg_open, + .force_reset_ch = vgpu_fifo_force_reset_ch, + .engine_enum_from_type = gp10b_fifo_engine_enum_from_type, + .device_info_data_parse = gp10b_device_info_data_parse, + .eng_runlist_base_size = fifo_eng_runlist_base__size_1_v, + .init_engine_info = vgpu_fifo_init_engine_info, + .runlist_entry_size = ram_rl_entry_size_v, + .get_tsg_runlist_entry = gk20a_get_tsg_runlist_entry, + .get_ch_runlist_entry = gk20a_get_ch_runlist_entry, + .is_fault_engine_subid_gpc = gk20a_is_fault_engine_subid_gpc, + .dump_pbdma_status = gk20a_dump_pbdma_status, + .dump_eng_status = gk20a_dump_eng_status, + .dump_channel_status_ramfc = gk20a_dump_channel_status_ramfc, + .intr_0_error_mask = gk20a_fifo_intr_0_error_mask, + .is_preempt_pending = gk20a_fifo_is_preempt_pending, + .init_pbdma_intr_descs = gp10b_fifo_init_pbdma_intr_descs, + .reset_enable_hw = 
gk20a_init_fifo_reset_enable_hw, + .teardown_ch_tsg = gk20a_fifo_teardown_ch_tsg, + .handle_sched_error = gk20a_fifo_handle_sched_error, + .handle_pbdma_intr_0 = gk20a_fifo_handle_pbdma_intr_0, + .handle_pbdma_intr_1 = gk20a_fifo_handle_pbdma_intr_1, + .tsg_bind_channel = vgpu_tsg_bind_channel, + .tsg_unbind_channel = vgpu_tsg_unbind_channel, +#ifdef CONFIG_TEGRA_GK20A_NVHOST + .alloc_syncpt_buf = gk20a_fifo_alloc_syncpt_buf, + .free_syncpt_buf = gk20a_fifo_free_syncpt_buf, + .add_syncpt_wait_cmd = gk20a_fifo_add_syncpt_wait_cmd, + .get_syncpt_wait_cmd_size = gk20a_fifo_get_syncpt_wait_cmd_size, + .add_syncpt_incr_cmd = gk20a_fifo_add_syncpt_incr_cmd, + .get_syncpt_incr_cmd_size = gk20a_fifo_get_syncpt_incr_cmd_size, +#endif + .resetup_ramfc = NULL, + .device_info_fault_id = top_device_info_data_fault_id_enum_v, + }, + .gr_ctx = { + .get_netlist_name = gr_gp10b_get_netlist_name, + .is_fw_defined = gr_gp10b_is_firmware_defined, + }, +#ifdef CONFIG_GK20A_CTXSW_TRACE + .fecs_trace = { + .alloc_user_buffer = vgpu_alloc_user_buffer, + .free_user_buffer = vgpu_free_user_buffer, + .mmap_user_buffer = vgpu_mmap_user_buffer, + .init = vgpu_fecs_trace_init, + .deinit = vgpu_fecs_trace_deinit, + .enable = vgpu_fecs_trace_enable, + .disable = vgpu_fecs_trace_disable, + .is_enabled = vgpu_fecs_trace_is_enabled, + .reset = NULL, + .flush = NULL, + .poll = vgpu_fecs_trace_poll, + .bind_channel = NULL, + .unbind_channel = NULL, + .max_entries = vgpu_fecs_trace_max_entries, + .set_filter = vgpu_fecs_trace_set_filter, + }, +#endif /* CONFIG_GK20A_CTXSW_TRACE */ + .mm = { + /* FIXME: add support for sparse mappings */ + .support_sparse = NULL, + .gmmu_map = vgpu_gp10b_locked_gmmu_map, + .gmmu_unmap = vgpu_locked_gmmu_unmap, + .vm_bind_channel = vgpu_vm_bind_channel, + .fb_flush = vgpu_mm_fb_flush, + .l2_invalidate = vgpu_mm_l2_invalidate, + .l2_flush = vgpu_mm_l2_flush, + .cbc_clean = gk20a_mm_cbc_clean, + .set_big_page_size = gm20b_mm_set_big_page_size, + .get_big_page_sizes = gm20b_mm_get_big_page_sizes, + .get_default_big_page_size = gp10b_mm_get_default_big_page_size, + .gpu_phys_addr = gm20b_gpu_phys_addr, + .get_iommu_bit = gk20a_mm_get_iommu_bit, + .get_mmu_levels = gp10b_mm_get_mmu_levels, + .init_pdb = gp10b_mm_init_pdb, + .init_mm_setup_hw = vgpu_gp10b_init_mm_setup_hw, + .is_bar1_supported = gm20b_mm_is_bar1_supported, + .init_inst_block = gk20a_init_inst_block, + .mmu_fault_pending = gk20a_fifo_mmu_fault_pending, + .init_bar2_vm = gb10b_init_bar2_vm, + .init_bar2_mm_hw_setup = gb10b_init_bar2_mm_hw_setup, + .remove_bar2_vm = gp10b_remove_bar2_vm, + }, + .pramin = { + .enter = gk20a_pramin_enter, + .exit = gk20a_pramin_exit, + .data032_r = pram_data032_r, + }, + .therm = { + .init_therm_setup_hw = gp10b_init_therm_setup_hw, + .elcg_init_idle_filters = gp10b_elcg_init_idle_filters, + }, + .pmu = { + .pmu_setup_elpg = gp10b_pmu_setup_elpg, + .pmu_get_queue_head = pwr_pmu_queue_head_r, + .pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v, + .pmu_get_queue_tail = pwr_pmu_queue_tail_r, + .pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v, + .pmu_queue_head = gk20a_pmu_queue_head, + .pmu_queue_tail = gk20a_pmu_queue_tail, + .pmu_msgq_tail = gk20a_pmu_msgq_tail, + .pmu_mutex_size = pwr_pmu_mutex__size_1_v, + .pmu_mutex_acquire = gk20a_pmu_mutex_acquire, + .pmu_mutex_release = gk20a_pmu_mutex_release, + .write_dmatrfbase = gp10b_write_dmatrfbase, + .pmu_elpg_statistics = gp10b_pmu_elpg_statistics, + .pmu_pg_init_param = gp10b_pg_gr_init, + .pmu_pg_supported_engines_list = 
gk20a_pmu_pg_engines_list, + .pmu_pg_engines_feature_list = gk20a_pmu_pg_feature_list, + .dump_secure_fuses = pmu_dump_security_fuses_gp10b, + .reset_engine = gk20a_pmu_engine_reset, + .is_engine_in_reset = gk20a_pmu_is_engine_in_reset, + }, + .regops = { + .get_global_whitelist_ranges = + gp10b_get_global_whitelist_ranges, + .get_global_whitelist_ranges_count = + gp10b_get_global_whitelist_ranges_count, + .get_context_whitelist_ranges = + gp10b_get_context_whitelist_ranges, + .get_context_whitelist_ranges_count = + gp10b_get_context_whitelist_ranges_count, + .get_runcontrol_whitelist = gp10b_get_runcontrol_whitelist, + .get_runcontrol_whitelist_count = + gp10b_get_runcontrol_whitelist_count, + .get_runcontrol_whitelist_ranges = + gp10b_get_runcontrol_whitelist_ranges, + .get_runcontrol_whitelist_ranges_count = + gp10b_get_runcontrol_whitelist_ranges_count, + .get_qctl_whitelist = gp10b_get_qctl_whitelist, + .get_qctl_whitelist_count = gp10b_get_qctl_whitelist_count, + .get_qctl_whitelist_ranges = gp10b_get_qctl_whitelist_ranges, + .get_qctl_whitelist_ranges_count = + gp10b_get_qctl_whitelist_ranges_count, + .apply_smpc_war = gp10b_apply_smpc_war, + }, + .mc = { + .intr_enable = mc_gp10b_intr_enable, + .intr_unit_config = mc_gp10b_intr_unit_config, + .isr_stall = mc_gp10b_isr_stall, + .intr_stall = mc_gp10b_intr_stall, + .intr_stall_pause = mc_gp10b_intr_stall_pause, + .intr_stall_resume = mc_gp10b_intr_stall_resume, + .intr_nonstall = mc_gp10b_intr_nonstall, + .intr_nonstall_pause = mc_gp10b_intr_nonstall_pause, + .intr_nonstall_resume = mc_gp10b_intr_nonstall_resume, + .enable = gk20a_mc_enable, + .disable = gk20a_mc_disable, + .reset = gk20a_mc_reset, + .boot_0 = gk20a_mc_boot_0, + .is_intr1_pending = mc_gp10b_is_intr1_pending, + }, + .debug = { + .show_dump = NULL, + }, + .dbg_session_ops = { + .exec_reg_ops = vgpu_exec_regops, + .dbg_set_powergate = vgpu_dbg_set_powergate, + .check_and_set_global_reservation = + vgpu_check_and_set_global_reservation, + .check_and_set_context_reservation = + vgpu_check_and_set_context_reservation, + .release_profiler_reservation = + vgpu_release_profiler_reservation, + .perfbuffer_enable = vgpu_perfbuffer_enable, + .perfbuffer_disable = vgpu_perfbuffer_disable, + }, + .cde = { + .get_program_numbers = gp10b_cde_get_program_numbers, + .need_scatter_buffer = gp10b_need_scatter_buffer, + .populate_scatter_buffer = gp10b_populate_scatter_buffer, + }, + .bus = { + .init_hw = gk20a_bus_init_hw, + .isr = gk20a_bus_isr, + .read_ptimer = vgpu_read_ptimer, + .get_timestamps_zipper = vgpu_get_timestamps_zipper, + .bar1_bind = gk20a_bus_bar1_bind, + }, +#if defined(CONFIG_GK20A_CYCLE_STATS) + .css = { + .enable_snapshot = vgpu_css_enable_snapshot_buffer, + .disable_snapshot = vgpu_css_release_snapshot_buffer, + .check_data_available = vgpu_css_flush_snapshots, + .detach_snapshot = vgpu_css_detach, + .set_handled_snapshots = NULL, + .allocate_perfmon_ids = NULL, + .release_perfmon_ids = NULL, + }, +#endif + .falcon = { + .falcon_hal_sw_init = gk20a_falcon_hal_sw_init, + }, + .priv_ring = { + .isr = gp10b_priv_ring_isr, + }, + .chip_init_gpu_characteristics = vgpu_init_gpu_characteristics, + .get_litter_value = gp10b_get_litter_value, +}; + int vgpu_gp10b_init_hal(struct gk20a *g) { - int err; + struct gpu_ops *gops = &g->ops; + struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics; + u32 val; + + gops->ltc = vgpu_gp10b_ops.ltc; + gops->ce2 = vgpu_gp10b_ops.ce2; + gops->gr = vgpu_gp10b_ops.gr; + gops->fb = vgpu_gp10b_ops.fb; + gops->clock_gating = 
vgpu_gp10b_ops.clock_gating; + gops->fifo = vgpu_gp10b_ops.fifo; + gops->gr_ctx = vgpu_gp10b_ops.gr_ctx; + gops->fecs_trace = vgpu_gp10b_ops.fecs_trace; + gops->mm = vgpu_gp10b_ops.mm; + gops->pramin = vgpu_gp10b_ops.pramin; + gops->therm = vgpu_gp10b_ops.therm; + gops->pmu = vgpu_gp10b_ops.pmu; + gops->regops = vgpu_gp10b_ops.regops; + gops->mc = vgpu_gp10b_ops.mc; + gops->debug = vgpu_gp10b_ops.debug; + gops->dbg_session_ops = vgpu_gp10b_ops.dbg_session_ops; + gops->cde = vgpu_gp10b_ops.cde; + gops->bus = vgpu_gp10b_ops.bus; +#if defined(CONFIG_GK20A_CYCLE_STATS) + gops->css = vgpu_gp10b_ops.css; +#endif + gops->falcon = vgpu_gp10b_ops.falcon; + + gops->priv_ring = vgpu_gp10b_ops.priv_ring; + + /* Lone Functions */ + gops->chip_init_gpu_characteristics = + vgpu_gp10b_ops.chip_init_gpu_characteristics; + gops->get_litter_value = vgpu_gp10b_ops.get_litter_value; + + __nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true); + __nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false); + +#ifdef CONFIG_TEGRA_ACR + if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false); + } else if (g->is_virtual) { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true); + } else { + val = gk20a_readl(g, fuse_opt_priv_sec_en_r()); + if (val) { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true); + } else { + gk20a_dbg_info("priv security is disabled in HW"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false); + } + } +#else + if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) { + gk20a_dbg_info("running simulator with PRIV security disabled"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false); + } else { + val = gk20a_readl(g, fuse_opt_priv_sec_en_r()); + if (val) { + gk20a_dbg_info("priv security is not supported but enabled"); + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true); + return -EPERM; + } else { + __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false); + __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false); + } + } +#endif + + /* priv security dependent ops */ + if (nvgpu_is_enabled(g, NVGPU_SEC_PRIVSECURITY)) { + /* Add in ops from gm20b acr */ + gops->pmu.is_pmu_supported = gm20b_is_pmu_supported, + gops->pmu.prepare_ucode = prepare_ucode_blob, + gops->pmu.pmu_setup_hw_and_bootstrap = gm20b_bootstrap_hs_flcn, + gops->pmu.is_lazy_bootstrap = gm20b_is_lazy_bootstrap, + gops->pmu.is_priv_load = gm20b_is_priv_load, + gops->pmu.get_wpr = gm20b_wpr_info, + gops->pmu.alloc_blob_space = gm20b_alloc_blob_space, + gops->pmu.pmu_populate_loader_cfg = + gm20b_pmu_populate_loader_cfg, + gops->pmu.flcn_populate_bl_dmem_desc = + gm20b_flcn_populate_bl_dmem_desc, + gops->pmu.falcon_wait_for_halt = pmu_wait_for_halt, + gops->pmu.falcon_clear_halt_interrupt_status = + clear_halt_interrupt_status, + gops->pmu.init_falcon_setup_hw = gm20b_init_pmu_setup_hw1, + + gops->pmu.init_wpr_region = gm20b_pmu_init_acr; + gops->pmu.load_lsfalcon_ucode = gp10b_load_falcon_ucode; + gops->pmu.is_lazy_bootstrap = gp10b_is_lazy_bootstrap; + gops->pmu.is_priv_load = gp10b_is_priv_load; + + gops->gr.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode; + } else { + /* Inherit from gk20a */ + gops->pmu.is_pmu_supported = gk20a_is_pmu_supported, + 
gops->pmu.prepare_ucode = nvgpu_pmu_prepare_ns_ucode_blob, + gops->pmu.pmu_setup_hw_and_bootstrap = gk20a_init_pmu_setup_hw1, + gops->pmu.pmu_nsbootstrap = pmu_bootstrap, + + gops->pmu.load_lsfalcon_ucode = NULL; + gops->pmu.init_wpr_region = NULL; + gops->pmu.pmu_setup_hw_and_bootstrap = gp10b_init_pmu_setup_hw1; + + gops->gr.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode; + } + + __nvgpu_set_enabled(g, NVGPU_PMU_FECS_BOOTSTRAP_DONE, false); + g->pmu_lsf_pmu_wpr_init_done = 0; + g->bootstrap_owner = LSF_BOOTSTRAP_OWNER_DEFAULT; + + gp10b_init_uncompressed_kind_map(); + gp10b_init_kind_attr(); - gk20a_dbg_fn(""); + g->name = "gp10b"; - err = gp10b_init_hal(g); - if (err) - return err; + c->twod_class = FERMI_TWOD_A; + c->threed_class = PASCAL_A; + c->compute_class = PASCAL_COMPUTE_A; + c->gpfifo_class = PASCAL_CHANNEL_GPFIFO_A; + c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B; + c->dma_copy_class = PASCAL_DMA_COPY_A; - vgpu_init_hal_common(g); - vgpu_gp10b_init_gr_ops(&g->ops); - vgpu_gp10b_init_fifo_ops(&g->ops); - vgpu_gp10b_init_mm_ops(&g->ops); return 0; } diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.c b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.c index cb7008ba..f063961f 100644 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.c +++ b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.c @@ -28,7 +28,7 @@ #include -static int vgpu_gp10b_init_mm_setup_hw(struct gk20a *g) +int vgpu_gp10b_init_mm_setup_hw(struct gk20a *g) { g->mm.bypass_smmu = true; g->mm.disable_bigpage = true; @@ -47,7 +47,7 @@ static inline int add_mem_desc(struct tegra_vgpu_mem_desc *mem_desc, return 0; } -static u64 vgpu_gp10b_locked_gmmu_map(struct vm_gk20a *vm, +u64 vgpu_gp10b_locked_gmmu_map(struct vm_gk20a *vm, u64 map_offset, struct nvgpu_sgt *sgt, u64 buffer_offset, @@ -200,14 +200,3 @@ fail: return 0; } - -void vgpu_gp10b_init_mm_ops(struct gpu_ops *gops) -{ - gk20a_dbg_fn(""); - - gops->mm.gmmu_map = vgpu_gp10b_locked_gmmu_map; - gops->mm.init_mm_setup_hw = vgpu_gp10b_init_mm_setup_hw; - - /* FIXME: add support for sparse mappings */ - gops->mm.support_sparse = NULL; -} diff --git a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.h b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.h index a8f0b7bc..fd6760ff 100644 --- a/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.h +++ b/drivers/gpu/nvgpu/vgpu/gp10b/vgpu_mm_gp10b.h @@ -1,5 +1,5 @@ /* - * Copyright (c) 2015, NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved. 
* * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -25,6 +25,21 @@ #include "gk20a/gk20a.h" -void vgpu_gp10b_init_mm_ops(struct gpu_ops *gops); +u64 vgpu_gp10b_locked_gmmu_map(struct vm_gk20a *vm, + u64 map_offset, + struct nvgpu_sgt *sgt, + u64 buffer_offset, + u64 size, + int pgsz_idx, + u8 kind_v, + u32 ctag_offset, + u32 flags, + int rw_flag, + bool clear_ctags, + bool sparse, + bool priv, + struct vm_gk20a_mapping_batch *batch, + enum nvgpu_aperture aperture); +int vgpu_gp10b_init_mm_setup_hw(struct gk20a *g); #endif diff --git a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c index 7f267f26..96d21c0a 100644 --- a/drivers/gpu/nvgpu/vgpu/gr_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/gr_vgpu.c @@ -26,11 +26,12 @@ #include #include "vgpu/vgpu.h" +#include "vgpu/gr_vgpu.h" #include "gk20a/dbg_gpu_gk20a.h" #include -static void vgpu_gr_detect_sm_arch(struct gk20a *g) +void vgpu_gr_detect_sm_arch(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -427,7 +428,7 @@ static void vgpu_gr_free_channel_pm_ctx(struct channel_gk20a *c) pm_ctx->mem.gpu_va = 0; } -static void vgpu_gr_free_channel_ctx(struct channel_gk20a *c, bool is_tsg) +void vgpu_gr_free_channel_ctx(struct channel_gk20a *c, bool is_tsg) { gk20a_dbg_fn(""); @@ -484,7 +485,7 @@ static int vgpu_gr_tsg_bind_gr_ctx(struct tsg_gk20a *tsg) return err; } -static int vgpu_gr_alloc_obj_ctx(struct channel_gk20a *c, +int vgpu_gr_alloc_obj_ctx(struct channel_gk20a *c, struct nvgpu_alloc_obj_ctx_args *args) { struct gk20a *g = c->g; @@ -666,7 +667,7 @@ cleanup: return -ENOMEM; } -static int vgpu_gr_bind_ctxsw_zcull(struct gk20a *g, struct gr_gk20a *gr, +int vgpu_gr_bind_ctxsw_zcull(struct gk20a *g, struct gr_gk20a *gr, struct channel_gk20a *c, u64 zcull_va, u32 mode) { @@ -686,7 +687,7 @@ static int vgpu_gr_bind_ctxsw_zcull(struct gk20a *g, struct gr_gk20a *gr, return (err || msg.ret) ? 
-ENOMEM : 0; } -static int vgpu_gr_get_zcull_info(struct gk20a *g, struct gr_gk20a *gr, +int vgpu_gr_get_zcull_info(struct gk20a *g, struct gr_gk20a *gr, struct gr_zcull_info *zcull_params) { struct tegra_vgpu_cmd_msg msg; @@ -717,14 +718,14 @@ static int vgpu_gr_get_zcull_info(struct gk20a *g, struct gr_gk20a *gr, return 0; } -static u32 vgpu_gr_get_gpc_tpc_mask(struct gk20a *g, u32 gpc_index) +u32 vgpu_gr_get_gpc_tpc_mask(struct gk20a *g, u32 gpc_index) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); return priv->constants.gpc_tpc_mask[gpc_index]; } -static u32 vgpu_gr_get_max_fbps_count(struct gk20a *g) +u32 vgpu_gr_get_max_fbps_count(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -733,7 +734,7 @@ static u32 vgpu_gr_get_max_fbps_count(struct gk20a *g) return priv->constants.num_fbps; } -static u32 vgpu_gr_get_fbp_en_mask(struct gk20a *g) +u32 vgpu_gr_get_fbp_en_mask(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -742,7 +743,7 @@ static u32 vgpu_gr_get_fbp_en_mask(struct gk20a *g) return priv->constants.fbp_en_mask; } -static u32 vgpu_gr_get_max_ltc_per_fbp(struct gk20a *g) +u32 vgpu_gr_get_max_ltc_per_fbp(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -751,7 +752,7 @@ static u32 vgpu_gr_get_max_ltc_per_fbp(struct gk20a *g) return priv->constants.ltc_per_fbp; } -static u32 vgpu_gr_get_max_lts_per_ltc(struct gk20a *g) +u32 vgpu_gr_get_max_lts_per_ltc(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -760,13 +761,13 @@ static u32 vgpu_gr_get_max_lts_per_ltc(struct gk20a *g) return priv->constants.max_lts_per_ltc; } -static u32 *vgpu_gr_rop_l2_en_mask(struct gk20a *g) +u32 *vgpu_gr_rop_l2_en_mask(struct gk20a *g) { /* no one use it yet */ return NULL; } -static int vgpu_gr_add_zbc(struct gk20a *g, struct gr_gk20a *gr, +int vgpu_gr_add_zbc(struct gk20a *g, struct gr_gk20a *gr, struct zbc_entry *zbc_val) { struct tegra_vgpu_cmd_msg msg = {0}; @@ -797,7 +798,7 @@ static int vgpu_gr_add_zbc(struct gk20a *g, struct gr_gk20a *gr, return (err || msg.ret) ? -ENOMEM : 0; } -static int vgpu_gr_query_zbc(struct gk20a *g, struct gr_gk20a *gr, +int vgpu_gr_query_zbc(struct gk20a *g, struct gr_gk20a *gr, struct zbc_query_params *query_params) { struct tegra_vgpu_cmd_msg msg = {0}; @@ -997,7 +998,7 @@ int vgpu_gr_nonstall_isr(struct gk20a *g, return 0; } -static int vgpu_gr_set_sm_debug_mode(struct gk20a *g, +int vgpu_gr_set_sm_debug_mode(struct gk20a *g, struct channel_gk20a *ch, u64 sms, bool enable) { struct tegra_vgpu_cmd_msg msg; @@ -1017,7 +1018,7 @@ static int vgpu_gr_set_sm_debug_mode(struct gk20a *g, return err ? err : msg.ret; } -static int vgpu_gr_update_smpc_ctxsw_mode(struct gk20a *g, +int vgpu_gr_update_smpc_ctxsw_mode(struct gk20a *g, struct channel_gk20a *ch, bool enable) { struct tegra_vgpu_cmd_msg msg; @@ -1041,7 +1042,7 @@ static int vgpu_gr_update_smpc_ctxsw_mode(struct gk20a *g, return err ? err : msg.ret; } -static int vgpu_gr_update_hwpm_ctxsw_mode(struct gk20a *g, +int vgpu_gr_update_hwpm_ctxsw_mode(struct gk20a *g, struct channel_gk20a *ch, bool enable) { struct channel_ctx_gk20a *ch_ctx = &ch->ch_ctx; @@ -1079,7 +1080,7 @@ static int vgpu_gr_update_hwpm_ctxsw_mode(struct gk20a *g, return err ? 
err : msg.ret; } -static int vgpu_gr_clear_sm_error_state(struct gk20a *g, +int vgpu_gr_clear_sm_error_state(struct gk20a *g, struct channel_gk20a *ch, u32 sm_id) { struct gr_gk20a *gr = &g->gr; @@ -1172,7 +1173,7 @@ done: return err; } -static int vgpu_gr_suspend_contexts(struct gk20a *g, +int vgpu_gr_suspend_contexts(struct gk20a *g, struct dbg_session_gk20a *dbg_s, int *ctx_resident_ch_fd) { @@ -1180,7 +1181,7 @@ static int vgpu_gr_suspend_contexts(struct gk20a *g, ctx_resident_ch_fd, TEGRA_VGPU_CMD_SUSPEND_CONTEXTS); } -static int vgpu_gr_resume_contexts(struct gk20a *g, +int vgpu_gr_resume_contexts(struct gk20a *g, struct dbg_session_gk20a *dbg_s, int *ctx_resident_ch_fd) { @@ -1213,33 +1214,3 @@ void vgpu_gr_handle_sm_esr_event(struct gk20a *g, nvgpu_mutex_release(&g->dbg_sessions_lock); } - -void vgpu_init_gr_ops(struct gpu_ops *gops) -{ - gops->gr.detect_sm_arch = vgpu_gr_detect_sm_arch; - gops->gr.free_channel_ctx = vgpu_gr_free_channel_ctx; - gops->gr.alloc_obj_ctx = vgpu_gr_alloc_obj_ctx; - gops->gr.alloc_gr_ctx = vgpu_gr_alloc_gr_ctx; - gops->gr.free_gr_ctx = vgpu_gr_free_gr_ctx; - gops->gr.bind_ctxsw_zcull = vgpu_gr_bind_ctxsw_zcull; - gops->gr.get_zcull_info = vgpu_gr_get_zcull_info; - gops->gr.get_gpc_tpc_mask = vgpu_gr_get_gpc_tpc_mask; - gops->gr.get_max_fbps_count = vgpu_gr_get_max_fbps_count; - gops->gr.get_fbp_en_mask = vgpu_gr_get_fbp_en_mask; - gops->gr.get_max_ltc_per_fbp = vgpu_gr_get_max_ltc_per_fbp; - gops->gr.get_max_lts_per_ltc = vgpu_gr_get_max_lts_per_ltc; - gops->gr.get_rop_l2_en_mask = vgpu_gr_rop_l2_en_mask; - gops->gr.zbc_set_table = vgpu_gr_add_zbc; - gops->gr.zbc_query_table = vgpu_gr_query_zbc; - gops->gr.init_ctx_state = vgpu_gr_init_ctx_state; - gops->gr.set_sm_debug_mode = vgpu_gr_set_sm_debug_mode; - gops->gr.update_smpc_ctxsw_mode = vgpu_gr_update_smpc_ctxsw_mode; - gops->gr.update_hwpm_ctxsw_mode = vgpu_gr_update_hwpm_ctxsw_mode; - gops->gr.clear_sm_error_state = vgpu_gr_clear_sm_error_state; - gops->gr.suspend_contexts = vgpu_gr_suspend_contexts; - gops->gr.resume_contexts = vgpu_gr_resume_contexts; - gops->gr.commit_inst = vgpu_gr_commit_inst; - gops->gr.dump_gr_regs = NULL; - gops->gr.set_boosted_ctx = NULL; - gops->gr.update_boosted_ctx = NULL; -} diff --git a/drivers/gpu/nvgpu/vgpu/gr_vgpu.h b/drivers/gpu/nvgpu/vgpu/gr_vgpu.h index b6df991e..5a5e0928 100644 --- a/drivers/gpu/nvgpu/vgpu/gr_vgpu.h +++ b/drivers/gpu/nvgpu/vgpu/gr_vgpu.h @@ -23,6 +23,50 @@ #ifndef _GR_VGPU_H_ #define _GR_VGPU_H_ +#include + +struct gk20a; +struct channel_gk20a; +struct nvgpu_alloc_obj_ctx_args; +struct gr_gk20a; +struct gr_zcull_info; +struct zbc_entry; +struct zbc_query_params; +struct dbg_session_gk20a; + +void vgpu_gr_detect_sm_arch(struct gk20a *g); +void vgpu_gr_free_channel_ctx(struct channel_gk20a *c, bool is_tsg); +int vgpu_gr_alloc_obj_ctx(struct channel_gk20a *c, + struct nvgpu_alloc_obj_ctx_args *args); +int vgpu_gr_bind_ctxsw_zcull(struct gk20a *g, struct gr_gk20a *gr, + struct channel_gk20a *c, u64 zcull_va, + u32 mode); +int vgpu_gr_get_zcull_info(struct gk20a *g, struct gr_gk20a *gr, + struct gr_zcull_info *zcull_params); +u32 vgpu_gr_get_gpc_tpc_mask(struct gk20a *g, u32 gpc_index); +u32 vgpu_gr_get_max_fbps_count(struct gk20a *g); +u32 vgpu_gr_get_fbp_en_mask(struct gk20a *g); +u32 vgpu_gr_get_max_ltc_per_fbp(struct gk20a *g); +u32 vgpu_gr_get_max_lts_per_ltc(struct gk20a *g); +u32 *vgpu_gr_rop_l2_en_mask(struct gk20a *g); +int vgpu_gr_add_zbc(struct gk20a *g, struct gr_gk20a *gr, + struct zbc_entry *zbc_val); +int vgpu_gr_query_zbc(struct gk20a 
*g, struct gr_gk20a *gr, + struct zbc_query_params *query_params); +int vgpu_gr_set_sm_debug_mode(struct gk20a *g, + struct channel_gk20a *ch, u64 sms, bool enable); +int vgpu_gr_update_smpc_ctxsw_mode(struct gk20a *g, + struct channel_gk20a *ch, bool enable); +int vgpu_gr_update_hwpm_ctxsw_mode(struct gk20a *g, + struct channel_gk20a *ch, bool enable); +int vgpu_gr_clear_sm_error_state(struct gk20a *g, + struct channel_gk20a *ch, u32 sm_id); +int vgpu_gr_suspend_contexts(struct gk20a *g, + struct dbg_session_gk20a *dbg_s, + int *ctx_resident_ch_fd); +int vgpu_gr_resume_contexts(struct gk20a *g, + struct dbg_session_gk20a *dbg_s, + int *ctx_resident_ch_fd); int vgpu_gr_commit_inst(struct channel_gk20a *c, u64 gpu_va); #endif diff --git a/drivers/gpu/nvgpu/vgpu/ltc_vgpu.c b/drivers/gpu/nvgpu/vgpu/ltc_vgpu.c index db39b309..a6848872 100644 --- a/drivers/gpu/nvgpu/vgpu/ltc_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/ltc_vgpu.c @@ -1,7 +1,7 @@ /* * Virtualized GPU L2 * - * Copyright (c) 2014-2016 NVIDIA CORPORATION. All rights reserved. + * Copyright (c) 2014-2017 NVIDIA CORPORATION. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -23,8 +23,9 @@ */ #include "vgpu/vgpu.h" +#include "vgpu/ltc_vgpu.h" -static int vgpu_determine_L2_size_bytes(struct gk20a *g) +int vgpu_determine_L2_size_bytes(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -33,7 +34,7 @@ static int vgpu_determine_L2_size_bytes(struct gk20a *g) return priv->constants.l2_size; } -static int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr) +int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); u32 max_comptag_lines = 0; @@ -56,7 +57,7 @@ static int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr) return 0; } -static void vgpu_ltc_init_fs_state(struct gk20a *g) +void vgpu_ltc_init_fs_state(struct gk20a *g) { struct vgpu_priv_data *priv = vgpu_get_priv_data(g); @@ -64,11 +65,3 @@ static void vgpu_ltc_init_fs_state(struct gk20a *g) g->ltc_count = priv->constants.ltc_count; } - -void vgpu_init_ltc_ops(struct gpu_ops *gops) -{ - gops->ltc.determine_L2_size_bytes = vgpu_determine_L2_size_bytes; - gops->ltc.init_comptags = vgpu_ltc_init_comptags; - gops->ltc.init_fs_state = vgpu_ltc_init_fs_state; - gops->ltc.cbc_ctrl = NULL; -} diff --git a/drivers/gpu/nvgpu/vgpu/ltc_vgpu.h b/drivers/gpu/nvgpu/vgpu/ltc_vgpu.h new file mode 100644 index 00000000..3437b4cb --- /dev/null +++ b/drivers/gpu/nvgpu/vgpu/ltc_vgpu.h @@ -0,0 +1,33 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER + * DEALINGS IN THE SOFTWARE. + */ + +#ifndef _LTC_VGPU_H_ +#define _LTC_VGPU_H_ + +struct gk20a; +struct gr_gk20a; + +int vgpu_determine_L2_size_bytes(struct gk20a *g); +int vgpu_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr); +void vgpu_ltc_init_fs_state(struct gk20a *g); + +#endif diff --git a/drivers/gpu/nvgpu/vgpu/mm_vgpu.c b/drivers/gpu/nvgpu/vgpu/mm_vgpu.c index 49517b9a..8dcca0a1 100644 --- a/drivers/gpu/nvgpu/vgpu/mm_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/mm_vgpu.c @@ -35,6 +35,7 @@ #include #include "vgpu/vgpu.h" +#include "vgpu/mm_vgpu.h" #include "gk20a/mm_gk20a.h" #include "gm20b/mm_gm20b.h" @@ -85,7 +86,7 @@ int vgpu_init_mm_support(struct gk20a *g) return err; } -static u64 vgpu_locked_gmmu_map(struct vm_gk20a *vm, +u64 vgpu_locked_gmmu_map(struct vm_gk20a *vm, u64 map_offset, struct nvgpu_sgt *sgt, u64 buffer_offset, @@ -171,7 +172,7 @@ fail: return 0; } -static void vgpu_locked_gmmu_unmap(struct vm_gk20a *vm, +void vgpu_locked_gmmu_unmap(struct vm_gk20a *vm, u64 vaddr, u64 size, int pgsz_idx, @@ -274,7 +275,7 @@ u64 vgpu_bar1_map(struct gk20a *g, struct sg_table **sgt, u64 size) return addr; } -static int vgpu_vm_bind_channel(struct gk20a_as_share *as_share, +int vgpu_vm_bind_channel(struct gk20a_as_share *as_share, struct channel_gk20a *ch) { struct vm_gk20a *vm = as_share->vm; @@ -315,7 +316,7 @@ static void vgpu_cache_maint(u64 handle, u8 op) WARN_ON(err || msg.ret); } -static int vgpu_mm_fb_flush(struct gk20a *g) +int vgpu_mm_fb_flush(struct gk20a *g) { gk20a_dbg_fn(""); @@ -324,7 +325,7 @@ static int vgpu_mm_fb_flush(struct gk20a *g) return 0; } -static void vgpu_mm_l2_invalidate(struct gk20a *g) +void vgpu_mm_l2_invalidate(struct gk20a *g) { gk20a_dbg_fn(""); @@ -332,7 +333,7 @@ static void vgpu_mm_l2_invalidate(struct gk20a *g) vgpu_cache_maint(vgpu_get_handle(g), TEGRA_VGPU_L2_MAINT_INV); } -static void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate) +void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate) { u8 op; @@ -346,14 +347,14 @@ static void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate) vgpu_cache_maint(vgpu_get_handle(g), op); } -static void vgpu_mm_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb) +void vgpu_mm_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb) { gk20a_dbg_fn(""); nvgpu_err(g, "call to RM server not supported"); } -static void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable) +void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable) { struct tegra_vgpu_cmd_msg msg; struct tegra_vgpu_mmu_debug_mode *p = &msg.params.mmu_debug_mode; @@ -367,19 +368,3 @@ static void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable) err = vgpu_comm_sendrecv(&msg, sizeof(msg), sizeof(msg)); WARN_ON(err || msg.ret); } - -void vgpu_init_mm_ops(struct gpu_ops *gops) -{ - gops->fb.is_debug_mode_enabled = NULL; - gops->fb.set_debug_mode = vgpu_mm_mmu_set_debug_mode; - gops->mm.gmmu_map = vgpu_locked_gmmu_map; - gops->mm.gmmu_unmap = vgpu_locked_gmmu_unmap; - gops->mm.vm_bind_channel = vgpu_vm_bind_channel; - gops->mm.fb_flush = vgpu_mm_fb_flush; - gops->mm.l2_invalidate = vgpu_mm_l2_invalidate; - gops->mm.l2_flush = vgpu_mm_l2_flush; - gops->fb.tlb_invalidate = vgpu_mm_tlb_invalidate; - gops->mm.get_iommu_bit = gk20a_mm_get_iommu_bit; - gops->mm.gpu_phys_addr = gm20b_gpu_phys_addr; - 
gops->mm.init_mm_setup_hw = NULL; -} diff --git a/drivers/gpu/nvgpu/vgpu/mm_vgpu.h b/drivers/gpu/nvgpu/vgpu/mm_vgpu.h new file mode 100644 index 00000000..ed66282c --- /dev/null +++ b/drivers/gpu/nvgpu/vgpu/mm_vgpu.h @@ -0,0 +1,56 @@ +/* + * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved. + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER + * DEALINGS IN THE SOFTWARE. + */ + +#ifndef _MM_VGPU_H_ +#define _MM_VGPU_H_ + +u64 vgpu_locked_gmmu_map(struct vm_gk20a *vm, + u64 map_offset, + struct nvgpu_sgt *sgt, + u64 buffer_offset, + u64 size, + int pgsz_idx, + u8 kind_v, + u32 ctag_offset, + u32 flags, + int rw_flag, + bool clear_ctags, + bool sparse, + bool priv, + struct vm_gk20a_mapping_batch *batch, + enum nvgpu_aperture aperture); +void vgpu_locked_gmmu_unmap(struct vm_gk20a *vm, + u64 vaddr, + u64 size, + int pgsz_idx, + bool va_allocated, + int rw_flag, + bool sparse, + struct vm_gk20a_mapping_batch *batch); +int vgpu_vm_bind_channel(struct gk20a_as_share *as_share, + struct channel_gk20a *ch); +int vgpu_mm_fb_flush(struct gk20a *g); +void vgpu_mm_l2_invalidate(struct gk20a *g); +void vgpu_mm_l2_flush(struct gk20a *g, bool invalidate); +void vgpu_mm_tlb_invalidate(struct gk20a *g, struct nvgpu_mem *pdb); +void vgpu_mm_mmu_set_debug_mode(struct gk20a *g, bool enable); +#endif diff --git a/drivers/gpu/nvgpu/vgpu/tsg_vgpu.c b/drivers/gpu/nvgpu/vgpu/tsg_vgpu.c index 39d78983..2be102e3 100644 --- a/drivers/gpu/nvgpu/vgpu/tsg_vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/tsg_vgpu.c @@ -27,10 +27,11 @@ #include "gk20a/platform_gk20a.h" #include "gk20a/tsg_gk20a.h" #include "vgpu.h" +#include "fifo_vgpu.h" #include -static int vgpu_tsg_open(struct tsg_gk20a *tsg) +int vgpu_tsg_open(struct tsg_gk20a *tsg) { struct tegra_vgpu_cmd_msg msg = {}; struct tegra_vgpu_tsg_open_params *p = @@ -52,7 +53,7 @@ static int vgpu_tsg_open(struct tsg_gk20a *tsg) return err; } -static int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg, +int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg, struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg = {}; @@ -82,7 +83,7 @@ static int vgpu_tsg_bind_channel(struct tsg_gk20a *tsg, return err; } -static int vgpu_tsg_unbind_channel(struct channel_gk20a *ch) +int vgpu_tsg_unbind_channel(struct channel_gk20a *ch) { struct tegra_vgpu_cmd_msg msg = {}; struct tegra_vgpu_tsg_bind_unbind_channel_params *p = @@ -105,7 +106,7 @@ static int vgpu_tsg_unbind_channel(struct channel_gk20a *ch) return err; } -static int vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice) +int 
vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice) { struct tegra_vgpu_cmd_msg msg = {0}; struct tegra_vgpu_tsg_timeslice_params *p = @@ -126,11 +127,3 @@ static int vgpu_tsg_set_timeslice(struct tsg_gk20a *tsg, u32 timeslice) return err; } - -void vgpu_init_tsg_ops(struct gpu_ops *gops) -{ - gops->fifo.tsg_bind_channel = vgpu_tsg_bind_channel; - gops->fifo.tsg_unbind_channel = vgpu_tsg_unbind_channel; - gops->fifo.tsg_set_timeslice = vgpu_tsg_set_timeslice; - gops->fifo.tsg_open = vgpu_tsg_open; -} diff --git a/drivers/gpu/nvgpu/vgpu/vgpu.c b/drivers/gpu/nvgpu/vgpu/vgpu.c index b63202c1..7949ff24 100644 --- a/drivers/gpu/nvgpu/vgpu/vgpu.c +++ b/drivers/gpu/nvgpu/vgpu/vgpu.c @@ -378,7 +378,7 @@ int vgpu_init_gpu_characteristics(struct gk20a *g) return 0; } -static int vgpu_read_ptimer(struct gk20a *g, u64 *value) +int vgpu_read_ptimer(struct gk20a *g, u64 *value) { struct tegra_vgpu_cmd_msg msg = {0}; struct tegra_vgpu_read_ptimer_params *p = &msg.params.read_ptimer; @@ -441,27 +441,6 @@ int vgpu_get_timestamps_zipper(struct gk20a *g, return err; } -void vgpu_init_hal_common(struct gk20a *g) -{ - struct gpu_ops *gops = &g->ops; - - vgpu_init_fifo_ops(gops); - vgpu_init_gr_ops(gops); - vgpu_init_ltc_ops(gops); - vgpu_init_mm_ops(gops); - vgpu_init_debug_ops(gops); - vgpu_init_dbg_session_ops(gops); - vgpu_init_fecs_trace_ops(gops); - vgpu_init_tsg_ops(gops); -#if defined(CONFIG_GK20A_CYCLE_STATS) - vgpu_init_css_ops(gops); -#endif - vgpu_init_ce2_ops(gops); - gops->chip_init_gpu_characteristics = vgpu_init_gpu_characteristics; - gops->bus.read_ptimer = vgpu_read_ptimer; - gops->bus.get_timestamps_zipper = vgpu_get_timestamps_zipper; -} - static int vgpu_init_hal(struct gk20a *g) { u32 ver = g->gpu_characteristics.arch + g->gpu_characteristics.impl; diff --git a/drivers/gpu/nvgpu/vgpu/vgpu.h b/drivers/gpu/nvgpu/vgpu/vgpu.h index 7364a8d9..d5c49c0f 100644 --- a/drivers/gpu/nvgpu/vgpu/vgpu.h +++ b/drivers/gpu/nvgpu/vgpu/vgpu.h @@ -94,16 +94,7 @@ int vgpu_fifo_nonstall_isr(struct gk20a *g, struct tegra_vgpu_fifo_nonstall_intr_info *info); int vgpu_ce2_nonstall_isr(struct gk20a *g, struct tegra_vgpu_ce2_nonstall_intr_info *info); -void vgpu_init_fifo_ops(struct gpu_ops *gops); -void vgpu_init_gr_ops(struct gpu_ops *gops); -void vgpu_init_ltc_ops(struct gpu_ops *gops); -void vgpu_init_mm_ops(struct gpu_ops *gops); -void vgpu_init_debug_ops(struct gpu_ops *gops); -void vgpu_init_tsg_ops(struct gpu_ops *gops); -#if defined(CONFIG_GK20A_CYCLE_STATS) -void vgpu_init_css_ops(struct gpu_ops *gops); -#endif -void vgpu_init_ce2_ops(struct gpu_ops *gops); +u32 vgpu_ce_get_num_pce(struct gk20a *g); int vgpu_init_mm_support(struct gk20a *g); int vgpu_init_gr_support(struct gk20a *g); int vgpu_init_fifo_support(struct gk20a *g); @@ -112,15 +103,17 @@ int vgpu_get_attribute(u64 handle, u32 attrib, u32 *value); int vgpu_comm_sendrecv(struct tegra_vgpu_cmd_msg *msg, size_t size_in, size_t size_out); -void vgpu_init_hal_common(struct gk20a *g); int vgpu_gm20b_init_hal(struct gk20a *g); int vgpu_gp10b_init_hal(struct gk20a *g); -void vgpu_init_dbg_session_ops(struct gpu_ops *gops); int vgpu_init_gpu_characteristics(struct gk20a *g); void vgpu_create_sysfs(struct device *dev); void vgpu_remove_sysfs(struct device *dev); +int vgpu_read_ptimer(struct gk20a *g, u64 *value); +int vgpu_get_timestamps_zipper(struct gk20a *g, + u32 source_id, u32 count, + struct nvgpu_cpu_time_correlation_sample *samples); #else static inline int vgpu_pm_prepare_poweroff(struct device *dev) { @@ -169,29 +162,6 @@ static inline 
int vgpu_fifo_isr(struct gk20a *g, { return 0; } -static inline void vgpu_init_fifo_ops(struct gpu_ops *gops) -{ -} -static inline void vgpu_init_gr_ops(struct gpu_ops *gops) -{ -} -static inline void vgpu_init_ltc_ops(struct gpu_ops *gops) -{ -} -static inline void vgpu_init_mm_ops(struct gpu_ops *gops) -{ -} -static inline void vgpu_init_debug_ops(struct gpu_ops *gops) -{ -} -#if defined(CONFIG_GK20A_CYCLE_STATS) -static inline void vgpu_init_css_ops(struct gpu_ops *gops) -{ -} -#endif -static inline void vgpu_init_ce2_ops(struct gpu_ops *gops) -{ -} static inline int vgpu_init_mm_support(struct gk20a *g) { return -ENOSYS;
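
For readers skimming the diff, the core idiom is small: replace layered init helpers that patch g->ops member by member with one static const ops table per chip, assigned wholesale in a single file. What follows is a minimal standalone sketch of that pattern, not code from the patch; all names in it (dev_ops, vgpu_sample_ops, dev_init_hal, native_foo, vgpu_bar) are invented for illustration and are not nvgpu symbols.

#include <stdio.h>

struct dev_ops {
	int (*foo)(void);
	int (*bar)(void);
};

static int native_foo(void) { return 0; }
static int vgpu_bar(void)   { return 1; }

/*
 * Every entry point is visible statically in one table: native
 * implementations are reused directly, virtualized overrides are
 * named once, with no post-init layering to trace through.
 */
static const struct dev_ops vgpu_sample_ops = {
	.foo = native_foo,	/* reuse the native implementation */
	.bar = vgpu_bar,	/* virtualized override, set once */
};

struct device { struct dev_ops ops; };

static int dev_init_hal(struct device *d)
{
	/* single wholesale struct copy instead of layered fixups;
	 * members already set before HAL init (as the patch notes for
	 * the clk ops, assigned during probe) would instead be copied
	 * field by field to avoid clobbering them */
	d->ops = vgpu_sample_ops;
	return 0;
}

int main(void)
{
	struct device d;

	dev_init_hal(&d);
	printf("foo=%d bar=%d\n", d.ops.foo(), d.ops.bar());
	return 0;
}

Under this sketch's assumptions, the trade-off matches the one the commit makes: some duplication between per-chip tables (gm20b vs. gp10b) in exchange for every entry point being greppable in one place, with only genuinely dynamic members (probe-time clk ops, priv-security-dependent pmu/gr ops) still assigned imperatively.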