36 files changed, 7578 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/gp10b/ce_gp10b.c b/drivers/gpu/nvgpu/gp10b/ce_gp10b.c
new file mode 100644
index 00000000..86a2b751
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/ce_gp10b.c
@@ -0,0 +1,78 @@
+/*
+ * Pascal GPU series Copy Engine.
+ *
+ * Copyright (c) 2011-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "ce_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_ce_gp10b.h>
+/*
+ * Handle a copy-engine blocking-pipe interrupt: emit a debug message and
+ * return the blockpipe pending bit so the caller can add it to its clear
+ * mask. @fifo_intr is not used.
+ */
+static u32 ce_blockpipe_isr(struct gk20a *g, u32 fifo_intr)
+{
+        u32 handled;
+        gk20a_dbg(gpu_dbg_intr, "ce blocking pipe interrupt\n");
+        handled = ce_intr_status_blockpipe_pending_f();
+        return handled;
+}
+/*
+ * Handle a copy-engine launch-error interrupt: emit a debug message and
+ * return the launcherr pending bit so the caller can add it to its clear
+ * mask. @fifo_intr is not used.
+ */
+static u32 ce_launcherr_isr(struct gk20a *g, u32 fifo_intr)
+{
+        u32 handled;
+        gk20a_dbg(gpu_dbg_intr, "ce launch error interrupt\n");
+        handled = ce_intr_status_launcherr_pending_f();
+        return handled;
+}
+/*
+ * Interrupt handler for copy-engine instance @inst_id.
+ *
+ * Reads ce_intr_status_r(inst_id), dispatches the blockpipe and launcherr
+ * conditions to their helpers, and writes the collected bits back to the
+ * same status register. @pri_base is not used.
+ */
+void gp10b_ce_isr(struct gk20a *g, u32 inst_id, u32 pri_base)
+{
+        u32 handled = 0;
+        u32 status = gk20a_readl(g, ce_intr_status_r(inst_id));
+        gk20a_dbg(gpu_dbg_intr, "ce isr %08x %08x\n", status, inst_id);
+        /* clear blocking interrupts: they exhibit broken behavior */
+        if ((status & ce_intr_status_blockpipe_pending_f()) != 0)
+                handled |= ce_blockpipe_isr(g, status);
+        if ((status & ce_intr_status_launcherr_pending_f()) != 0)
+                handled |= ce_launcherr_isr(g, status);
+        /* Only the bits collected above are written back. */
+        gk20a_writel(g, ce_intr_status_r(inst_id), handled);
+}
+/*
+ * Non-stalling interrupt handler for copy-engine instance @inst_id.
+ *
+ * When the nonblockpipe bit is pending in ce_intr_status_r(inst_id), that
+ * bit is written back to the status register and the wakeup-semaphore and
+ * post-events operations are returned. Otherwise returns 0.
+ * @pri_base is not used.
+ */
+int gp10b_ce_nonstall_isr(struct gk20a *g, u32 inst_id, u32 pri_base)
+{
+        u32 status = gk20a_readl(g, ce_intr_status_r(inst_id));
+        gk20a_dbg(gpu_dbg_intr, "ce nonstall isr %08x %08x\n", status, inst_id);
+        if (!(status & ce_intr_status_nonblockpipe_pending_f()))
+                return 0;
+        gk20a_writel(g, ce_intr_status_r(inst_id),
+                ce_intr_status_nonblockpipe_pending_f());
+        return gk20a_nonstall_ops_wakeup_semaphore |
+                gk20a_nonstall_ops_post_events;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/ce_gp10b.h b/drivers/gpu/nvgpu/gp10b/ce_gp10b.h
new file mode 100644
index 00000000..7b747751
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/ce_gp10b.h
@@ -0,0 +1,33 @@
+/*
+ * Pascal GPU series Copy Engine.
+ *
+ * Copyright (c) 2011-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef __CE_GP10B_H__
+#define __CE_GP10B_H__
+#include "gk20a/channel_gk20a.h"
+#include "gk20a/tsg_gk20a.h"
+/*
+ * CE interrupt handler: reads ce_intr_status_r(inst_id) and writes back the
+ * blockpipe/launcherr pending bits it found set. @pri_base is unused by the
+ * gp10b implementation.
+ */
+void gp10b_ce_isr(struct gk20a *g, u32 inst_id, u32 pri_base);
+/*
+ * CE non-stalling interrupt handler: acknowledges a pending nonblockpipe
+ * interrupt and returns an OR of gk20a_nonstall_ops_* values, or 0 when
+ * nothing was pending. @pri_base is unused by the gp10b implementation.
+ */
+int gp10b_ce_nonstall_isr(struct gk20a *g, u32 inst_id, u32 pri_base);
+#endif /* __CE_GP10B_H__ */
diff --git a/drivers/gpu/nvgpu/gp10b/ecc_gp10b.h b/drivers/gpu/nvgpu/gp10b/ecc_gp10b.h
new file mode 100644
index 00000000..a4a6e35b
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/ecc_gp10b.h
@@ -0,0 +1,50 @@
+/*
+ * GP10B ECC
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _NVGPU_ECC_GP10B_H_
+#define _NVGPU_ECC_GP10B_H_
+/*
+ * The struct below embeds struct gk20a_ecc_stat by value, so that type must
+ * already be complete wherever this header is included; this forward
+ * declaration on its own is not sufficient to compile ecc_gr_t18x.
+ */
+struct gk20a_ecc_stat;
+/*
+ * ECC statistics kept for the GP10B graphics engine, one gk20a_ecc_stat per
+ * counter. Going by the field names the counters cover the SM LRF, SM shared
+ * memory (shm), texture pipes 0 and 1, and L2.
+ * NOTE(review): "sec"/"sed"/"ded" presumably stand for single-error-corrected,
+ * single-error-detected and double-error-detected - confirm against the code
+ * that updates these counters.
+ */
+struct ecc_gr_t18x {
+        struct gk20a_ecc_stat sm_lrf_single_err_count;
+        struct gk20a_ecc_stat sm_lrf_double_err_count;
+        struct gk20a_ecc_stat sm_shm_sec_count;
+        struct gk20a_ecc_stat sm_shm_sed_count;
+        struct gk20a_ecc_stat sm_shm_ded_count;
+        struct gk20a_ecc_stat tex_total_sec_pipe0_count;
+        struct gk20a_ecc_stat tex_total_ded_pipe0_count;
+        struct gk20a_ecc_stat tex_unique_sec_pipe0_count;
+        struct gk20a_ecc_stat tex_unique_ded_pipe0_count;
+        struct gk20a_ecc_stat tex_total_sec_pipe1_count;
+        struct gk20a_ecc_stat tex_total_ded_pipe1_count;
+        struct gk20a_ecc_stat tex_unique_sec_pipe1_count;
+        struct gk20a_ecc_stat tex_unique_ded_pipe1_count;
+        struct gk20a_ecc_stat l2_sec_count;
+        struct gk20a_ecc_stat l2_ded_count;
+};
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/fb_gp10b.c b/drivers/gpu/nvgpu/gp10b/fb_gp10b.c
new file mode 100644
index 00000000..9df4c851
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fb_gp10b.c
@@ -0,0 +1,36 @@
+/*
+ * GP10B FB
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "fb_gp10b.h"
+/* Report the GP10B compression page size: always SZ_64K; @g is not read. */
+unsigned int gp10b_fb_compression_page_size(struct gk20a *g)
+{
+        const unsigned int page_size = SZ_64K;
+        return page_size;
+}
+/* Report the GP10B compressible page size: always SZ_4K; @g is not read. */
+unsigned int gp10b_fb_compressible_page_size(struct gk20a *g)
+{
+        const unsigned int page_size = SZ_4K;
+        return page_size;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/fb_gp10b.h b/drivers/gpu/nvgpu/gp10b/fb_gp10b.h
new file mode 100644
index 00000000..52aa2a75
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fb_gp10b.h
@@ -0,0 +1,32 @@
+/*
+ * GP10B FB
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _NVGPU_GP10B_FB
+#define _NVGPU_GP10B_FB
+/* Only pointers to struct gk20a are used here, so a forward declaration suffices. */
+struct gk20a;
+/* Returns SZ_64K on GP10B; @g is not consulted. */
+unsigned int gp10b_fb_compression_page_size(struct gk20a *g);
+/* Returns SZ_4K on GP10B; @g is not consulted. */
+unsigned int gp10b_fb_compressible_page_size(struct gk20a *g);
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.c b/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.c
new file mode 100644
index 00000000..511d565a
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.c
@@ -0,0 +1,55 @@
+/*
+ * GP10B GPU FECS traces
+ *
+ * Copyright (c) 2016-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "gk20a/fecs_trace_gk20a.h"
+#include "fecs_trace_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_ctxsw_prog_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_gr_gp10b.h>
+#ifdef CONFIG_GK20A_CTXSW_TRACE
+/*
+ * Submit the FECS "write timestamp record" method.
+ *
+ * Builds a method op with a fully cleared mailbox (clr = ~0), completion
+ * condition GR_IS_UCODE_OP_NOT_EQUAL and no failure check
+ * (GR_IS_UCODE_OP_SKIP), and submits it through
+ * gr_gk20a_elpg_protected_call().
+ *
+ * Returns the result of the submit; a non-zero result is logged as an error.
+ */
+int gp10b_fecs_trace_flush(struct gk20a *g)
+{
+        int err;
+        struct fecs_method_op_gk20a op = {
+                .mailbox = {
+                        .id = 0,
+                        .data = 0,
+                        .clr = ~0,
+                        .ok = 0,
+                        .fail = 0,
+                },
+                .method = {
+                        .addr = gr_fecs_method_push_adr_write_timestamp_record_v(),
+                        .data = 0,
+                },
+                .cond = {
+                        .ok = GR_IS_UCODE_OP_NOT_EQUAL,
+                        .fail = GR_IS_UCODE_OP_SKIP,
+                },
+        };
+        gk20a_dbg(gpu_dbg_fn|gpu_dbg_ctxsw, "");
+        err = gr_gk20a_elpg_protected_call(g,
+                        gr_gk20a_submit_fecs_method_op(g, op, false));
+        if (err != 0)
+                nvgpu_err(g, "write timestamp record failed");
+        return err;
+}
+#endif /* CONFIG_GK20A_CTXSW_TRACE */
diff --git a/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.h b/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.h
new file mode 100644
index 00000000..f192617c
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fecs_trace_gp10b.h
@@ -0,0 +1,32 @@
+/*
+ * GP10B GPU FECS traces
+ *
+ * Copyright (c) 2016-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _NVGPU_FECS_TRACE_GP10B_H_
+#define _NVGPU_FECS_TRACE_GP10B_H_
+/* Only a pointer to struct gk20a is used here, so a forward declaration suffices. */
+struct gk20a;
+/*
+ * Submit the FECS "write timestamp record" method and return the result of
+ * the submit (non-zero is logged as a failure).
+ * NOTE: the definition in fecs_trace_gp10b.c is compiled only when
+ * CONFIG_GK20A_CTXSW_TRACE is defined, while this prototype is unconditional.
+ */
+int gp10b_fecs_trace_flush(struct gk20a *g);
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/fifo_gp10b.c b/drivers/gpu/nvgpu/gp10b/fifo_gp10b.c
new file mode 100644
index 00000000..1c9249d1
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fifo_gp10b.c
@@ -0,0 +1,320 @@
+/*
+ * GP10B fifo
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <uapi/linux/nvgpu.h>
+#include <nvgpu/dma.h>
+#include <nvgpu/bug.h>
+#include <nvgpu/log2.h>
+#include "fifo_gp10b.h"
+#include "gk20a/gk20a.h"
+#include "gm20b/fifo_gm20b.h"
+#include <nvgpu/hw/gp10b/hw_pbdma_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ccsr_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fifo_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ram_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_top_gp10b.h>
+/*
+ * Turn on the TEX and GCC fault-replay fields of the page directory base
+ * words stored in @mem.
+ *
+ * Each field is updated with its own read-modify-write; the TEX word is
+ * written back before the GCC word is read, so the sequence stays correct
+ * even if both fields live in the same word.
+ */
+static void gp10b_set_pdb_fault_replay_flags(struct gk20a *g,
+                                struct nvgpu_mem *mem)
+{
+        u32 tex_word;
+        u32 gcc_word;
+        gk20a_dbg_fn("");
+        /* TEX fault replay: clear the field, then set it to "true". */
+        tex_word = nvgpu_mem_rd32(g, mem,
+                        ram_in_page_dir_base_fault_replay_tex_w());
+        tex_word = (tex_word & ~ram_in_page_dir_base_fault_replay_tex_m()) |
+                ram_in_page_dir_base_fault_replay_tex_true_f();
+        nvgpu_mem_wr32(g, mem,
+                ram_in_page_dir_base_fault_replay_tex_w(), tex_word);
+        /* GCC fault replay: same treatment. */
+        gcc_word = nvgpu_mem_rd32(g, mem,
+                        ram_in_page_dir_base_fault_replay_gcc_w());
+        gcc_word = (gcc_word & ~ram_in_page_dir_base_fault_replay_gcc_m()) |
+                ram_in_page_dir_base_fault_replay_gcc_true_f();
+        nvgpu_mem_wr32(g, mem,
+                ram_in_page_dir_base_fault_replay_gcc_w(), gcc_word);
+        gk20a_dbg_fn("done");
+}
+/*
+ * Write channel @c's USERD address into the RAMFC area of its instance block.
+ *
+ * The low word holds c->userd_iova shifted right by ram_userd_base_shift_v(),
+ * combined with the aperture target chosen by nvgpu_aperture_mask() for
+ * g->fifo.userd; the high word holds the upper 32 bits of c->userd_iova.
+ *
+ * Always returns 0.
+ */
+int channel_gp10b_commit_userd(struct channel_gk20a *c)
+{
+        u32 addr_lo;
+        u32 addr_hi;
+        struct gk20a *g = c->g;
+        gk20a_dbg_fn("");
+        addr_lo = u64_lo32(c->userd_iova >> ram_userd_base_shift_v());
+        addr_hi = u64_hi32(c->userd_iova);
+        /*
+         * Zero-pad the address: a bare width of 16 pads with spaces, which
+         * leaves a gap between the "0x" prefix and the digits.
+         */
+        gk20a_dbg_info("channel %d : set ramfc userd 0x%016llx",
+                c->chid, (u64)c->userd_iova);
+        nvgpu_mem_wr32(g, &c->inst_block,
+                       ram_in_ramfc_w() + ram_fc_userd_w(),
+                       nvgpu_aperture_mask(g, &g->fifo.userd,
+                        pbdma_userd_target_sys_mem_ncoh_f(),
+                        pbdma_userd_target_vid_mem_f()) |
+                       pbdma_userd_addr_f(addr_lo));
+        nvgpu_mem_wr32(g, &c->inst_block,
+                       ram_in_ramfc_w() + ram_fc_userd_hi_w(),
+                       pbdma_userd_hi_addr_f(addr_hi));
+        return 0;
+}
+/*
+ * Program the RAMFC words of channel @c's instance block and then commit the
+ * USERD address.
+ *
+ * @c:               channel whose inst_block is written
+ * @gpfifo_base:     GPFIFO base; the low part (shifted right by
+ *                   pbdma_gp_base_rsvd_s()) and the upper 32 bits are written
+ *                   to the gp_base / gp_base_hi words
+ * @gpfifo_entries:  entry count; ilog2() of it goes into the limit2 field
+ *                   (NOTE(review): presumably a non-zero power of two -
+ *                   confirm against the caller)
+ * @acquire_timeout: converted by g->ops.fifo.pbdma_acquire_val() for the
+ *                   acquire word
+ * @flags:           when NVGPU_ALLOC_GPFIFO_FLAGS_REPLAYABLE_FAULTS_ENABLE is
+ *                   set, the TEX/GCC fault-replay bits are enabled
+ *
+ * Returns the result of channel_gp10b_commit_userd().
+ */
+int channel_gp10b_setup_ramfc(struct channel_gk20a *c,
+                        u64 gpfifo_base, u32 gpfifo_entries,
+                        unsigned long acquire_timeout, u32 flags)
+{
+        struct gk20a *g = c->g;
+        struct nvgpu_mem *mem = &c->inst_block;
+        gk20a_dbg_fn("");
+        /*
+         * NOTE(review): appears to zero ram_fc_size_val_v() bytes starting at
+         * offset 0 - confirm the nvgpu_memset() argument order.
+         */
+        nvgpu_memset(g, mem, 0, 0, ram_fc_size_val_v());
+        /* GPFIFO base (low and high words) and size. */
+        nvgpu_mem_wr32(g, mem, ram_fc_gp_base_w(),
+                pbdma_gp_base_offset_f(
+                u64_lo32(gpfifo_base >> pbdma_gp_base_rsvd_s())));
+        nvgpu_mem_wr32(g, mem, ram_fc_gp_base_hi_w(),
+                pbdma_gp_base_hi_offset_f(u64_hi32(gpfifo_base)) |
+                pbdma_gp_base_hi_limit2_f(ilog2(gpfifo_entries)));
+        /* Signature comes from the per-chip fifo op. */
+        nvgpu_mem_wr32(g, mem, ram_fc_signature_w(),
+                 c->g->ops.fifo.get_pbdma_signature(c->g));
+        nvgpu_mem_wr32(g, mem, ram_fc_formats_w(),
+                pbdma_formats_gp_fermi0_f() |
+                pbdma_formats_pb_fermi1_f() |
+                pbdma_formats_mp_fermi0_f());
+        nvgpu_mem_wr32(g, mem, ram_fc_pb_header_w(),
+                pbdma_pb_header_priv_user_f() |
+                pbdma_pb_header_method_zero_f() |
+                pbdma_pb_header_subchannel_zero_f() |
+                pbdma_pb_header_level_main_f() |
+                pbdma_pb_header_first_true_f() |
+                pbdma_pb_header_type_inc_f());
+        nvgpu_mem_wr32(g, mem, ram_fc_subdevice_w(),
+                pbdma_subdevice_id_f(1) |
+                pbdma_subdevice_status_active_f() |
+                pbdma_subdevice_channel_dma_enable_f());
+        nvgpu_mem_wr32(g, mem, ram_fc_target_w(), pbdma_target_engine_sw_f());
+        nvgpu_mem_wr32(g, mem, ram_fc_acquire_w(),
+                g->ops.fifo.pbdma_acquire_val(acquire_timeout));
+        nvgpu_mem_wr32(g, mem, ram_fc_runlist_timeslice_w(),
+                pbdma_runlist_timeslice_timeout_128_f() |
+                pbdma_runlist_timeslice_timescale_3_f() |
+                pbdma_runlist_timeslice_enable_true_f());
+        /* Replayable faults are opt-in through the allocation flags. */
+        if ( flags & NVGPU_ALLOC_GPFIFO_FLAGS_REPLAYABLE_FAULTS_ENABLE)
+                gp10b_set_pdb_fault_replay_flags(c->g, mem);
+        nvgpu_mem_wr32(g, mem, ram_fc_chid_w(), ram_fc_chid_id_f(c->chid));
+        if (c->is_privileged_channel) {
+                /* Set privilege level for channel */
+                nvgpu_mem_wr32(g, mem, ram_fc_config_w(),
+                        pbdma_config_auth_level_privileged_f());
+                gk20a_fifo_setup_ramfc_for_privileged_channel(c);
+        }
+        return channel_gp10b_commit_userd(c);
+}
+/*
+ * Build the PBDMA signature word: the GPU_LIT_GPFIFO_CLASS litter value
+ * OR-ed with pbdma_signature_sw_zero_f().
+ */
+u32 gp10b_fifo_get_pbdma_signature(struct gk20a *g)
+{
+        u32 signature = g->ops.get_litter_value(g, GPU_LIT_GPFIFO_CLASS);
+        signature |= pbdma_signature_sw_zero_f();
+        return signature;
+}
+/*
+ * Refresh the allowed-syncpoint word in channel @c's instance block.
+ *
+ * The currently stored syncpoint index is compared with the id reported by
+ * c->sync (when a sync object is present). If the new id is non-zero and
+ * differs, the channel is disabled and preempted, and the word is rewritten
+ * with the valid field set to 1 and the new index.
+ *
+ * gk20a_enable_channel_tsg() is called on every path, including when nothing
+ * was changed and the channel was never disabled here.
+ *
+ * Always returns 0; a failing preempt only triggers WARN_ON.
+ */
+int gp10b_fifo_resetup_ramfc(struct channel_gk20a *c)
+{
+        u32 new_syncpt = 0, old_syncpt;
+        u32 v;
+        gk20a_dbg_fn("");
+        /* Fetch the syncpoint index currently stored in the instance block. */
+        v = nvgpu_mem_rd32(c->g, &c->inst_block,
+                        ram_fc_allowed_syncpoints_w());
+        old_syncpt = pbdma_allowed_syncpoints_0_index_v(v);
+        if (c->sync)
+                new_syncpt = c->sync->syncpt_id(c->sync);
+        /* A new id of 0 is treated as "nothing to program". */
+        if (new_syncpt && new_syncpt != old_syncpt) {
+                /* disable channel */
+                gk20a_disable_channel_tsg(c->g, c);
+                /* preempt the channel */
+                WARN_ON(gk20a_fifo_preempt(c->g, c));
+                v = pbdma_allowed_syncpoints_0_valid_f(1);
+                gk20a_dbg_info("Channel %d, syncpt id %d\n",
+                                c->chid, new_syncpt);
+                v |= pbdma_allowed_syncpoints_0_index_f(new_syncpt);
+                nvgpu_mem_wr32(c->g, &c->inst_block,
+                                ram_fc_allowed_syncpoints_w(), v);
+        }
+        /* enable channel */
+        gk20a_enable_channel_tsg(c->g, c);
+        gk20a_dbg_fn("done");
+        return 0;
+}
+/*
+ * Translate a device-info engine type into a driver engine enum.
+ *
+ * Returns ENGINE_GR_GK20A for the graphics type, ENGINE_ASYNC_CE_GK20A for
+ * the LCE type and ENGINE_INVAL_GK20A for anything else. @inst_id is not
+ * used.
+ */
+int gp10b_fifo_engine_enum_from_type(struct gk20a *g, u32 engine_type,
+                                        u32 *inst_id)
+{
+        gk20a_dbg_info("engine type %d", engine_type);
+        if (engine_type == top_device_info_type_enum_graphics_v())
+                return ENGINE_GR_GK20A;
+        /* Default assumptions - all the CE engine have separate runlist */
+        if (engine_type == top_device_info_type_enum_lce_v())
+                return ENGINE_ASYNC_CE_GK20A;
+        return ENGINE_INVAL_GK20A;
+}
+/*
+ * Decode a device-info "data" table entry.
+ *
+ * Only entries of type enum2 are understood; any other type is reported
+ * through nvgpu_err() and no output is touched. Each output pointer is
+ * optional (may be NULL):
+ *   @inst_id:  receives the instance id field
+ *   @pri_base: receives the pri_base field shifted left by its alignment
+ *   @fault_id: written only when the entry marks its fault id as valid, using
+ *              g->ops.fifo.device_info_fault_id()
+ */
+void gp10b_device_info_data_parse(struct gk20a *g, u32 table_entry,
+                                u32 *inst_id, u32 *pri_base, u32 *fault_id)
+{
+        if (top_device_info_data_type_v(table_entry) !=
+            top_device_info_data_type_enum2_v()) {
+                nvgpu_err(g, "unknown device_info_data %d",
+                        top_device_info_data_type_v(table_entry));
+                return;
+        }
+        if (inst_id != NULL)
+                *inst_id = top_device_info_data_inst_id_v(table_entry);
+        if (pri_base != NULL) {
+                *pri_base =
+                    (top_device_info_data_pri_base_v(table_entry)
+                    << top_device_info_data_pri_base_align_v());
+                gk20a_dbg_info("device info: pri_base: %d", *pri_base);
+        }
+        if (fault_id == NULL)
+                return;
+        if (top_device_info_data_fault_id_v(table_entry) !=
+            top_device_info_data_fault_id_valid_v())
+                return;
+        *fault_id = g->ops.fifo.device_info_fault_id(table_entry);
+        gk20a_dbg_info("device info: fault_id: %d", *fault_id);
+}
+/*
+ * Fill in the three PBDMA intr_0 classification masks of @f:
+ * device_fatal_0, channel_fatal_0 and restartable_0.
+ */
+void gp10b_fifo_init_pbdma_intr_descs(struct fifo_gk20a *f)
+{
+        u32 device_fatal;
+        u32 channel_fatal;
+        /*
+         * Device-fatal: errors that indicate something is really wrong in
+         * the device itself.
+         */
+        device_fatal = pbdma_intr_0_memreq_pending_f();
+        device_fatal |= pbdma_intr_0_memack_timeout_pending_f();
+        device_fatal |= pbdma_intr_0_memack_extra_pending_f();
+        device_fatal |= pbdma_intr_0_memdat_timeout_pending_f();
+        device_fatal |= pbdma_intr_0_memdat_extra_pending_f();
+        device_fatal |= pbdma_intr_0_memflush_pending_f();
+        device_fatal |= pbdma_intr_0_memop_pending_f();
+        device_fatal |= pbdma_intr_0_lbconnect_pending_f();
+        device_fatal |= pbdma_intr_0_lback_timeout_pending_f();
+        device_fatal |= pbdma_intr_0_lback_extra_pending_f();
+        device_fatal |= pbdma_intr_0_lbdat_timeout_pending_f();
+        device_fatal |= pbdma_intr_0_lbdat_extra_pending_f();
+        device_fatal |= pbdma_intr_0_pri_pending_f();
+        f->intr.pbdma.device_fatal_0 = device_fatal;
+        /*
+         * Channel-fatal: data parsing, framing or similar errors that can be
+         * recovered from with intervention, or by simply resetting the
+         * channel.
+         */
+        channel_fatal = pbdma_intr_0_gpfifo_pending_f();
+        channel_fatal |= pbdma_intr_0_gpptr_pending_f();
+        channel_fatal |= pbdma_intr_0_gpentry_pending_f();
+        channel_fatal |= pbdma_intr_0_gpcrc_pending_f();
+        channel_fatal |= pbdma_intr_0_pbptr_pending_f();
+        channel_fatal |= pbdma_intr_0_pbentry_pending_f();
+        channel_fatal |= pbdma_intr_0_pbcrc_pending_f();
+        channel_fatal |= pbdma_intr_0_method_pending_f();
+        channel_fatal |= pbdma_intr_0_methodcrc_pending_f();
+        channel_fatal |= pbdma_intr_0_pbseg_pending_f();
+        channel_fatal |= pbdma_intr_0_syncpoint_illegal_pending_f();
+        channel_fatal |= pbdma_intr_0_signature_pending_f();
+        f->intr.pbdma.channel_fatal_0 = channel_fatal;
+        /* Restartable: used for sw-methods, or a recoverable timeout. */
+        f->intr.pbdma.restartable_0 = pbdma_intr_0_device_pending_f();
+}
+/*
+ * Read the MMU fault registers for @mmu_fault_id into @mmfault.
+ *
+ * @mmfault is zeroed first, then filled with the fault type, access type,
+ * client type and client id from the fault-info register, the 64-bit fault
+ * address assembled from the lo/hi registers, and the instance pointer
+ * (shifted left by its alignment). The aperture of the instance pointer is
+ * not recorded.
+ */
+void gp10b_fifo_get_mmu_fault_info(struct gk20a *g, u32 mmu_fault_id,
+        struct mmu_fault_info *mmfault)
+{
+        u32 info_reg;
+        u32 inst_reg;
+        u32 fault_lo, fault_hi;
+        gk20a_dbg_fn("mmu_fault_id %d", mmu_fault_id);
+        memset(mmfault, 0, sizeof(*mmfault));
+        /* Decode the fault-info register field by field. */
+        info_reg = gk20a_readl(g, fifo_intr_mmu_fault_info_r(mmu_fault_id));
+        mmfault->fault_type = fifo_intr_mmu_fault_info_type_v(info_reg);
+        mmfault->access_type =
+                fifo_intr_mmu_fault_info_access_type_v(info_reg);
+        mmfault->client_type =
+                fifo_intr_mmu_fault_info_client_type_v(info_reg);
+        mmfault->client_id = fifo_intr_mmu_fault_info_client_v(info_reg);
+        /* Faulting address: low word is read before the high word. */
+        fault_lo = gk20a_readl(g, fifo_intr_mmu_fault_lo_r(mmu_fault_id));
+        fault_hi = gk20a_readl(g, fifo_intr_mmu_fault_hi_r(mmu_fault_id));
+        mmfault->fault_addr = hi32_lo32_to_u64(fault_hi, fault_lo);
+        /* note:ignoring aperture */
+        inst_reg = gk20a_readl(g, fifo_intr_mmu_fault_inst_r(mmu_fault_id));
+        mmfault->inst_ptr = fifo_intr_mmu_fault_inst_ptr_v(inst_reg);
+        /* note: inst_ptr is a 40b phys addr.  */
+        mmfault->inst_ptr <<= fifo_intr_mmu_fault_inst_ptr_align_shift_v();
+}
diff --git a/drivers/gpu/nvgpu/gp10b/fifo_gp10b.h b/drivers/gpu/nvgpu/gp10b/fifo_gp10b.h
new file mode 100644
index 00000000..20918483
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/fifo_gp10b.h
@@ -0,0 +1,47 @@
+/*
+ * GP10B Fifo
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef FIFO_GP10B_H
+#define FIFO_GP10B_H
+/*
+ * Forward declarations: only pointers to these types appear below.
+ * struct gk20a must be declared here as well; otherwise the prototypes that
+ * take "struct gk20a *" would each introduce a prototype-scoped struct
+ * unless an earlier include happened to declare it.
+ */
+struct gk20a;
+struct gpu_ops;
+struct channel_gk20a;
+struct fifo_gk20a;
+struct mmu_fault_info;
+/* Program the RAMFC words of @c's instance block, then commit USERD. */
+int channel_gp10b_setup_ramfc(struct channel_gk20a *c,
+                        u64 gpfifo_base, u32 gpfifo_entries,
+                        unsigned long acquire_timeout, u32 flags);
+/* GPFIFO class litter value OR-ed with pbdma_signature_sw_zero_f(). */
+u32 gp10b_fifo_get_pbdma_signature(struct gk20a *g);
+/* Rewrite the allowed-syncpoint word if the channel's syncpoint id changed. */
+int gp10b_fifo_resetup_ramfc(struct channel_gk20a *c);
+/* Map a device-info engine type to ENGINE_*_GK20A (ENGINE_INVAL_GK20A if unknown). */
+int gp10b_fifo_engine_enum_from_type(struct gk20a *g, u32 engine_type,
+                                        u32 *inst_id);
+/* Decode an enum2 device-info data entry; each output pointer may be NULL. */
+void gp10b_device_info_data_parse(struct gk20a *g, u32 table_entry,
+                                u32 *inst_id, u32 *pri_base, u32 *fault_id);
+/* Fill the device-fatal, channel-fatal and restartable PBDMA intr_0 masks. */
+void gp10b_fifo_init_pbdma_intr_descs(struct fifo_gk20a *f);
+/* Read the MMU fault registers for @mmu_fault_id into @mmfault. */
+void gp10b_fifo_get_mmu_fault_info(struct gk20a *g, u32 mmu_fault_id,
+        struct mmu_fault_info *mmfault);
+/* Write @c's USERD address into its instance block; always returns 0. */
+int channel_gp10b_commit_userd(struct channel_gk20a *c);
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/gp10b.c b/drivers/gpu/nvgpu/gp10b/gp10b.c
new file mode 100644
index 00000000..51dc4301
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gp10b.c
@@ -0,0 +1,120 @@
+/*
+ * GP10B Graphics
+ *
+ * Copyright (c) 2016-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include <nvgpu/enabled.h>
+#include "gp10b.h"
+#include <nvgpu/hw/gp10b/hw_fuse_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_gr_gp10b.h>
+/*
+ * Record, as NVGPU_ECC_ENABLED_* flags on g, which units have ECC enabled.
+ *
+ * g: GPU instance whose registers are read and whose flags are updated.
+ *
+ * Three registers are sampled up front: fuse_opt_ecc_en,
+ * fuse_opt_feature_fuses_override_disable and gr_fecs_feature_override_ecc.
+ *
+ * - Override-disable fuse non-zero: fuse_opt_ecc_en alone decides for all
+ *   four units (SM LRF, SM SHM, TEX, LTC).
+ * - Otherwise: a unit whose *_override field is set in the FECS register
+ *   takes that register's value for the unit; a unit without an override
+ *   falls back to fuse_opt_ecc_en.
+ *
+ * Flags are only ever set to true here; nothing is cleared.
+ */
+static void gp10b_detect_ecc_enabled_units(struct gk20a *g)
+{
+        /* Register reads are issued as: ecc_en, override_disable, FECS. */
+        u32 ecc_fuse = gk20a_readl(g, fuse_opt_ecc_en_r());
+        u32 overrides_disabled =
+                gk20a_readl(g, fuse_opt_feature_fuses_override_disable_r());
+        u32 fecs = gk20a_readl(g, gr_fecs_feature_override_ecc_r());
+        bool lrf_on;
+        bool shm_on;
+        bool tex_on;
+        bool ltc_on;
+
+        if (overrides_disabled) {
+                /* The fuse alone decides for every unit. */
+                lrf_on = ecc_fuse != 0;
+                shm_on = lrf_on;
+                tex_on = lrf_on;
+                ltc_on = lrf_on;
+        } else {
+                /* Per unit: the FECS value when overridden, else the fuse. */
+
+                /* SM LRF */
+                lrf_on = gr_fecs_feature_override_ecc_sm_lrf_override_v(fecs)
+                        ? gr_fecs_feature_override_ecc_sm_lrf_v(fecs) != 0
+                        : ecc_fuse != 0;
+
+                /* SM SHM */
+                shm_on = gr_fecs_feature_override_ecc_sm_shm_override_v(fecs)
+                        ? gr_fecs_feature_override_ecc_sm_shm_v(fecs) != 0
+                        : ecc_fuse != 0;
+
+                /* TEX */
+                tex_on = gr_fecs_feature_override_ecc_tex_override_v(fecs)
+                        ? gr_fecs_feature_override_ecc_tex_v(fecs) != 0
+                        : ecc_fuse != 0;
+
+                /* LTC */
+                ltc_on = gr_fecs_feature_override_ecc_ltc_override_v(fecs)
+                        ? gr_fecs_feature_override_ecc_ltc_v(fecs) != 0
+                        : ecc_fuse != 0;
+        }
+
+        /* Set the flags in a fixed order: SM LRF, SM SHM, TEX, LTC. */
+        if (lrf_on) {
+                __nvgpu_set_enabled(g, NVGPU_ECC_ENABLED_SM_LRF, true);
+        }
+
+        if (shm_on) {
+                __nvgpu_set_enabled(g, NVGPU_ECC_ENABLED_SM_SHM, true);
+        }
+
+        if (tex_on) {
+                __nvgpu_set_enabled(g, NVGPU_ECC_ENABLED_TEX, true);
+        }
+
+        if (ltc_on) {
+                __nvgpu_set_enabled(g, NVGPU_ECC_ENABLED_LTC, true);
+        }
+}
+int gp10b_init_gpu_characteristics(struct gk20a *g)
+{
+        gk20a_init_gpu_characteristics(g); /* result, if any, is not checked */
+        gp10b_detect_ecc_enabled_units(g); /* sets NVGPU_ECC_ENABLED_* flags */
+        __nvgpu_set_enabled(g, NVGPU_SUPPORT_RESCHEDULE_RUNLIST, true);
+        return 0; /* unconditional: no callee outcome is propagated */
+}
diff --git a/drivers/gpu/nvgpu/gp10b/gp10b.h b/drivers/gpu/nvgpu/gp10b/gp10b.h
new file mode 100644
index 00000000..cd850a07
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gp10b.h
@@ -0,0 +1,32 @@
+/*
+ * GP10B Graphics
+ *
+ * Copyright (c) 2016, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef GP10B_H
+#define GP10B_H
+#include "gk20a/gk20a.h"
+int gp10b_init_gpu_characteristics(struct gk20a *g); /* defined in gp10b.c */
+#endif /* GP10B_H */
diff --git a/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.c b/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.c
new file mode 100644
index 00000000..456f3fa0
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.c
@@ -0,0 +1,741 @@
+/*
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ *
+ * This file is autogenerated.  Do not edit.
+ */
+#ifndef __gp10b_gating_reglist_h__
+#define __gp10b_gating_reglist_h__
+#include "gp10b_gating_reglist.h"
+#include <nvgpu/enabled.h>
+struct gating_desc {
+        u32 addr;       /* register address handed to gk20a_writel() */
+        u32 prod;       /* value written when a loader is called with prod true */
+        u32 disable;    /* value written when a loader is called with prod false */
+};
+/* slcg bus: register rows for gp10b_slcg_bus_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_bus[] = {
+        {.addr = 0x00001c04, .prod = 0x00000000, .disable = 0x000003fe},
+};
+/* slcg ce2: register rows for gp10b_slcg_ce2_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_ce2[] = {
+        {.addr = 0x00104204, .prod = 0x00000000, .disable = 0x000007fe},
+};
+/* slcg chiplet: register rows for gp10b_slcg_chiplet_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_chiplet[] = {
+        {.addr = 0x0010c07c, .prod = 0x00000000, .disable = 0x00000007},
+        {.addr = 0x0010e07c, .prod = 0x00000000, .disable = 0x00000007},
+        {.addr = 0x0010d07c, .prod = 0x00000000, .disable = 0x00000007},
+        {.addr = 0x0010e17c, .prod = 0x00000000, .disable = 0x00000007},
+};
+/* slcg fb: register rows for gp10b_slcg_fb_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_fb[] = {
+        {.addr = 0x00100d14, .prod = 0x00000000, .disable = 0xfffffffe},
+        {.addr = 0x00100c9c, .prod = 0x00000000, .disable = 0x000001fe},
+};
+/* slcg fifo: register rows for gp10b_slcg_fifo_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_fifo[] = {
+        {.addr = 0x000026ac, .prod = 0x00000f40, .disable = 0x0001fffe},
+};
+/* slcg gr: register rows for gr_gp10b_slcg_gr_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_gr[] = {
+        {.addr = 0x004041f4, .prod = 0x00000002, .disable = 0x03fffffe},
+        {.addr = 0x0040917c, .prod = 0x00020008, .disable = 0x0003fffe},
+        {.addr = 0x00409894, .prod = 0x00000040, .disable = 0x03fffffe},
+        {.addr = 0x004078c4, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00406004, .prod = 0x00000200, .disable = 0x0001fffe},
+        {.addr = 0x00405864, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00405910, .prod = 0xfffffff0, .disable = 0xfffffffe},
+        {.addr = 0x00408044, .prod = 0x00000000, .disable = 0x000007fe},
+        {.addr = 0x00407004, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x0041a17c, .prod = 0x00020008, .disable = 0x0003fffe},
+        {.addr = 0x0041a894, .prod = 0x00000040, .disable = 0x03fffffe},
+        {.addr = 0x00418504, .prod = 0x00000000, .disable = 0x0007fffe},
+        {.addr = 0x0041860c, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x0041868c, .prod = 0x00000000, .disable = 0x0000001e},
+        {.addr = 0x0041871c, .prod = 0x00000000, .disable = 0x0000003e},
+        {.addr = 0x00418388, .prod = 0x00000000, .disable = 0x00000001},
+        {.addr = 0x0041882c, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x00418bc0, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00418974, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x00418c74, .prod = 0xffffffc0, .disable = 0xfffffffe},
+        {.addr = 0x00418cf4, .prod = 0xfffffffc, .disable = 0xfffffffe},
+        {.addr = 0x00418d74, .prod = 0xffffffe0, .disable = 0xfffffffe},
+        {.addr = 0x00418f10, .prod = 0xffffffe0, .disable = 0xfffffffe},
+        {.addr = 0x00418e10, .prod = 0xfffffffe, .disable = 0xfffffffe},
+        {.addr = 0x00419024, .prod = 0x000001fe, .disable = 0x000001fe},
+        {.addr = 0x0041889c, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00419d24, .prod = 0x00000000, .disable = 0x0000ffff},
+        {.addr = 0x00419a44, .prod = 0x00000000, .disable = 0x0000000e},
+        {.addr = 0x00419a4c, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00419a54, .prod = 0x00000000, .disable = 0x0000003e},
+        {.addr = 0x00419a5c, .prod = 0x00000000, .disable = 0x0000000e},
+        {.addr = 0x00419a64, .prod = 0x00000000, .disable = 0x000001fe},
+        {.addr = 0x00419a6c, .prod = 0x00000000, .disable = 0x0000000e},
+        {.addr = 0x00419a74, .prod = 0x00000000, .disable = 0x0000000e},
+        {.addr = 0x00419a7c, .prod = 0x00000000, .disable = 0x0000003e},
+        {.addr = 0x00419a84, .prod = 0x00000000, .disable = 0x0000000e},
+        {.addr = 0x0041986c, .prod = 0x00000104, .disable = 0x00fffffe},
+        {.addr = 0x00419cd8, .prod = 0x00000000, .disable = 0x001ffffe},
+        {.addr = 0x00419ce0, .prod = 0x00000000, .disable = 0x001ffffe},
+        {.addr = 0x00419c74, .prod = 0x0000001e, .disable = 0x0000001e},
+        {.addr = 0x00419fd4, .prod = 0x00000000, .disable = 0x0003fffe},
+        {.addr = 0x00419fdc, .prod = 0xffedff00, .disable = 0xfffffffe},
+        {.addr = 0x00419fe4, .prod = 0x00001b00, .disable = 0x00001ffe},
+        {.addr = 0x00419ff4, .prod = 0x00000000, .disable = 0x00003ffe},
+        {.addr = 0x00419ffc, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x0041be2c, .prod = 0x04115fc0, .disable = 0xfffffffe},
+        {.addr = 0x0041bfec, .prod = 0xfffffff0, .disable = 0xfffffffe},
+        {.addr = 0x0041bed4, .prod = 0xfffffff8, .disable = 0xfffffffe},
+        {.addr = 0x00408814, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x00408a84, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x004089ac, .prod = 0x00000000, .disable = 0x0001fffe},
+        {.addr = 0x00408a24, .prod = 0x00000000, .disable = 0x0000ffff},
+};
+/* slcg ltc: register rows for ltc_gp10b_slcg_ltc_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_ltc[] = {
+        {.addr = 0x0017e050, .prod = 0x00000000, .disable = 0xfffffffe},
+        {.addr = 0x0017e35c, .prod = 0x00000000, .disable = 0xfffffffe},
+};
+/* slcg perf: register rows for gp10b_slcg_perf_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_perf[] = {
+        {.addr = 0x001be018, .prod = 0x000001ff, .disable = 0x00000000},
+        {.addr = 0x001bc018, .prod = 0x000001ff, .disable = 0x00000000},
+        {.addr = 0x001b8018, .prod = 0x000001ff, .disable = 0x00000000},
+        {.addr = 0x001b4124, .prod = 0x00000001, .disable = 0x00000000},
+};
+/* slcg PriRing: register rows for gp10b_slcg_priring_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_priring[] = {
+        {.addr = 0x001200a8, .prod = 0x00000000, .disable = 0x00000001},
+};
+/* slcg pwr_csb: register rows for gp10b_slcg_pwr_csb_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_pwr_csb[] = {
+        {.addr = 0x00000134, .prod = 0x00020008, .disable = 0x0003fffe},
+        {.addr = 0x00000e74, .prod = 0x00000000, .disable = 0x0000000f},
+        {.addr = 0x00000a74, .prod = 0x00004000, .disable = 0x00007ffe},
+        {.addr = 0x000016b8, .prod = 0x00000000, .disable = 0x0000000f},
+};
+/* slcg pmu: register rows for gp10b_slcg_pmu_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_pmu[] = {
+        {.addr = 0x0010a134, .prod = 0x00020008, .disable = 0x0003fffe},
+        {.addr = 0x0010aa74, .prod = 0x00004000, .disable = 0x00007ffe},
+        {.addr = 0x0010ae74, .prod = 0x00000000, .disable = 0x0000000f},
+};
+/* slcg therm: register rows for gp10b_slcg_therm_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_therm[] = {
+        {.addr = 0x000206b8, .prod = 0x00000000, .disable = 0x0000000f},
+};
+/* slcg Xbar: register rows for gp10b_slcg_xbar_load_gating_prod() */
+static const struct gating_desc gp10b_slcg_xbar[] = {
+        {.addr = 0x0013cbe4, .prod = 0x00000000, .disable = 0x1ffffffe},
+        {.addr = 0x0013cc04, .prod = 0x00000000, .disable = 0x1ffffffe},
+};
+/* blcg bus: register rows for gp10b_blcg_bus_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_bus[] = {
+        {.addr = 0x00001c00, .prod = 0x00000042, .disable = 0x00000000},
+};
+/* blcg ce: register rows for gp10b_blcg_ce_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_ce[] = {
+        {.addr = 0x00104200, .prod = 0x00008242, .disable = 0x00000000},
+};
+/* blcg ctxsw prog: no entries, so the loader loop over it never writes */
+static const struct gating_desc gp10b_blcg_ctxsw_prog[] = {
+};
+/* blcg fb: register rows for gp10b_blcg_fb_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_fb[] = {
+        {.addr = 0x00100d10, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00100d30, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00100d3c, .prod = 0x00000242, .disable = 0x00000000},
+        {.addr = 0x00100d48, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00100c98, .prod = 0x00004242, .disable = 0x00000000},
+};
+/* blcg fifo: register rows for gp10b_blcg_fifo_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_fifo[] = {
+        {.addr = 0x000026a4, .prod = 0x0000c242, .disable = 0x00000000},
+};
+/* blcg gr: register rows for gp10b_blcg_gr_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_gr[] = {
+        {.addr = 0x004041f0, .prod = 0x0000c646, .disable = 0x00000000},
+        {.addr = 0x00409890, .prod = 0x0000007f, .disable = 0x00000000},
+        {.addr = 0x004098b0, .prod = 0x0000007f, .disable = 0x00000000},
+        {.addr = 0x004078c0, .prod = 0x00004242, .disable = 0x00000000},
+        {.addr = 0x00406000, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00405860, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x0040590c, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00408040, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00407000, .prod = 0x4000c242, .disable = 0x00000000},
+        {.addr = 0x00405bf0, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x0041a890, .prod = 0x0000427f, .disable = 0x00000000},
+        {.addr = 0x0041a8b0, .prod = 0x0000007f, .disable = 0x00000000},
+        {.addr = 0x00418500, .prod = 0x0000c244, .disable = 0x00000000},
+        {.addr = 0x00418608, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00418688, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00418718, .prod = 0x00000042, .disable = 0x00000000},
+        {.addr = 0x00418828, .prod = 0x00008444, .disable = 0x00000000},
+        {.addr = 0x00418bbc, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00418970, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00418c70, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00418cf0, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00418d70, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00418f0c, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00418e0c, .prod = 0x00008444, .disable = 0x00000000},
+        {.addr = 0x00419020, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419038, .prod = 0x00000042, .disable = 0x00000000},
+        {.addr = 0x00418898, .prod = 0x00004242, .disable = 0x00000000},
+        {.addr = 0x00419a40, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a48, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a50, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a58, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a60, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a68, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a70, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a78, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419a80, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00419868, .prod = 0x00008242, .disable = 0x00000000},
+        {.addr = 0x00419cd4, .prod = 0x00000002, .disable = 0x00000000},
+        {.addr = 0x00419cdc, .prod = 0x00000002, .disable = 0x00000000},
+        {.addr = 0x00419c70, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00419fd0, .prod = 0x0000c044, .disable = 0x00000000},
+        {.addr = 0x00419fd8, .prod = 0x0000c046, .disable = 0x00000000},
+        {.addr = 0x00419fe0, .prod = 0x0000c044, .disable = 0x00000000},
+        {.addr = 0x00419fe8, .prod = 0x0000c042, .disable = 0x00000000},
+        {.addr = 0x00419ff0, .prod = 0x0000c045, .disable = 0x00000000},
+        {.addr = 0x00419ff8, .prod = 0x00000002, .disable = 0x00000000},
+        {.addr = 0x00419f90, .prod = 0x00000002, .disable = 0x00000000},
+        {.addr = 0x0041be28, .prod = 0x00008242, .disable = 0x00000000},
+        {.addr = 0x0041bfe8, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x0041bed0, .prod = 0x0000c444, .disable = 0x00000000},
+        {.addr = 0x00408810, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x00408a80, .prod = 0x0000c242, .disable = 0x00000000},
+        {.addr = 0x004089a8, .prod = 0x0000c242, .disable = 0x00000000},
+};
+/* blcg ltc: register rows for gp10b_blcg_ltc_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_ltc[] = {
+        {.addr = 0x0017e030, .prod = 0x00000044, .disable = 0x00000000},
+        {.addr = 0x0017e040, .prod = 0x00000044, .disable = 0x00000000},
+        {.addr = 0x0017e3e0, .prod = 0x00000044, .disable = 0x00000000},
+        {.addr = 0x0017e3c8, .prod = 0x00000044, .disable = 0x00000000},
+};
+/* blcg pwr_csb: register rows for gp10b_blcg_pwr_csb_load_gating_prod() */
+static const struct gating_desc gp10b_blcg_pwr_csb[] = {
+        {.addr = 0x00000a70, .prod = 0x00000045, .disable = 0x00000000},
+};
+/* blcg pmu: one {addr, prod, disable} register row */
+static const struct gating_desc gp10b_blcg_pmu[] = {
+        {.addr = 0x0010aa70, .prod = 0x00000045, .disable = 0x00000000},
+};
+/* blcg Xbar: two {addr, prod, disable} register rows */
+static const struct gating_desc gp10b_blcg_xbar[] = {
+        {.addr = 0x0013cbe0, .prod = 0x00000042, .disable = 0x00000000},
+        {.addr = 0x0013cc00, .prod = 0x00000042, .disable = 0x00000000},
+};
+/* pg gr: table with no entries */
+static const struct gating_desc gp10b_pg_gr[] = {
+};
+/* gating load functions (none of them is declared inline) */
+/* Write .prod (prod true) or .disable to every gp10b_slcg_bus register. */
+void gp10b_slcg_bus_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_bus;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_bus) / sizeof(gp10b_slcg_bus[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_ce2 register. */
+void gp10b_slcg_ce2_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_ce2;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_ce2) / sizeof(gp10b_slcg_ce2[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_chiplet register. */
+void gp10b_slcg_chiplet_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_chiplet;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_chiplet) / sizeof(gp10b_slcg_chiplet[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+void gp10b_slcg_ctxsw_firmware_load_gating_prod(struct gk20a *g,
+        bool prod)
+{       /* no-op: g and prod are ignored and no register is written */
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_fb register. */
+void gp10b_slcg_fb_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_fb;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_fb) / sizeof(gp10b_slcg_fb[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_fifo register. */
+void gp10b_slcg_fifo_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_fifo;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_fifo) / sizeof(gp10b_slcg_fifo[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_gr register. */
+void gr_gp10b_slcg_gr_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_gr;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_gr) / sizeof(gp10b_slcg_gr[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_ltc register. */
+void ltc_gp10b_slcg_ltc_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_ltc;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_ltc) / sizeof(gp10b_slcg_ltc[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_perf register. */
+void gp10b_slcg_perf_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_perf;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_perf) / sizeof(gp10b_slcg_perf[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_priring register. */
+void gp10b_slcg_priring_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_priring;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_priring) / sizeof(gp10b_slcg_priring[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_pwr_csb register. */
+void gp10b_slcg_pwr_csb_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_pwr_csb;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_pwr_csb) / sizeof(gp10b_slcg_pwr_csb[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_pmu register. */
+void gp10b_slcg_pmu_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_pmu;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_pmu) / sizeof(gp10b_slcg_pmu[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_therm register. */
+void gp10b_slcg_therm_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_therm;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_therm) / sizeof(gp10b_slcg_therm[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_slcg_xbar register. */
+void gp10b_slcg_xbar_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_slcg_xbar;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_slcg_xbar) / sizeof(gp10b_slcg_xbar[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_SLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_SLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_blcg_bus register. */
+void gp10b_blcg_bus_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_blcg_bus;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_blcg_bus) / sizeof(gp10b_blcg_bus[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_BLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_blcg_ce register. */
+void gp10b_blcg_ce_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_blcg_ce;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_blcg_ce) / sizeof(gp10b_blcg_ce[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_BLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_blcg_ctxsw_prog register. */
+void gp10b_blcg_ctxsw_firmware_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_blcg_ctxsw_prog;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_blcg_ctxsw_prog) / sizeof(gp10b_blcg_ctxsw_prog[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_BLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_blcg_fb register. */
+void gp10b_blcg_fb_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_blcg_fb;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_blcg_fb) / sizeof(gp10b_blcg_fb[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_BLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/* Write .prod (prod true) or .disable to every gp10b_blcg_fifo register. */
+void gp10b_blcg_fifo_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const struct gating_desc *entry = gp10b_blcg_fifo;
+        const struct gating_desc *const end = entry +
+                sizeof(gp10b_blcg_fifo) / sizeof(gp10b_blcg_fifo[0]);
+
+        /* No register is touched unless NVGPU_GPU_CAN_BLCG is enabled on g. */
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+
+        for (; entry != end; entry++)
+                gk20a_writel(g, entry->addr,
+                        prod ? entry->prod : entry->disable);
+}
+/*
+ * Program every register listed in gp10b_blcg_gr.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ */
+void gp10b_blcg_gr_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count = sizeof(gp10b_blcg_gr) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_blcg_gr[idx].addr,
+                        prod ? gp10b_blcg_gr[idx].prod :
+                               gp10b_blcg_gr[idx].disable);
+}
+/*
+ * Program every register listed in gp10b_blcg_ltc.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ */
+void gp10b_blcg_ltc_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count = sizeof(gp10b_blcg_ltc) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_blcg_ltc[idx].addr,
+                        prod ? gp10b_blcg_ltc[idx].prod :
+                               gp10b_blcg_ltc[idx].disable);
+}
+/*
+ * Program every register listed in gp10b_blcg_pwr_csb.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ */
+void gp10b_blcg_pwr_csb_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count =
+                sizeof(gp10b_blcg_pwr_csb) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_blcg_pwr_csb[idx].addr,
+                        prod ? gp10b_blcg_pwr_csb[idx].prod :
+                               gp10b_blcg_pwr_csb[idx].disable);
+}
+/*
+ * Program every register listed in gp10b_blcg_pmu.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ */
+void gp10b_blcg_pmu_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count = sizeof(gp10b_blcg_pmu) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_blcg_pmu[idx].addr,
+                        prod ? gp10b_blcg_pmu[idx].prod :
+                               gp10b_blcg_pmu[idx].disable);
+}
+/*
+ * Program every register listed in gp10b_blcg_xbar.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ */
+void gp10b_blcg_xbar_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count = sizeof(gp10b_blcg_xbar) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_blcg_xbar[idx].addr,
+                        prod ? gp10b_blcg_xbar[idx].prod :
+                               gp10b_blcg_xbar[idx].disable);
+}
+/*
+ * Program every register listed in gp10b_pg_gr.
+ *
+ * Returns without touching hardware unless NVGPU_GPU_CAN_BLCG is enabled
+ * for @g. Otherwise each entry's address is written with the entry's prod
+ * value when @prod is true, or with its disable value when @prod is false.
+ *
+ * NOTE(review): this "pg" list is gated on the same NVGPU_GPU_CAN_BLCG flag
+ * as the blcg lists - confirm that this is the intended flag.
+ */
+void gr_gp10b_pg_gr_load_gating_prod(struct gk20a *g,
+        bool prod)
+{
+        const u32 count = sizeof(gp10b_pg_gr) / sizeof(struct gating_desc);
+        u32 idx;
+        if (!nvgpu_is_enabled(g, NVGPU_GPU_CAN_BLCG))
+                return;
+        for (idx = 0; idx < count; idx++)
+                gk20a_writel(g, gp10b_pg_gr[idx].addr,
+                        prod ? gp10b_pg_gr[idx].prod :
+                               gp10b_pg_gr[idx].disable);
+}
+#endif /* __gp10b_gating_reglist_h__ */
diff --git a/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.h b/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.h
new file mode 100644
index 00000000..7dbc6cac
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gp10b_gating_reglist.h
@@ -0,0 +1,99 @@
+/*
+ * Copyright (c) 2015-2016, NVIDIA Corporation. All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+/*
+ * Include guard. The name is intentionally different from the
+ * __gp10b_gating_reglist_h__ macro used inside gp10b_gating_reglist.c so
+ * that this header is never skipped when that file includes it.
+ */
+#ifndef NVGPU_GP10B_GATING_REGLIST_H
+#define NVGPU_GP10B_GATING_REGLIST_H
+#include "gk20a/gk20a.h"
+/*
+ * Loaders for the gp10b gating register lists.
+ *
+ * Every loader takes the GPU instance @g and a @prod flag. The blcg and pg
+ * loaders in gp10b_gating_reglist.c write each list entry's prod value when
+ * @prod is true and its disable value otherwise; the slcg loaders presumably
+ * follow the same pattern (verify against their definitions).
+ */
+/* slcg register lists */
+void gp10b_slcg_bus_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_ce2_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_chiplet_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_ctxsw_firmware_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_fb_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_fifo_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gr_gp10b_slcg_gr_load_gating_prod(struct gk20a *g,
+        bool prod);
+void ltc_gp10b_slcg_ltc_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_perf_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_priring_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_pwr_csb_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_pmu_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_therm_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_slcg_xbar_load_gating_prod(struct gk20a *g,
+        bool prod);
+/* blcg register lists */
+void gp10b_blcg_bus_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_ce_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_ctxsw_firmware_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_fb_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_fifo_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_gr_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_ltc_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_pwr_csb_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_pmu_load_gating_prod(struct gk20a *g,
+        bool prod);
+void gp10b_blcg_xbar_load_gating_prod(struct gk20a *g,
+        bool prod);
+/* pg register list */
+void gr_gp10b_pg_gr_load_gating_prod(struct gk20a *g,
+        bool prod);
+#endif /* NVGPU_GP10B_GATING_REGLIST_H */
diff --git a/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.c b/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.c
new file mode 100644
index 00000000..cf51e8b4
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.c
@@ -0,0 +1,72 @@
+/*
+ * drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.c
+ *
+ * GP10B Graphics Context
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "gr_ctx_gp10b.h"
+/*
+ * Copy the netlist firmware image name selected by @index into @name.
+ *
+ * Only the slots whose image-name macros are defined at build time are
+ * recognised. @name must be large enough to hold the selected name plus its
+ * terminating NUL; no length is available here, so no bound is checked.
+ * @g is not used.
+ *
+ * Returns 0 when a name was written to @name, -1 when @index does not match
+ * any compiled-in slot (in which case @name is left untouched).
+ */
+int gr_gp10b_get_netlist_name(struct gk20a *g, int index, char *name)
+{
+        /*
+         * The image names are always passed as "%s" arguments, never as the
+         * format itself, so a '%' in a name cannot be parsed as a conversion.
+         */
+        switch (index) {
+#ifdef GP10B_NETLIST_IMAGE_FW_NAME
+        case NETLIST_FINAL:
+                sprintf(name, "%s", GP10B_NETLIST_IMAGE_FW_NAME);
+                return 0;
+#endif
+#ifdef GK20A_NETLIST_IMAGE_A
+        case NETLIST_SLOT_A:
+                sprintf(name, "%s", GK20A_NETLIST_IMAGE_A);
+                return 0;
+#endif
+#ifdef GK20A_NETLIST_IMAGE_B
+        case NETLIST_SLOT_B:
+                sprintf(name, "%s", GK20A_NETLIST_IMAGE_B);
+                return 0;
+#endif
+#ifdef GK20A_NETLIST_IMAGE_C
+        case NETLIST_SLOT_C:
+                sprintf(name, "%s", GK20A_NETLIST_IMAGE_C);
+                return 0;
+#endif
+#ifdef GK20A_NETLIST_IMAGE_D
+        case NETLIST_SLOT_D:
+                sprintf(name, "%s", GK20A_NETLIST_IMAGE_D);
+                return 0;
+#endif
+        default:
+                break;
+        }
+        /* Single failure exit for every unrecognised index. */
+        return -1;
+}
+/*
+ * Compile-time check for a production netlist image: returns true when
+ * GP10B_NETLIST_IMAGE_FW_NAME is defined for this build, false otherwise.
+ */
+bool gr_gp10b_is_firmware_defined(void)
+{
+#ifndef GP10B_NETLIST_IMAGE_FW_NAME
+        return false;
+#else
+        return true;
+#endif
+}
diff --git a/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.h b/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.h
new file mode 100644
index 00000000..b409b442
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gr_ctx_gp10b.h
@@ -0,0 +1,35 @@
+/*
+ * GP10B Graphics Context
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef __GR_CTX_GP10B_H__
+#define __GR_CTX_GP10B_H__
+#include "gk20a/gr_ctx_gk20a.h"
+/*
+ * Production netlist image for GP10B. While this macro is defined,
+ * gr_gp10b_is_firmware_defined() returns true and
+ * gr_gp10b_get_netlist_name() accepts NETLIST_FINAL.
+ */
+#define GP10B_NETLIST_IMAGE_FW_NAME GK20A_NETLIST_IMAGE_A
+/*
+ * Copy the netlist image name for slot @index into @name.
+ * Returns 0 on success, -1 when @index is not a compiled-in slot.
+ */
+int gr_gp10b_get_netlist_name(struct gk20a *g, int index, char *name);
+/* True when GP10B_NETLIST_IMAGE_FW_NAME is defined at build time. */
+bool gr_gp10b_is_firmware_defined(void);
+#endif /*__GR_CTX_GP10B_H__*/
diff --git a/drivers/gpu/nvgpu/gp10b/gr_gp10b.c b/drivers/gpu/nvgpu/gp10b/gr_gp10b.c
new file mode 100644
index 00000000..08988ac8
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gr_gp10b.c
@@ -0,0 +1,2357 @@
+/*
+ * GP10B GPU GR
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <dt-bindings/soc/gm20b-fuse.h>
+#include <dt-bindings/soc/gp10b-fuse.h>
+#include <uapi/linux/nvgpu.h>
+#include <nvgpu/timers.h>
+#include <nvgpu/kmem.h>
+#include <nvgpu/gmmu.h>
+#include <nvgpu/dma.h>
+#include <nvgpu/bug.h>
+#include <nvgpu/debug.h>
+#include <nvgpu/fuse.h>
+#include <nvgpu/enabled.h>
+#include "gk20a/gk20a.h"
+#include "gk20a/gr_gk20a.h"
+#include "gk20a/dbg_gpu_gk20a.h"
+#include "gk20a/regops_gk20a.h"
+#include "common/linux/os_linux.h"
+#include "gm20b/gr_gm20b.h"
+#include "gp10b/gr_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_gr_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fifo_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ctxsw_prog_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_mc_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fuse_gp10b.h>
+/*
+ * Report whether @class_num is one of the classes accepted here.
+ *
+ * The accepted set is PASCAL_COMPUTE_A, PASCAL_A, PASCAL_DMA_COPY_A,
+ * MAXWELL_COMPUTE_B, MAXWELL_B, FERMI_TWOD_A, KEPLER_DMA_COPY_A and
+ * MAXWELL_DMA_COPY_A. The class number and the verdict are also logged
+ * through gk20a_dbg_info().
+ */
+bool gr_gp10b_is_valid_class(struct gk20a *g, u32 class_num)
+{
+        bool valid;
+        switch (class_num) {
+        case PASCAL_COMPUTE_A:
+        case PASCAL_A:
+        case PASCAL_DMA_COPY_A:
+        case MAXWELL_COMPUTE_B:
+        case MAXWELL_B:
+        case FERMI_TWOD_A:
+        case KEPLER_DMA_COPY_A:
+        case MAXWELL_DMA_COPY_A:
+                valid = true;
+                break;
+        default:
+                valid = false;
+                break;
+        }
+        gk20a_dbg_info("class=0x%x valid=%d", class_num, valid);
+        return valid;
+}
+/* True when @class_num is PASCAL_A or MAXWELL_B. */
+bool gr_gp10b_is_valid_gfx_class(struct gk20a *g, u32 class_num)
+{
+        return (class_num == PASCAL_A) || (class_num == MAXWELL_B);
+}
+/* True when @class_num is PASCAL_COMPUTE_A or MAXWELL_COMPUTE_B. */
+bool gr_gp10b_is_valid_compute_class(struct gk20a *g, u32 class_num)
+{
+        return (class_num == PASCAL_COMPUTE_A) ||
+               (class_num == MAXWELL_COMPUTE_B);
+}
+/*
+ * Workaround that removes over-counted SM LRF ECC errors from a count.
+ *
+ * @single_err:      non-zero when @count_to_adjust is the single-bit count,
+ *                   zero when it is the double-bit count.
+ * @sed_status:      single-error-detected status bits, still at their
+ *                   position in the status register.
+ * @ded_status:      double-error-detected status bits, likewise.
+ * @count_to_adjust: count that is reduced in place; it is clamped at zero
+ *                   rather than allowed to wrap.
+ * @opposite_count:  count of the other error kind.
+ */
+static void gr_gp10b_sm_lrf_ecc_overcount_war(int single_err,
+                                                u32 sed_status,
+                                                u32 ded_status,
+                                                u32 *count_to_adjust,
+                                                u32 opposite_count)
+{
+        /* Shift both status fields down so each partition sits at bit 0..n. */
+        u32 sed_parts = sed_status >>
+                gr_pri_gpc0_tpc0_sm_lrf_ecc_status_single_err_detected_qrfdp0_b();
+        u32 ded_parts = ded_status >>
+                gr_pri_gpc0_tpc0_sm_lrf_ecc_status_double_err_detected_qrfdp0_b();
+        u32 both_parts = sed_parts & ded_parts;
+        u32 excess;
+        /* One excess count for every partition that reported only the error
+           kind being adjusted and not the other kind. */
+        if (single_err)
+                excess = hweight32(sed_parts & ~ded_parts);
+        else
+                excess = hweight32(ded_parts & ~sed_parts);
+        /* Partitions that reported both kinds add one excess count each, but
+           only when the opposite error count is zero. */
+        if ((both_parts != 0) && (opposite_count == 0))
+                excess += hweight32(both_parts);
+        *count_to_adjust = (*count_to_adjust > excess) ?
+                (*count_to_adjust - excess) : 0;
+}
+/*
+ * GP10B SM exception handler.
+ *
+ * Calls the common gr_gk20a_handle_sm_exception() first, then inspects the
+ * SM LRF and SM SHM ECC status registers of the SM at (@gpc, @tpc),
+ * accumulates the hardware error counts into g->ecc.gr.t18x and writes the
+ * status values that were read back to their registers.
+ *
+ * @sm, @post_event, @fault_ch and @hww_global_esr are only forwarded to
+ * gr_gk20a_handle_sm_exception().
+ *
+ * Returns the value returned by gr_gk20a_handle_sm_exception(); the ECC
+ * bookkeeping below never changes it.
+ *
+ * NOTE(review): the software counters are indexed by @tpc only, @gpc is not
+ * part of the index - confirm this is intended.
+ */
+int gr_gp10b_handle_sm_exception(struct gk20a *g,
+                        u32 gpc, u32 tpc, u32 sm,
+                        bool *post_event, struct channel_gk20a *fault_ch,
+                        u32 *hww_global_esr)
+{
+        int ret = 0;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 tpc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_TPC_IN_GPC_STRIDE);
+        /* Added to the gpc0/tpc0 register addresses to reach this GPC/TPC. */
+        u32 offset = gpc_stride * gpc + tpc_in_gpc_stride * tpc;
+        u32 lrf_ecc_status, lrf_ecc_sed_status, lrf_ecc_ded_status;
+        u32 lrf_single_count_delta, lrf_double_count_delta;
+        u32 shm_ecc_status;
+        ret = gr_gk20a_handle_sm_exception(g,
+                gpc, tpc, sm, post_event, fault_ch, hww_global_esr);
+        /* Check for LRF ECC errors. */
+        lrf_ecc_status = gk20a_readl(g,
+                        gr_pri_gpc0_tpc0_sm_lrf_ecc_status_r() + offset);
+        /* Keep only the single-error-detected bits of qrfdp0..qrfdp3. */
+        lrf_ecc_sed_status = lrf_ecc_status &
+                                (gr_pri_gpc0_tpc0_sm_lrf_ecc_status_single_err_detected_qrfdp0_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_single_err_detected_qrfdp1_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_single_err_detected_qrfdp2_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_single_err_detected_qrfdp3_pending_f());
+        /* Keep only the double-error-detected bits of qrfdp0..qrfdp3. */
+        lrf_ecc_ded_status = lrf_ecc_status &
+                                (gr_pri_gpc0_tpc0_sm_lrf_ecc_status_double_err_detected_qrfdp0_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_double_err_detected_qrfdp1_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_double_err_detected_qrfdp2_pending_f() |
+                                 gr_pri_gpc0_tpc0_sm_lrf_ecc_status_double_err_detected_qrfdp3_pending_f());
+        /* Snapshot both hardware error counters ... */
+        lrf_single_count_delta =
+                gk20a_readl(g,
+                        gr_pri_gpc0_tpc0_sm_lrf_ecc_single_err_count_r() +
+                        offset);
+        lrf_double_count_delta =
+                gk20a_readl(g,
+                        gr_pri_gpc0_tpc0_sm_lrf_ecc_double_err_count_r() +
+                        offset);
+        /* ... and zero them, whether or not an error bit is pending. */
+        gk20a_writel(g,
+                gr_pri_gpc0_tpc0_sm_lrf_ecc_single_err_count_r() + offset,
+                0);
+        gk20a_writel(g,
+                gr_pri_gpc0_tpc0_sm_lrf_ecc_double_err_count_r() + offset,
+                0);
+        if (lrf_ecc_sed_status) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Single bit error detected in SM LRF!");
+                /* Trim the snapshot with the overcount workaround before
+                   adding it to the software counter. */
+                gr_gp10b_sm_lrf_ecc_overcount_war(1,
+                                                lrf_ecc_sed_status,
+                                                lrf_ecc_ded_status,
+                                                &lrf_single_count_delta,
+                                                lrf_double_count_delta);
+                g->ecc.gr.t18x.sm_lrf_single_err_count.counters[tpc] +=
+                                                        lrf_single_count_delta;
+        }
+        if (lrf_ecc_ded_status) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Double bit error detected in SM LRF!");
+                /* The opposite count passed here is the single-bit delta as
+                   left by the branch above, i.e. already adjusted if a
+                   single-bit error was pending too. */
+                gr_gp10b_sm_lrf_ecc_overcount_war(0,
+                                                lrf_ecc_sed_status,
+                                                lrf_ecc_ded_status,
+                                                &lrf_double_count_delta,
+                                                lrf_single_count_delta);
+                g->ecc.gr.t18x.sm_lrf_double_err_count.counters[tpc] +=
+                                                        lrf_double_count_delta;
+        }
+        /* Write the value just read back to the status register (presumably
+           this clears the pending bits - confirm against the register
+           manual). */
+        gk20a_writel(g, gr_pri_gpc0_tpc0_sm_lrf_ecc_status_r() + offset,
+                        lrf_ecc_status);
+        /* Check for SHM ECC errors. */
+        shm_ecc_status = gk20a_readl(g,
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_status_r() + offset);
+        /* Any single-bit condition (corrected or detected) on shm0 or shm1. */
+        if ((shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_single_err_corrected_shm0_pending_f()) ||
+                (shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_single_err_corrected_shm1_pending_f()) ||
+                (shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_single_err_detected_shm0_pending_f()) ||
+                (shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_single_err_detected_shm1_pending_f()) ) {
+                u32 ecc_stats_reg_val;
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Single bit error detected in SM SHM!");
+                ecc_stats_reg_val =
+                        gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_r() + offset);
+                /* Accumulate the single-corrected and single-detected fields
+                   of the count register into the software counters. */
+                g->ecc.gr.t18x.sm_shm_sec_count.counters[tpc] +=
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_single_corrected_v(ecc_stats_reg_val);
+                g->ecc.gr.t18x.sm_shm_sed_count.counters[tpc] +=
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_single_detected_v(ecc_stats_reg_val);
+                /* Zero just those two fields and write the rest back as read. */
+                ecc_stats_reg_val &= ~(gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_single_corrected_m() |
+                                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_single_detected_m());
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_r() + offset,
+                        ecc_stats_reg_val);
+        }
+        /* Double-bit error detected on shm0 or shm1. */
+        if ( (shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_double_err_detected_shm0_pending_f()) ||
+                (shm_ecc_status &
+                gr_pri_gpc0_tpc0_sm_shm_ecc_status_double_err_detected_shm1_pending_f()) ) {
+                u32 ecc_stats_reg_val;
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Double bit error detected in SM SHM!");
+                /* The count register is re-read here, so it reflects any
+                   write-back done by the single-bit branch above. */
+                ecc_stats_reg_val =
+                        gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_r() + offset);
+                g->ecc.gr.t18x.sm_shm_ded_count.counters[tpc] +=
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_double_detected_v(ecc_stats_reg_val);
+                /* Zero only the double-detected field before writing back. */
+                ecc_stats_reg_val &= ~(gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_double_detected_m());
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_sm_shm_ecc_err_count_r() + offset,
+                        ecc_stats_reg_val);
+        }
+        /* Write the SHM status value that was read back to its register
+           (presumably write-to-clear - confirm). */
+        gk20a_writel(g, gr_pri_gpc0_tpc0_sm_shm_ecc_status_r() + offset,
+                        shm_ecc_status);
+        return ret;
+}
+/*
+ * GP10B TEX exception handler.
+ *
+ * Reads the TEX HWW ESR of the TPC at (@gpc, @tpc). For a pending ECC SEC
+ * and/or ECC DED condition it reads the "total" and "unique" ECC count
+ * registers once with the routing register set to pipe 0 and once with it
+ * set to pipe 1, adds the matching count field to the per-pipe software
+ * counters in g->ecc.gr.t18x, writes the register back with that field
+ * zeroed, and finally restores the routing register to its default
+ * selection. The ESR is then written back with the reset_active field set.
+ *
+ * @post_event is not referenced by this function.
+ *
+ * Always returns 0 (ret is never modified after initialisation).
+ *
+ * NOTE(review): the software counters are indexed by @tpc only, @gpc is not
+ * part of the index - confirm this is intended.
+ */
+int gr_gp10b_handle_tex_exception(struct gk20a *g, u32 gpc, u32 tpc,
+                bool *post_event)
+{
+        int ret = 0;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 tpc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_TPC_IN_GPC_STRIDE);
+        /* Added to the gpc0/tpc0 register addresses to reach this GPC/TPC. */
+        u32 offset = gpc_stride * gpc + tpc_in_gpc_stride * tpc;
+        u32 esr;
+        u32 ecc_stats_reg_val;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg, "");
+        esr = gk20a_readl(g,
+                         gr_gpc0_tpc0_tex_m_hww_esr_r() + offset);
+        gk20a_dbg(gpu_dbg_intr | gpu_dbg_gpu_dbg, "0x%08x", esr);
+        if (esr & gr_gpc0_tpc0_tex_m_hww_esr_ecc_sec_pending_f()) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Single bit error detected in TEX!");
+                /* Pipe 0 counters */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_pipe0_f());
+                /* Total count: accumulate the SEC field, then write the
+                   register back with only that field zeroed. */
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset);
+                g->ecc.gr.t18x.tex_total_sec_pipe0_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_sec_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_sec_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset,
+                        ecc_stats_reg_val);
+                /* Unique count: same read / accumulate / zero-field sequence. */
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset);
+                g->ecc.gr.t18x.tex_unique_sec_pipe0_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_sec_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_sec_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset,
+                        ecc_stats_reg_val);
+                /* Pipe 1 counters */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_pipe1_f());
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset);
+                g->ecc.gr.t18x.tex_total_sec_pipe1_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_sec_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_sec_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset,
+                        ecc_stats_reg_val);
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset);
+                g->ecc.gr.t18x.tex_unique_sec_pipe1_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_sec_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_sec_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset,
+                        ecc_stats_reg_val);
+                /* Put the routing register back to its default selection. */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_default_f());
+        }
+        if (esr & gr_gpc0_tpc0_tex_m_hww_esr_ecc_ded_pending_f()) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_intr,
+                        "Double bit error detected in TEX!");
+                /* Pipe 0 counters */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_pipe0_f());
+                /* Same sequence as the SEC branch, using the DED fields. */
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset);
+                g->ecc.gr.t18x.tex_total_ded_pipe0_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_ded_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_ded_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset,
+                        ecc_stats_reg_val);
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset);
+                g->ecc.gr.t18x.tex_unique_ded_pipe0_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_ded_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_ded_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset,
+                        ecc_stats_reg_val);
+                /* Pipe 1 counters */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_pipe1_f());
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset);
+                g->ecc.gr.t18x.tex_total_ded_pipe1_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_ded_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_ded_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_total_r() + offset,
+                        ecc_stats_reg_val);
+                ecc_stats_reg_val = gk20a_readl(g,
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset);
+                g->ecc.gr.t18x.tex_unique_ded_pipe1_count.counters[tpc] +=
+                                gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_ded_v(ecc_stats_reg_val);
+                ecc_stats_reg_val &= ~gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_ded_m();
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_ecc_cnt_unique_r() + offset,
+                        ecc_stats_reg_val);
+                /* Put the routing register back to its default selection. */
+                gk20a_writel(g,
+                        gr_pri_gpc0_tpc0_tex_m_routing_r() + offset,
+                        gr_pri_gpc0_tpc0_tex_m_routing_sel_default_f());
+        }
+        /* Write the ESR back with the reset_active field OR'ed in; this is
+           done whether or not an ECC condition was pending. */
+        gk20a_writel(g,
+                     gr_gpc0_tpc0_tex_m_hww_esr_r() + offset,
+                     esr | gr_gpc0_tpc0_tex_m_hww_esr_reset_active_f());
+        return ret;
+}
+int gr_gp10b_commit_global_cb_manager(struct gk20a *g,
+                        struct channel_gk20a *c, bool patch)
+{
+        struct gr_gk20a *gr = &g->gr;
+        struct channel_ctx_gk20a *ch_ctx = &c->ch_ctx;
+        struct gr_ctx_desc *gr_ctx = ch_ctx->gr_ctx;
+        u32 attrib_offset_in_chunk = 0;
+        u32 alpha_offset_in_chunk = 0;
+        u32 pd_ab_max_output;
+        u32 gpc_index, ppc_index;
+        u32 temp, temp2;
+        u32 cbm_cfg_size_beta, cbm_cfg_size_alpha, cbm_cfg_size_steadystate;
+        u32 attrib_size_in_chunk, cb_attrib_cache_size_init;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 ppc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_PPC_IN_GPC_STRIDE);
+        u32 num_pes_per_gpc = nvgpu_get_litter_value(g, GPU_LIT_NUM_PES_PER_GPC);
+        gk20a_dbg_fn("");
+        if (gr_ctx->graphics_preempt_mode == NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP) {
+                attrib_size_in_chunk = gr->attrib_cb_default_size +
+                                  (gr_gpc0_ppc0_cbm_beta_cb_size_v_gfxp_v() -
+                                   gr_gpc0_ppc0_cbm_beta_cb_size_v_default_v());
+                cb_attrib_cache_size_init = gr->attrib_cb_default_size +
+                                  (gr_gpc0_ppc0_cbm_beta_cb_size_v_gfxp_v() -
+                                   gr_gpc0_ppc0_cbm_beta_cb_size_v_default_v());
+        } else {
+                attrib_size_in_chunk = gr->attrib_cb_size;
+                cb_attrib_cache_size_init = gr->attrib_cb_default_size;
+        }
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_ds_tga_constraintlogic_beta_r(),
+                gr->attrib_cb_default_size, patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_ds_tga_constraintlogic_alpha_r(),
+                gr->alpha_cb_default_size, patch);
+        pd_ab_max_output = (gr->alpha_cb_default_size *
+                gr_gpc0_ppc0_cbm_beta_cb_size_v_granularity_v()) /
+                gr_pd_ab_dist_cfg1_max_output_granularity_v();
+        if (g->gr.pd_max_batches) {
+                gr_gk20a_ctx_patch_write(g, ch_ctx, gr_pd_ab_dist_cfg1_r(),
+                        gr_pd_ab_dist_cfg1_max_output_f(pd_ab_max_output) |
+                        gr_pd_ab_dist_cfg1_max_batches_f(g->gr.pd_max_batches), patch);
+        } else {
+                gr_gk20a_ctx_patch_write(g, ch_ctx, gr_pd_ab_dist_cfg1_r(),
+                        gr_pd_ab_dist_cfg1_max_output_f(pd_ab_max_output) |
+                        gr_pd_ab_dist_cfg1_max_batches_init_f(), patch);
+        }
+        attrib_offset_in_chunk = alpha_offset_in_chunk +
+                gr->tpc_count * gr->alpha_cb_size;
+        for (gpc_index = 0; gpc_index < gr->gpc_count; gpc_index++) {
+                temp = gpc_stride * gpc_index;
+                temp2 = num_pes_per_gpc * gpc_index;
+                for (ppc_index = 0; ppc_index < gr->gpc_ppc_count[gpc_index];
+                     ppc_index++) {
+                        cbm_cfg_size_beta = cb_attrib_cache_size_init *
+                                gr->pes_tpc_count[ppc_index][gpc_index];
+                        cbm_cfg_size_alpha = gr->alpha_cb_default_size *
+                                gr->pes_tpc_count[ppc_index][gpc_index];
+                        cbm_cfg_size_steadystate = gr->attrib_cb_default_size *
+                                gr->pes_tpc_count[ppc_index][gpc_index];
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_ppc0_cbm_beta_cb_size_r() + temp +
+                                ppc_in_gpc_stride * ppc_index,
+                                cbm_cfg_size_beta, patch);
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_ppc0_cbm_beta_cb_offset_r() + temp +
+                                ppc_in_gpc_stride * ppc_index,
+                                attrib_offset_in_chunk, patch);
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_ppc0_cbm_beta_steady_state_cb_size_r() + temp +
+                                ppc_in_gpc_stride * ppc_index,
+                                cbm_cfg_size_steadystate,
+                                patch);
+                        attrib_offset_in_chunk += attrib_size_in_chunk *
+                                gr->pes_tpc_count[ppc_index][gpc_index];
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_ppc0_cbm_alpha_cb_size_r() + temp +
+                                ppc_in_gpc_stride * ppc_index,
+                                cbm_cfg_size_alpha, patch);
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_ppc0_cbm_alpha_cb_offset_r() + temp +
+                                ppc_in_gpc_stride * ppc_index,
+                                alpha_offset_in_chunk, patch);
+                        alpha_offset_in_chunk += gr->alpha_cb_size *
+                                gr->pes_tpc_count[ppc_index][gpc_index];
+                        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpcs_swdx_tc_beta_cb_size_r(ppc_index + temp2),
+                                gr_gpcs_swdx_tc_beta_cb_size_v_f(cbm_cfg_size_steadystate),
+                                patch);
+                }
+        }
+        return 0;
+}
+/*
+ * Program the page pool base address and page count into both the SCC and
+ * the GPCS GCC register pairs via gr_gk20a_ctx_patch_write().
+ *
+ * @addr is handed to the *_base_addr_39_8_f() field helpers and @size to the
+ * *_total_pages_f() helpers; @patch is forwarded unchanged to every write.
+ * The SCC size word additionally carries the "valid" flag.
+ */
+void gr_gp10b_commit_global_pagepool(struct gk20a *g,
+                                            struct channel_ctx_gk20a *ch_ctx,
+                                            u64 addr, u32 size, bool patch)
+{
+        u32 scc_base_val = gr_scc_pagepool_base_addr_39_8_f(addr);
+        u32 scc_pool_val = gr_scc_pagepool_total_pages_f(size) |
+                           gr_scc_pagepool_valid_true_f();
+        u32 gcc_base_val = gr_gpcs_gcc_pagepool_base_addr_39_8_f(addr);
+        u32 gcc_pool_val = gr_gpcs_gcc_pagepool_total_pages_f(size);
+        /* SCC copy: base first, then the size word */
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_scc_pagepool_base_r(),
+                                 scc_base_val, patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_scc_pagepool_r(),
+                                 scc_pool_val, patch);
+        /* GPCS GCC copy, same order */
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_gpcs_gcc_pagepool_base_r(),
+                                 gcc_base_val, patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx, gr_gpcs_gcc_pagepool_r(),
+                                 gcc_pool_val, patch);
+}
+/*
+ * Install the ZBC colour entry @color_val at table slot @index.
+ *
+ * The entry is pushed to the L2 table through the LTC HAL, loaded into the
+ * DS table, mirrored into gr->zbc_col_tbl[] (whose ref_cnt is bumped), and
+ * finally written to the GPCS SWDX DSS colour registers together with its
+ * 7-bit format field.
+ *
+ * Always returns 0.
+ */
+int gr_gp10b_add_zbc_color(struct gk20a *g, struct gr_gk20a *gr,
+                                  struct zbc_entry *color_val, u32 index)
+{
+        u32 comp;
+        u32 fmt_reg;
+        u32 fmt_shift;
+        u32 fmt_word;
+        /* L2 table first */
+        g->ops.ltc.set_zbc_color_entry(g, color_val, index);
+        /* stage the four components, the format and the slot in DS */
+        gk20a_writel(g, gr_ds_zbc_color_r_r(),
+                     gr_ds_zbc_color_r_val_f(color_val->color_ds[0]));
+        gk20a_writel(g, gr_ds_zbc_color_g_r(),
+                     gr_ds_zbc_color_g_val_f(color_val->color_ds[1]));
+        gk20a_writel(g, gr_ds_zbc_color_b_r(),
+                     gr_ds_zbc_color_b_val_f(color_val->color_ds[2]));
+        gk20a_writel(g, gr_ds_zbc_color_a_r(),
+                     gr_ds_zbc_color_a_val_f(color_val->color_ds[3]));
+        gk20a_writel(g, gr_ds_zbc_color_fmt_r(),
+                     gr_ds_zbc_color_fmt_val_f(color_val->format));
+        gk20a_writel(g, gr_ds_zbc_tbl_index_r(),
+                     gr_ds_zbc_tbl_index_val_f(index + GK20A_STARTOF_ZBC_TABLE));
+        /* kick off the DS colour-table write */
+        gk20a_writel(g, gr_ds_zbc_tbl_ld_r(),
+                     gr_ds_zbc_tbl_ld_select_c_f() |
+                     gr_ds_zbc_tbl_ld_action_write_f() |
+                     gr_ds_zbc_tbl_ld_trigger_active_f());
+        /* keep the software shadow of the table in sync */
+        comp = 0;
+        while (comp < GK20A_ZBC_COLOR_VALUE_SIZE) {
+                gr->zbc_col_tbl[index].color_l2[comp] = color_val->color_l2[comp];
+                gr->zbc_col_tbl[index].color_ds[comp] = color_val->color_ds[comp];
+                comp++;
+        }
+        gr->zbc_col_tbl[index].format = color_val->format;
+        gr->zbc_col_tbl[index].ref_cnt++;
+        /* SWDX DSS per-slot colour registers */
+        gk20a_writel_check(g, gr_gpcs_swdx_dss_zbc_color_r_r(index),
+                           color_val->color_ds[0]);
+        gk20a_writel_check(g, gr_gpcs_swdx_dss_zbc_color_g_r(index),
+                           color_val->color_ds[1]);
+        gk20a_writel_check(g, gr_gpcs_swdx_dss_zbc_color_b_r(index),
+                           color_val->color_ds[2]);
+        gk20a_writel_check(g, gr_gpcs_swdx_dss_zbc_color_a_r(index),
+                           color_val->color_ds[3]);
+        /*
+         * Four 7-bit format fields share one format word: pick the word
+         * from the slot rounded down to a multiple of four, and the field
+         * from the slot modulo four.
+         */
+        fmt_reg = gr_gpcs_swdx_dss_zbc_c_01_to_04_format_r() + (index & ~3);
+        fmt_shift = (index % 4) * 7;
+        fmt_word = gk20a_readl(g, fmt_reg);
+        fmt_word &= ~(0x7f << fmt_shift);
+        fmt_word |= color_val->format << fmt_shift;
+        gk20a_writel_check(g, fmt_reg, fmt_word);
+        return 0;
+}
+/*
+ * Install the ZBC depth entry @depth_val at table slot @index.
+ *
+ * The entry is pushed to the L2 table through the LTC HAL, loaded into the
+ * DS table, mirrored into gr->zbc_dep_tbl[] (whose ref_cnt is bumped), and
+ * finally written to the GPCS SWDX DSS depth register together with its
+ * 7-bit format field.
+ *
+ * Always returns 0.
+ */
+int gr_gp10b_add_zbc_depth(struct gk20a *g, struct gr_gk20a *gr,
+                                struct zbc_entry *depth_val, u32 index)
+{
+        u32 fmt_reg;
+        u32 fmt_shift;
+        u32 fmt_word;
+        /* L2 table first */
+        g->ops.ltc.set_zbc_depth_entry(g, depth_val, index);
+        /* stage the depth value, its format and the slot in DS */
+        gk20a_writel(g, gr_ds_zbc_z_r(),
+                     gr_ds_zbc_z_val_f(depth_val->depth));
+        gk20a_writel(g, gr_ds_zbc_z_fmt_r(),
+                     gr_ds_zbc_z_fmt_val_f(depth_val->format));
+        gk20a_writel(g, gr_ds_zbc_tbl_index_r(),
+                     gr_ds_zbc_tbl_index_val_f(index + GK20A_STARTOF_ZBC_TABLE));
+        /* kick off the DS depth-table write */
+        gk20a_writel(g, gr_ds_zbc_tbl_ld_r(),
+                     gr_ds_zbc_tbl_ld_select_z_f() |
+                     gr_ds_zbc_tbl_ld_action_write_f() |
+                     gr_ds_zbc_tbl_ld_trigger_active_f());
+        /* keep the software shadow of the table in sync */
+        gr->zbc_dep_tbl[index].depth = depth_val->depth;
+        gr->zbc_dep_tbl[index].format = depth_val->format;
+        gr->zbc_dep_tbl[index].ref_cnt++;
+        /* SWDX DSS per-slot depth register */
+        gk20a_writel(g, gr_gpcs_swdx_dss_zbc_z_r(index), depth_val->depth);
+        /*
+         * Four 7-bit format fields share one format word: pick the word
+         * from the slot rounded down to a multiple of four, and the field
+         * from the slot modulo four.
+         */
+        fmt_reg = gr_gpcs_swdx_dss_zbc_z_01_to_04_format_r() + (index & ~3);
+        fmt_shift = (index % 4) * 7;
+        fmt_word = gk20a_readl(g, fmt_reg);
+        fmt_word &= ~(0x7f << fmt_shift);
+        fmt_word |= depth_val->format << fmt_shift;
+        gk20a_writel(g, fmt_reg, fmt_word);
+        return 0;
+}
+/*
+ * Default page pool size: whatever gr_scc_pagepool_total_pages_hwmax_value_v()
+ * reports. @g is not consulted.
+ */
+u32 gr_gp10b_pagepool_default_size(struct gk20a *g)
+{
+        u32 hwmax_pages = gr_scc_pagepool_total_pages_hwmax_value_v();
+        return hwmax_pages;
+}
+/*
+ * Reset the attrib (beta) and alpha circular buffer sizes to their defaults,
+ * clamp each to the largest per-TPC value its size field can hold, and
+ * return the combined buffer size for max_tpc_count TPCs, rounded up to a
+ * multiple of 128.
+ *
+ * Side effect: updates gr->attrib_cb_size and gr->alpha_cb_size.
+ */
+int gr_gp10b_calc_global_ctx_buffer_size(struct gk20a *g)
+{
+        struct gr_gk20a *gr = &g->gr;
+        u32 beta_limit = gr_gpc0_ppc0_cbm_beta_cb_size_v_f(~0) / gr->tpc_count;
+        u32 alpha_limit = gr_gpc0_ppc0_cbm_alpha_cb_size_v_f(~0) / gr->tpc_count;
+        int size;
+        /* start from the defaults, then cap at the field limit */
+        gr->attrib_cb_size = gr->attrib_cb_default_size;
+        if (gr->attrib_cb_size > beta_limit)
+                gr->attrib_cb_size = beta_limit;
+        gr->alpha_cb_size = gr->alpha_cb_default_size;
+        if (gr->alpha_cb_size > alpha_limit)
+                gr->alpha_cb_size = alpha_limit;
+        /* beta part, then alpha part, each scaled by its granularity */
+        size = gr->attrib_cb_size *
+               gr_gpc0_ppc0_cbm_beta_cb_size_v_granularity_v() *
+               gr->max_tpc_count;
+        size += gr->alpha_cb_size *
+                gr_gpc0_ppc0_cbm_alpha_cb_size_v_granularity_v() *
+                gr->max_tpc_count;
+        return ALIGN(size, 128);
+}
+/* Write @data unmodified to the FE go-idle timeout register. */
+static void gr_gp10b_set_go_idle_timeout(struct gk20a *g, u32 data)
+{
+        u32 timeout_reg = gr_fe_go_idle_timeout_r();
+        gk20a_writel(g, timeout_reg, data);
+}
+/*
+ * Read-modify-write of the GPCS TC debug0 register: only the
+ * limit_coalesce_buffer_size field is replaced, with @data.
+ */
+static void gr_gp10b_set_coalesce_buffer_size(struct gk20a *g, u32 data)
+{
+        u32 debug0;
+        u32 field_mask = gr_gpcs_tc_debug0_limit_coalesce_buffer_size_m();
+        u32 field_val = gr_gpcs_tc_debug0_limit_coalesce_buffer_size_f(data);
+        gk20a_dbg_fn("");
+        debug0 = gk20a_readl(g, gr_gpcs_tc_debug0_r());
+        debug0 = set_field(debug0, field_mask, field_val);
+        gk20a_writel(g, gr_gpcs_tc_debug0_r(), debug0);
+        gk20a_dbg_fn("done");
+}
+/*
+ * Update the blendopt read-suppress and fill-override fields of the BES CROP
+ * debug3 register. Bit 0 of @data selects "enabled" (set) or "disabled"
+ * (clear) for both fields; the other bits of @data are ignored.
+ */
+void gr_gp10b_set_bes_crop_debug3(struct gk20a *g, u32 data)
+{
+        u32 debug3;
+        u32 read_suppress;
+        u32 fill_ovr;
+        gk20a_dbg_fn("");
+        debug3 = gk20a_readl(g, gr_bes_crop_debug3_r());
+        /* pick the field encodings once, then apply them below */
+        if ((data & 1) != 0) {
+                read_suppress =
+                        gr_bes_crop_debug3_blendopt_read_suppress_enabled_f();
+                fill_ovr =
+                        gr_bes_crop_debug3_blendopt_fill_override_enabled_f();
+        } else {
+                read_suppress =
+                        gr_bes_crop_debug3_blendopt_read_suppress_disabled_f();
+                fill_ovr =
+                        gr_bes_crop_debug3_blendopt_fill_override_disabled_f();
+        }
+        debug3 = set_field(debug3,
+                           gr_bes_crop_debug3_blendopt_read_suppress_m(),
+                           read_suppress);
+        debug3 = set_field(debug3,
+                           gr_bes_crop_debug3_blendopt_fill_override_m(),
+                           fill_ovr);
+        gk20a_writel(g, gr_bes_crop_debug3_r(), debug3);
+}
+/*
+ * Dispatch a software method for the PASCAL_COMPUTE_A and PASCAL_A classes.
+ *
+ * The method id compared against the NVC0C0_ / NVC097_ constants is
+ * @offset << 2. @addr is not used here.
+ *
+ * Returns 0 when the method was handled, and also when @class_num is neither
+ * of the two classes; returns -EINVAL for an unrecognised method of a
+ * recognised class.
+ */
+int gr_gp10b_handle_sw_method(struct gk20a *g, u32 addr,
+                                     u32 class_num, u32 offset, u32 data)
+{
+        u32 method = offset << 2;
+        gk20a_dbg_fn("");
+        if (class_num == PASCAL_COMPUTE_A) {
+                switch (method) {
+                case NVC0C0_SET_SHADER_EXCEPTIONS:
+                        gk20a_gr_set_shader_exceptions(g, data);
+                        break;
+                case NVC0C0_SET_RD_COALESCE:
+                        gr_gm20b_set_rd_coalesce(g, data);
+                        break;
+                default:
+                        return -EINVAL;
+                }
+        }
+        if (class_num == PASCAL_A) {
+                switch (method) {
+                case NVC097_SET_SHADER_EXCEPTIONS:
+                        gk20a_gr_set_shader_exceptions(g, data);
+                        break;
+                case NVC097_SET_CIRCULAR_BUFFER_SIZE:
+                        g->ops.gr.set_circular_buffer_size(g, data);
+                        break;
+                case NVC097_SET_ALPHA_CIRCULAR_BUFFER_SIZE:
+                        g->ops.gr.set_alpha_circular_buffer_size(g, data);
+                        break;
+                case NVC097_SET_GO_IDLE_TIMEOUT:
+                        gr_gp10b_set_go_idle_timeout(g, data);
+                        break;
+                case NVC097_SET_COALESCE_BUFFER_SIZE:
+                        gr_gp10b_set_coalesce_buffer_size(g, data);
+                        break;
+                case NVC097_SET_RD_COALESCE:
+                        gr_gm20b_set_rd_coalesce(g, data);
+                        break;
+                case NVC097_SET_BES_CROP_DEBUG3:
+                        g->ops.gr.set_bes_crop_debug3(g, data);
+                        break;
+                default:
+                        return -EINVAL;
+                }
+        }
+        return 0;
+}
+/*
+ * Fill in the default circular buffer sizes: the attrib default becomes
+ * 0x800 only if it is still zero, while the alpha default is always
+ * overwritten with the hardware header's default value.
+ */
+void gr_gp10b_cb_size_default(struct gk20a *g)
+{
+        if (g->gr.attrib_cb_default_size == 0) {
+                g->gr.attrib_cb_default_size = 0x800;
+        }
+        g->gr.alpha_cb_default_size =
+                gr_gpc0_ppc0_cbm_alpha_cb_size_v_default_v();
+}
+/*
+ * Apply a new alpha circular buffer size.
+ *
+ * The requested size is @data * 4, capped at gr->alpha_cb_size. It is written
+ * to the DS TGA constraint-logic alpha register, used to derive the PD
+ * max_output value, and programmed (scaled by the TPC count of each PES)
+ * into the alpha_cb_size register of every PPC in every GPC.
+ */
+void gr_gp10b_set_alpha_circular_buffer_size(struct gk20a *g, u32 data)
+{
+        struct gr_gk20a *gr = &g->gr;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 ppc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_PPC_IN_GPC_STRIDE);
+        u32 cb_size = data * 4;
+        u32 tga_alpha;
+        u32 max_output;
+        u32 batches;
+        u32 gpc, ppc;
+        u32 size_reg, size_val;
+        gk20a_dbg_fn("");
+        /* never exceed the size the global buffer was dimensioned for */
+        if (cb_size > gr->alpha_cb_size)
+                cb_size = gr->alpha_cb_size;
+        /* replace only the cbsize field of the constraint-logic register */
+        tga_alpha = gk20a_readl(g, gr_ds_tga_constraintlogic_alpha_r());
+        tga_alpha &= ~gr_ds_tga_constraintlogic_alpha_cbsize_f(~0);
+        tga_alpha |= gr_ds_tga_constraintlogic_alpha_cbsize_f(cb_size);
+        gk20a_writel(g, gr_ds_tga_constraintlogic_alpha_r(), tga_alpha);
+        max_output = cb_size *
+                gr_gpc0_ppc0_cbm_alpha_cb_size_v_granularity_v() /
+                gr_pd_ab_dist_cfg1_max_output_granularity_v();
+        /* a zero pd_max_batches means "use the init value" */
+        if (gr->pd_max_batches)
+                batches = gr_pd_ab_dist_cfg1_max_batches_f(gr->pd_max_batches);
+        else
+                batches = gr_pd_ab_dist_cfg1_max_batches_init_f();
+        gk20a_writel(g, gr_pd_ab_dist_cfg1_r(),
+                     gr_pd_ab_dist_cfg1_max_output_f(max_output) | batches);
+        for (gpc = 0; gpc < gr->gpc_count; gpc++) {
+                for (ppc = 0; ppc < gr->gpc_ppc_count[gpc]; ppc++) {
+                        size_reg = gr_gpc0_ppc0_cbm_alpha_cb_size_r() +
+                                   gpc_stride * gpc +
+                                   ppc_in_gpc_stride * ppc;
+                        size_val = gk20a_readl(g, size_reg);
+                        size_val = set_field(size_val,
+                                gr_gpc0_ppc0_cbm_alpha_cb_size_v_m(),
+                                gr_gpc0_ppc0_cbm_alpha_cb_size_v_f(cb_size *
+                                        gr->pes_tpc_count[ppc][gpc]));
+                        gk20a_writel(g, size_reg, size_val);
+                }
+        }
+}
+/*
+ * Apply a new attrib (beta) circular buffer size.
+ *
+ * The steady-state size is @data * 4, capped at gr->attrib_cb_size. If the
+ * GPC0/PPC0 beta size register currently differs from its steady-state
+ * register, the programmed beta size is enlarged by the difference between
+ * the gfxp and default header values; otherwise it equals the steady-state
+ * size.
+ *
+ * For every PPC of every GPC this updates the beta size, the steady-state
+ * size and the matching SWDX tc_beta_cb_size entry.
+ */
+void gr_gp10b_set_circular_buffer_size(struct gk20a *g, u32 data)
+{
+        struct gr_gk20a *gr = &g->gr;
+        u32 gpc_index, ppc_index, stride, val;
+        u32 swdx_index;
+        u32 cb_size_steady = data * 4, cb_size;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 ppc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_PPC_IN_GPC_STRIDE);
+        u32 num_pes_per_gpc = nvgpu_get_litter_value(g, GPU_LIT_NUM_PES_PER_GPC);
+        gk20a_dbg_fn("");
+        if (cb_size_steady > gr->attrib_cb_size)
+                cb_size_steady = gr->attrib_cb_size;
+        /* beta size != steady-state size: keep the extra gfxp headroom */
+        if (gk20a_readl(g, gr_gpc0_ppc0_cbm_beta_cb_size_r()) !=
+                gk20a_readl(g,
+                        gr_gpc0_ppc0_cbm_beta_steady_state_cb_size_r())) {
+                cb_size = cb_size_steady +
+                        (gr_gpc0_ppc0_cbm_beta_cb_size_v_gfxp_v() -
+                         gr_gpc0_ppc0_cbm_beta_cb_size_v_default_v());
+        } else {
+                cb_size = cb_size_steady;
+        }
+        /* replace only the cbsize field of the constraint-logic register */
+        gk20a_writel(g, gr_ds_tga_constraintlogic_beta_r(),
+                (gk20a_readl(g, gr_ds_tga_constraintlogic_beta_r()) &
+                 ~gr_ds_tga_constraintlogic_beta_cbsize_f(~0)) |
+                 gr_ds_tga_constraintlogic_beta_cbsize_f(cb_size_steady));
+        for (gpc_index = 0; gpc_index < gr->gpc_count; gpc_index++) {
+                stride = gpc_stride * gpc_index;
+                for (ppc_index = 0; ppc_index < gr->gpc_ppc_count[gpc_index];
+                        ppc_index++) {
+                        val = gk20a_readl(g, gr_gpc0_ppc0_cbm_beta_cb_size_r() +
+                                stride +
+                                ppc_in_gpc_stride * ppc_index);
+                        val = set_field(val,
+                                gr_gpc0_ppc0_cbm_beta_cb_size_v_m(),
+                                gr_gpc0_ppc0_cbm_beta_cb_size_v_f(cb_size *
+                                        gr->pes_tpc_count[ppc_index][gpc_index]));
+                        gk20a_writel(g, gr_gpc0_ppc0_cbm_beta_cb_size_r() +
+                                stride +
+                                ppc_in_gpc_stride * ppc_index, val);
+                        gk20a_writel(g, ppc_in_gpc_stride * ppc_index +
+                                gr_gpc0_ppc0_cbm_beta_steady_state_cb_size_r() +
+                                stride,
+                                gr_gpc0_ppc0_cbm_beta_steady_state_cb_size_v_f(
+                                        cb_size_steady));
+                        /*
+                         * The SWDX array is flat across GPCs, so each GPC
+                         * needs its own run of num_pes_per_gpc entries.
+                         * Indexing with "ppc_index + gpc_index" made
+                         * GPC0/PPC1 and GPC1/PPC0 share an entry. For a
+                         * single GPC the index is unchanged.
+                         */
+                        swdx_index = ppc_index + num_pes_per_gpc * gpc_index;
+                        val = gk20a_readl(g,
+                                gr_gpcs_swdx_tc_beta_cb_size_r(swdx_index));
+                        val = set_field(val,
+                                gr_gpcs_swdx_tc_beta_cb_size_v_m(),
+                                gr_gpcs_swdx_tc_beta_cb_size_v_f(
+                                        cb_size_steady *
+                                        gr->gpc_ppc_count[gpc_index]));
+                        gk20a_writel(g,
+                                gr_gpcs_swdx_tc_beta_cb_size_r(swdx_index), val);
+                }
+        }
+}
+/*
+ * Run the gk20a context-state initialisation and then, unless it is already
+ * known (non-zero), query the preemption image size with a FECS method whose
+ * mailbox result lands in g->gr.t18x.ctx_vars.preempt_image_size.
+ *
+ * Returns 0 on success or the error of the first failing step.
+ */
+int gr_gp10b_init_ctx_state(struct gk20a *g)
+{
+        struct fecs_method_op_gk20a op = {
+                .mailbox = {
+                        .id = 0,
+                        .data = 0,
+                        .clr = ~0,
+                        .ok = 0,
+                        .fail = 0,
+                },
+                .method.data = 0,
+                .cond.ok = GR_IS_UCODE_OP_NOT_EQUAL,
+                .cond.fail = GR_IS_UCODE_OP_SKIP,
+        };
+        int err;
+        gk20a_dbg_fn("");
+        err = gr_gk20a_init_ctx_state(g);
+        if (err != 0) {
+                return err;
+        }
+        /* only ask FECS while the size is still unknown */
+        if (g->gr.t18x.ctx_vars.preempt_image_size == 0) {
+                op.mailbox.ret = &g->gr.t18x.ctx_vars.preempt_image_size;
+                op.method.addr =
+                        gr_fecs_method_push_adr_discover_preemption_image_size_v();
+                err = gr_gk20a_submit_fecs_method_op(g, op, false);
+                if (err != 0) {
+                        nvgpu_err(g, "query preempt image size failed");
+                        return err;
+                }
+        }
+        gk20a_dbg_info("preempt image size: %u",
+                       g->gr.t18x.ctx_vars.preempt_image_size);
+        gk20a_dbg_fn("done");
+        return 0;
+}
+/*
+ * Allocate @size bytes with nvgpu_dma_alloc_sys() into @mem and map the
+ * result into @vm with the CACHEABLE flag, storing the GPU VA in
+ * mem->gpu_va.
+ *
+ * Returns 0 on success, the allocator's error if allocation fails, or
+ * -ENOMEM if the mapping yields a zero GPU VA (the allocation is released
+ * again in that case).
+ */
+int gr_gp10b_alloc_buffer(struct vm_gk20a *vm, size_t size,
+                        struct nvgpu_mem *mem)
+{
+        int err;
+        gk20a_dbg_fn("");
+        err = nvgpu_dma_alloc_sys(vm->mm->g, size, mem);
+        if (err != 0) {
+                return err;
+        }
+        mem->gpu_va = nvgpu_gmmu_map(vm, mem, mem->aligned_size,
+                                     NVGPU_AS_MAP_BUFFER_FLAGS_CACHEABLE,
+                                     gk20a_mem_flag_none, false,
+                                     mem->aperture);
+        if (mem->gpu_va != 0) {
+                return 0;
+        }
+        /* mapping failed: give the backing memory back */
+        nvgpu_dma_free(vm->mm->g, mem);
+        return -ENOMEM;
+}
+/*
+ * Select the graphics and compute preemption modes of @gr_ctx.
+ *
+ * The force_preemption_gfxp / force_preemption_cilp flags override the
+ * requested modes for graphics / compute classes respectively. A request is
+ * rejected with -EINVAL when both modes are 0, when GFXP and CILP are
+ * combined, or when a non-zero mode is numerically lower than the one
+ * currently stored in @gr_ctx.
+ *
+ * Selecting GFXP allocates and maps the preempt, spill, beta CB and page
+ * pool buffers in @vm; if any allocation fails, the buffers allocated so far
+ * are released and the allocation error is returned.
+ *
+ * NOTE(review): a GFXP request on a context that is already in GFXP mode
+ * passes the checks above and allocates the four buffers again. Confirm that
+ * callers cannot do this, otherwise the earlier buffers look like they leak.
+ *
+ * Returns 0 on success.
+ */
+int gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g,
+                                struct gr_ctx_desc *gr_ctx,
+                                struct vm_gk20a *vm, u32 class,
+                                u32 graphics_preempt_mode,
+                                u32 compute_preempt_mode)
+{
+        int err = 0;
+        /* debug overrides: force the strongest mode for the class */
+        if (g->ops.gr.is_valid_gfx_class(g, class) &&
+                                g->gr.t18x.ctx_vars.force_preemption_gfxp)
+                graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
+        if (g->ops.gr.is_valid_compute_class(g, class) &&
+                        g->gr.t18x.ctx_vars.force_preemption_cilp)
+                compute_preempt_mode = NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
+        /* check for invalid combinations */
+        if ((graphics_preempt_mode == 0) && (compute_preempt_mode == 0))
+                return -EINVAL;
+        if ((graphics_preempt_mode == NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP) &&
+                   (compute_preempt_mode == NVGPU_PREEMPTION_MODE_COMPUTE_CILP))
+                return -EINVAL;
+        /* Do not allow lower preemption modes than current ones */
+        if (graphics_preempt_mode &&
+           (graphics_preempt_mode < gr_ctx->graphics_preempt_mode))
+                return -EINVAL;
+        if (compute_preempt_mode &&
+           (compute_preempt_mode < gr_ctx->compute_preempt_mode))
+                return -EINVAL;
+        /* set preemption modes */
+        switch (graphics_preempt_mode) {
+        case NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP:
+                {
+                u32 spill_size =
+                        gr_gpc0_swdx_rm_spill_buffer_size_256b_default_v() *
+                        gr_gpc0_swdx_rm_spill_buffer_size_256b_byte_granularity_v();
+                u32 pagepool_size = g->ops.gr.pagepool_default_size(g) *
+                        gr_scc_pagepool_total_pages_byte_granularity_v();
+                u32 betacb_size = g->gr.attrib_cb_default_size +
+                                  (gr_gpc0_ppc0_cbm_beta_cb_size_v_gfxp_v() -
+                                   gr_gpc0_ppc0_cbm_beta_cb_size_v_default_v());
+                u32 attrib_cb_size = (betacb_size + g->gr.alpha_cb_size) *
+                                  gr_gpc0_ppc0_cbm_beta_cb_size_v_granularity_v() *
+                                  g->gr.max_tpc_count;
+                attrib_cb_size = ALIGN(attrib_cb_size, 128);
+                /* the sizes are u32, so print them as unsigned */
+                gk20a_dbg_info("gfxp context spill_size=%u", spill_size);
+                gk20a_dbg_info("gfxp context pagepool_size=%u", pagepool_size);
+                gk20a_dbg_info("gfxp context attrib_cb_size=%u",
+                                attrib_cb_size);
+                err = gr_gp10b_alloc_buffer(vm,
+                                        g->gr.t18x.ctx_vars.preempt_image_size,
+                                        &gr_ctx->t18x.preempt_ctxsw_buffer);
+                if (err) {
+                        nvgpu_err(g, "cannot allocate preempt buffer");
+                        goto fail;
+                }
+                err = gr_gp10b_alloc_buffer(vm,
+                                        spill_size,
+                                        &gr_ctx->t18x.spill_ctxsw_buffer);
+                if (err) {
+                        nvgpu_err(g, "cannot allocate spill buffer");
+                        goto fail_free_preempt;
+                }
+                err = gr_gp10b_alloc_buffer(vm,
+                                        attrib_cb_size,
+                                        &gr_ctx->t18x.betacb_ctxsw_buffer);
+                if (err) {
+                        nvgpu_err(g, "cannot allocate beta buffer");
+                        goto fail_free_spill;
+                }
+                err = gr_gp10b_alloc_buffer(vm,
+                                        pagepool_size,
+                                        &gr_ctx->t18x.pagepool_ctxsw_buffer);
+                if (err) {
+                        nvgpu_err(g, "cannot allocate page pool");
+                        goto fail_free_betacb;
+                }
+                /* commit the mode only once every buffer exists */
+                gr_ctx->graphics_preempt_mode = graphics_preempt_mode;
+                break;
+                }
+        case NVGPU_PREEMPTION_MODE_GRAPHICS_WFI:
+                gr_ctx->graphics_preempt_mode = graphics_preempt_mode;
+                break;
+        default:
+                break;
+        }
+        if (g->ops.gr.is_valid_compute_class(g, class) ||
+                        g->ops.gr.is_valid_gfx_class(g, class)) {
+                switch (compute_preempt_mode) {
+                case NVGPU_PREEMPTION_MODE_COMPUTE_WFI:
+                case NVGPU_PREEMPTION_MODE_COMPUTE_CTA:
+                case NVGPU_PREEMPTION_MODE_COMPUTE_CILP:
+                        gr_ctx->compute_preempt_mode = compute_preempt_mode;
+                        break;
+                default:
+                        break;
+                }
+        }
+        return 0;
+        /* unwind in reverse allocation order */
+fail_free_betacb:
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.betacb_ctxsw_buffer);
+fail_free_spill:
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.spill_ctxsw_buffer);
+fail_free_preempt:
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.preempt_ctxsw_buffer);
+fail:
+        return err;
+}
+/*
+ * Allocate a graphics context through gr_gk20a_alloc_gr_ctx() and, when
+ * @flags asks for GFXP and/or CILP support, configure the matching
+ * preemption modes through the set_ctxsw_preemption_mode HAL op.
+ *
+ * Returns 0 on success. On failure after the base allocation the context is
+ * freed, *@gr_ctx is set to NULL and a negative errno is returned: the op's
+ * error, or -EINVAL when a preemption mode is requested but the op is not
+ * provided.
+ */
+int gr_gp10b_alloc_gr_ctx(struct gk20a *g,
+                          struct gr_ctx_desc **gr_ctx, struct vm_gk20a *vm,
+                          u32 class,
+                          u32 flags)
+{
+        int err;
+        u32 graphics_preempt_mode = 0;
+        u32 compute_preempt_mode = 0;
+        gk20a_dbg_fn("");
+        err = gr_gk20a_alloc_gr_ctx(g, gr_ctx, vm, class, flags);
+        if (err)
+                return err;
+        (*gr_ctx)->t18x.ctx_id_valid = false;
+        if (flags & NVGPU_OBJ_CTX_FLAGS_SUPPORT_GFXP)
+                graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
+        if (flags & NVGPU_OBJ_CTX_FLAGS_SUPPORT_CILP)
+                compute_preempt_mode = NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
+        if (graphics_preempt_mode || compute_preempt_mode) {
+                if (!g->ops.gr.set_ctxsw_preemption_mode) {
+                        /*
+                         * err is still 0 from the successful allocation
+                         * above; without an explicit code the caller would
+                         * see "success" together with a NULL context.
+                         */
+                        err = -EINVAL;
+                        goto fail_free_gk20a_ctx;
+                }
+                err = g->ops.gr.set_ctxsw_preemption_mode(g, *gr_ctx, vm,
+                    class, graphics_preempt_mode, compute_preempt_mode);
+                if (err) {
+                        nvgpu_err(g, "set_ctxsw_preemption_mode failed");
+                        goto fail_free_gk20a_ctx;
+                }
+        }
+        gk20a_dbg_fn("done");
+        return 0;
+fail_free_gk20a_ctx:
+        gr_gk20a_free_gr_ctx(g, vm, *gr_ctx);
+        *gr_ctx = NULL;
+        return err;
+}
+/*
+ * Log, at error level, a set of fields read from the main context image in
+ * gr_ctx->mem: the magic value, the timestamp buffer pointer/control words,
+ * the save-operation counters and the preemption option words.
+ *
+ * If nvgpu_mem_begin() fails, a warning is raised and nothing is logged.
+ * @vm is not used.
+ */
+static void dump_ctx_switch_stats(struct gk20a *g, struct vm_gk20a *vm,
+                  struct gr_ctx_desc *gr_ctx)
+{
+        struct nvgpu_mem *image = &gr_ctx->mem;
+        u32 word;
+        if (nvgpu_mem_begin(g, image) != 0) {
+                WARN_ON("Cannot map context");
+                return;
+        }
+        word = nvgpu_mem_rd(g, image, ctxsw_prog_main_image_magic_value_o());
+        nvgpu_err(g, "ctxsw_prog_main_image_magic_value_o : %x (expect %x)",
+                word, ctxsw_prog_main_image_magic_value_v_value_v());
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_context_timestamp_buffer_ptr_hi_o());
+        nvgpu_err(g, "ctxsw_prog_main_image_context_timestamp_buffer_ptr_hi : %x",
+                word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_context_timestamp_buffer_ptr_o());
+        nvgpu_err(g, "ctxsw_prog_main_image_context_timestamp_buffer_ptr : %x",
+                word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_context_timestamp_buffer_control_o());
+        nvgpu_err(g, "ctxsw_prog_main_image_context_timestamp_buffer_control : %x",
+                word);
+        /* save-operation counters */
+        word = nvgpu_mem_rd(g, image, ctxsw_prog_main_image_num_save_ops_o());
+        nvgpu_err(g, "NUM_SAVE_OPERATIONS : %d", word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_num_wfi_save_ops_o());
+        nvgpu_err(g, "WFI_SAVE_OPERATIONS : %d", word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_num_cta_save_ops_o());
+        nvgpu_err(g, "CTA_SAVE_OPERATIONS : %d", word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_num_gfxp_save_ops_o());
+        nvgpu_err(g, "GFXP_SAVE_OPERATIONS : %d", word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_num_cilp_save_ops_o());
+        nvgpu_err(g, "CILP_SAVE_OPERATIONS : %d", word);
+        /* preemption option words */
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_graphics_preemption_options_o());
+        nvgpu_err(g,
+                "image gfx preemption option (GFXP is 1) %x", word);
+        word = nvgpu_mem_rd(g, image,
+                ctxsw_prog_main_image_compute_preemption_options_o());
+        nvgpu_err(g,
+                "image compute preemption option (CTA is 1) %x", word);
+        nvgpu_mem_end(g, image);
+}
+/*
+ * Release a graphics context: optionally dump its context-switch statistics
+ * (when dump_ctxsw_stats_on_channel_close is set), unmap and free the four
+ * t18x preemption buffers, then hand the context to gr_gk20a_free_gr_ctx().
+ *
+ * A NULL @gr_ctx is accepted and ignored.
+ */
+void gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm,
+                          struct gr_ctx_desc *gr_ctx)
+{
+        gk20a_dbg_fn("");
+        if (gr_ctx == NULL) {
+                return;
+        }
+        if (g->gr.t18x.ctx_vars.dump_ctxsw_stats_on_channel_close) {
+                dump_ctx_switch_stats(g, vm, gr_ctx);
+        }
+        /* preemption buffers go first, then the base context */
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.pagepool_ctxsw_buffer);
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.betacb_ctxsw_buffer);
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.spill_ctxsw_buffer);
+        nvgpu_dma_unmap_free(vm, &gr_ctx->t18x.preempt_ctxsw_buffer);
+        gr_gk20a_free_gr_ctx(g, vm, gr_ctx);
+        gk20a_dbg_fn("done");
+}
+/*
+ * Apply the preemption settings held in ch_ctx->gr_ctx to a context image.
+ *
+ * When the graphics preempt mode is GFXP, or the compute preempt mode is
+ * CILP or CTA, the matching option value is written into @mem at the
+ * graphics/compute preemption-options offset.  If the preemption ctxsw
+ * buffer has a non-zero gpu_va, its address is passed to the
+ * set_preemption_buffer_va op (when that op is set) and the beta CB,
+ * pagepool, spill buffer and cbes_reserve settings are committed through
+ * patch-context writes.
+ *
+ * A failure to begin the patch write is logged and the remaining buffer
+ * setup is skipped; the function returns void, so the caller is not told.
+ */
+void gr_gp10b_update_ctxsw_preemption_mode(struct gk20a *g,
+                struct channel_ctx_gk20a *ch_ctx,
+                struct nvgpu_mem *mem)
+{
+        struct gr_ctx_desc *gr_ctx = ch_ctx->gr_ctx;
+        struct ctx_header_desc *ctx = &ch_ctx->ctx_header;
+        struct nvgpu_mem *ctxheader = &ctx->mem;
+        u32 gfxp_preempt_option =
+                ctxsw_prog_main_image_graphics_preemption_options_control_gfxp_f();
+        u32 cilp_preempt_option =
+                ctxsw_prog_main_image_compute_preemption_options_control_cilp_f();
+        u32 cta_preempt_option =
+                ctxsw_prog_main_image_compute_preemption_options_control_cta_f();
+        int err;
+        gk20a_dbg_fn("");
+        if (gr_ctx->graphics_preempt_mode == NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP) {
+                gk20a_dbg_info("GfxP: %x", gfxp_preempt_option);
+                nvgpu_mem_wr(g, mem,
+                                ctxsw_prog_main_image_graphics_preemption_options_o(),
+                                gfxp_preempt_option);
+        }
+        /* CILP and CTA both target the same compute preemption-options word */
+        if (gr_ctx->compute_preempt_mode == NVGPU_PREEMPTION_MODE_COMPUTE_CILP) {
+                gk20a_dbg_info("CILP: %x", cilp_preempt_option);
+                nvgpu_mem_wr(g, mem,
+                                ctxsw_prog_main_image_compute_preemption_options_o(),
+                                cilp_preempt_option);
+        }
+        if (gr_ctx->compute_preempt_mode == NVGPU_PREEMPTION_MODE_COMPUTE_CTA) {
+                gk20a_dbg_info("CTA: %x", cta_preempt_option);
+                nvgpu_mem_wr(g, mem,
+                                ctxsw_prog_main_image_compute_preemption_options_o(),
+                                cta_preempt_option);
+        }
+        /* the rest only applies once a preemption ctxsw buffer is mapped */
+        if (gr_ctx->t18x.preempt_ctxsw_buffer.gpu_va) {
+                u32 addr;
+                u32 size;
+                u32 cbes_reserve;
+                if (g->ops.gr.set_preemption_buffer_va) {
+                        /* use the context header when it has a GPU VA, else @mem */
+                        if (ctxheader->gpu_va)
+                                g->ops.gr.set_preemption_buffer_va(g, ctxheader,
+                                gr_ctx->t18x.preempt_ctxsw_buffer.gpu_va);
+                        else
+                                g->ops.gr.set_preemption_buffer_va(g, mem,
+                                gr_ctx->t18x.preempt_ctxsw_buffer.gpu_va);
+                }
+                err = gr_gk20a_ctx_patch_write_begin(g, ch_ctx, true);
+                if (err) {
+                        nvgpu_err(g, "can't map patch context");
+                        goto out;
+                }
+                /*
+                 * Each address below packs a 64-bit GPU VA into 32 bits:
+                 * (lo32 >> align_bits) | (hi32 << (32 - align_bits)).
+                 */
+                addr = (u64_lo32(gr_ctx->t18x.betacb_ctxsw_buffer.gpu_va) >>
+                        gr_gpcs_setup_attrib_cb_base_addr_39_12_align_bits_v()) |
+                        (u64_hi32(gr_ctx->t18x.betacb_ctxsw_buffer.gpu_va) <<
+                         (32 - gr_gpcs_setup_attrib_cb_base_addr_39_12_align_bits_v()));
+                gk20a_dbg_info("attrib cb addr : 0x%016x", addr);
+                g->ops.gr.commit_global_attrib_cb(g, ch_ctx, addr, true);
+                addr = (u64_lo32(gr_ctx->t18x.pagepool_ctxsw_buffer.gpu_va) >>
+                        gr_scc_pagepool_base_addr_39_8_align_bits_v()) |
+                        (u64_hi32(gr_ctx->t18x.pagepool_ctxsw_buffer.gpu_va) <<
+                         (32 - gr_scc_pagepool_base_addr_39_8_align_bits_v()));
+                size = gr_ctx->t18x.pagepool_ctxsw_buffer.size;
+                /* a default-sized pagepool is committed as the hwmax page count */
+                if (size == g->ops.gr.pagepool_default_size(g))
+                        size = gr_scc_pagepool_total_pages_hwmax_v();
+                g->ops.gr.commit_global_pagepool(g, ch_ctx, addr, size, true);
+                addr = (u64_lo32(gr_ctx->t18x.spill_ctxsw_buffer.gpu_va) >>
+                        gr_gpc0_swdx_rm_spill_buffer_addr_39_8_align_bits_v()) |
+                        (u64_hi32(gr_ctx->t18x.spill_ctxsw_buffer.gpu_va) <<
+                         (32 - gr_gpc0_swdx_rm_spill_buffer_addr_39_8_align_bits_v()));
+                /* spill size is programmed in units of the 256b granularity value */
+                size = gr_ctx->t18x.spill_ctxsw_buffer.size /
+                        gr_gpc0_swdx_rm_spill_buffer_size_256b_byte_granularity_v();
+                gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_swdx_rm_spill_buffer_addr_r(),
+                                gr_gpc0_swdx_rm_spill_buffer_addr_39_8_f(addr),
+                                true);
+                gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpc0_swdx_rm_spill_buffer_size_r(),
+                                gr_gpc0_swdx_rm_spill_buffer_size_256b_f(size),
+                                true);
+                /* the same gfxp cbes_reserve value goes to both beta CB control registers */
+                cbes_reserve = gr_gpcs_swdx_beta_cb_ctrl_cbes_reserve_gfxp_v();
+                gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpcs_swdx_beta_cb_ctrl_r(),
+                                gr_gpcs_swdx_beta_cb_ctrl_cbes_reserve_f(
+                                        cbes_reserve),
+                                true);
+                gr_gk20a_ctx_patch_write(g, ch_ctx,
+                                gr_gpcs_ppcs_cbm_beta_cb_ctrl_r(),
+                                gr_gpcs_ppcs_cbm_beta_cb_ctrl_cbes_reserve_f(
+                                        cbes_reserve),
+                                true);
+                gr_gk20a_ctx_patch_write_end(g, ch_ctx, true);
+        }
+out:
+        gk20a_dbg_fn("done");
+}
+/*
+ * Print a fixed list of graphics-engine status registers to a debug output.
+ *
+ * Every entry is read with gk20a_readl() and emitted through
+ * gk20a_debug_output() as "<register name>: 0x<value>".  The list also
+ * includes the FIFO engine status for the GR engine id returned by
+ * gk20a_fifo_get_gr_engine_id().  The two TPC1 activity registers are only
+ * printed when gr->gpc_tpc_count is non-NULL and its first entry equals 2.
+ *
+ * Always returns 0.
+ */
+int gr_gp10b_dump_gr_status_regs(struct gk20a *g,
+                           struct gk20a_debug_output *o)
+{
+        struct gr_gk20a *gr = &g->gr;
+        u32 gr_engine_id;
+        gr_engine_id = gk20a_fifo_get_gr_engine_id(g);
+        gk20a_debug_output(o, "NV_PGRAPH_STATUS: 0x%x\n",
+                gk20a_readl(g, gr_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_STATUS1: 0x%x\n",
+                gk20a_readl(g, gr_status_1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_STATUS2: 0x%x\n",
+                gk20a_readl(g, gr_status_2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_ENGINE_STATUS: 0x%x\n",
+                gk20a_readl(g, gr_engine_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_GRFIFO_STATUS : 0x%x\n",
+                gk20a_readl(g, gr_gpfifo_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_GRFIFO_CONTROL : 0x%x\n",
+                gk20a_readl(g, gr_gpfifo_ctl_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_HOST_INT_STATUS : 0x%x\n",
+                gk20a_readl(g, gr_fecs_host_int_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_EXCEPTION  : 0x%x\n",
+                gk20a_readl(g, gr_exception_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_FECS_INTR  : 0x%x\n",
+                gk20a_readl(g, gr_fecs_intr_r()));
+        gk20a_debug_output(o, "NV_PFIFO_ENGINE_STATUS(GR) : 0x%x\n",
+                gk20a_readl(g, fifo_engine_status_r(gr_engine_id)));
+        gk20a_debug_output(o, "NV_PGRAPH_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_ACTIVITY1: 0x%x\n",
+                gk20a_readl(g, gr_activity_1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_ACTIVITY2: 0x%x\n",
+                gk20a_readl(g, gr_activity_2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_ACTIVITY4: 0x%x\n",
+                gk20a_readl(g, gr_activity_4_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_SKED_ACTIVITY: 0x%x\n",
+                gk20a_readl(g, gr_pri_sked_activity_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_activity0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_ACTIVITY1: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_activity1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_ACTIVITY2: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_activity2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_ACTIVITY3: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_activity3_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPC0_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_tpc0_tpccs_tpc_activity_0_r()));
+        /* TPC1 is only dumped when the first gpc_tpc_count entry is 2 */
+        if (gr->gpc_tpc_count && gr->gpc_tpc_count[0] == 2)
+                gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPC1_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                        gk20a_readl(g, gr_pri_gpc0_tpc1_tpccs_tpc_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPCS_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_tpcs_tpccs_tpc_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_GPCCS_GPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_gpccs_gpc_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_GPCCS_GPC_ACTIVITY1: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_gpccs_gpc_activity_1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_GPCCS_GPC_ACTIVITY2: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_gpccs_gpc_activity_2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_GPCCS_GPC_ACTIVITY3: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_gpccs_gpc_activity_3_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_TPC0_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_tpc0_tpccs_tpc_activity_0_r()));
+        /* same TPC1 condition as for the GPC0 register above */
+        if (gr->gpc_tpc_count && gr->gpc_tpc_count[0] == 2)
+                gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_TPC1_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                        gk20a_readl(g, gr_pri_gpcs_tpc1_tpccs_tpc_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPCS_TPCS_TPCCS_TPC_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpcs_tpcs_tpccs_tpc_activity_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_BECS_BE_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_becs_be_activity0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE1_BECS_BE_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_be1_becs_be_activity0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BES_BECS_BE_ACTIVITY0: 0x%x\n",
+                gk20a_readl(g, gr_pri_bes_becs_be_activity0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_DS_MPIPE_STATUS: 0x%x\n",
+                gk20a_readl(g, gr_pri_ds_mpipe_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FE_GO_IDLE_TIMEOUT : 0x%x\n",
+                gk20a_readl(g, gr_fe_go_idle_timeout_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FE_GO_IDLE_INFO : 0x%x\n",
+                gk20a_readl(g, gr_pri_fe_go_idle_info_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPC0_TEX_M_TEX_SUBUNITS_STATUS: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_tpc0_tex_m_tex_subunits_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_CWD_FS: 0x%x\n",
+                gk20a_readl(g, gr_cwd_fs_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FE_TPC_FS: 0x%x\n",
+                gk20a_readl(g, gr_fe_tpc_fs_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_CWD_GPC_TPC_ID(0): 0x%x\n",
+                gk20a_readl(g, gr_cwd_gpc_tpc_id_r(0)));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_CWD_SM_ID(0): 0x%x\n",
+                gk20a_readl(g, gr_cwd_sm_id_r(0)));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_CTXSW_STATUS_FE_0: 0x%x\n",
+                gk20a_readl(g, gr_fecs_ctxsw_status_fe_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_CTXSW_STATUS_1: 0x%x\n",
+                gk20a_readl(g, gr_fecs_ctxsw_status_1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_CTXSW_STATUS_GPC_0: 0x%x\n",
+                gk20a_readl(g, gr_gpc0_gpccs_ctxsw_status_gpc_0_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_CTXSW_STATUS_1: 0x%x\n",
+                gk20a_readl(g, gr_gpc0_gpccs_ctxsw_status_1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_CTXSW_IDLESTATE : 0x%x\n",
+                gk20a_readl(g, gr_fecs_ctxsw_idlestate_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_CTXSW_IDLESTATE : 0x%x\n",
+                gk20a_readl(g, gr_gpc0_gpccs_ctxsw_idlestate_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_CURRENT_CTX : 0x%x\n",
+                gk20a_readl(g, gr_fecs_current_ctx_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_FECS_NEW_CTX : 0x%x\n",
+                gk20a_readl(g, gr_fecs_new_ctx_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_CROP_STATUS1 : 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_crop_status1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BES_CROP_STATUS1 : 0x%x\n",
+                gk20a_readl(g, gr_pri_bes_crop_status1_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_ZROP_STATUS : 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_zrop_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_ZROP_STATUS2 : 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_zrop_status2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BES_ZROP_STATUS : 0x%x\n",
+                gk20a_readl(g, gr_pri_bes_zrop_status_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BES_ZROP_STATUS2 : 0x%x\n",
+                gk20a_readl(g, gr_pri_bes_zrop_status2_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_BECS_BE_EXCEPTION: 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_becs_be_exception_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_BE0_BECS_BE_EXCEPTION_EN: 0x%x\n",
+                gk20a_readl(g, gr_pri_be0_becs_be_exception_en_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_EXCEPTION: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_exception_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_GPCCS_GPC_EXCEPTION_EN: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_gpccs_gpc_exception_en_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPC0_TPCCS_TPC_EXCEPTION: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_tpc0_tpccs_tpc_exception_r()));
+        gk20a_debug_output(o, "NV_PGRAPH_PRI_GPC0_TPC0_TPCCS_TPC_EXCEPTION_EN: 0x%x\n",
+                gk20a_readl(g, gr_pri_gpc0_tpc0_tpccs_tpc_exception_en_r()));
+        return 0;
+}
+/*
+ * Scan an activity register value as a sequence of 3-bit fields, starting at
+ * the low bits and stopping once no set bits remain.  Returns true when every
+ * scanned field equals the "empty" or the "preempted" encoding, false as soon
+ * as any other value is found.  A value of 0 yields true.
+ */
+static bool gr_activity_empty_or_preempted(u32 val)
+{
+        u32 remaining;
+        for (remaining = val; remaining != 0; remaining >>= 3) {
+                u32 field = remaining & 7;
+                if (field == gr_activity_4_gpc0_empty_v())
+                        continue;
+                if (field == gr_activity_4_gpc0_preempted_v())
+                        continue;
+                return false;
+        }
+        return true;
+}
+/*
+ * Poll until the graphics engine looks idle or the timeout expires.
+ *
+ * Each pass samples gr_status, mc_enable and activity registers 0, 1, 2
+ * and 4.  The wait succeeds when PGRAPH is not enabled in mc_enable, or when
+ * bit 7 of gr_status is clear, activity 0/1/4 hold only empty/preempted
+ * fields and activity 2 reads zero.  Between passes the function sleeps,
+ * doubling the delay each time up to GR_IDLE_CHECK_MAX.
+ *
+ * Returns 0 on success, or -EAGAIN after logging the last sampled state
+ * when duration_ms runs out.
+ */
+int gr_gp10b_wait_empty(struct gk20a *g, unsigned long duration_ms,
+                               u32 expect_delay)
+{
+        struct nvgpu_timeout timeout;
+        u32 poll_delay = expect_delay;
+        u32 status;
+        u32 act0, act1, act2, act4;
+        bool pgraph_on;
+        bool ctxsw_busy;
+        bool gr_idle;
+        bool gr_busy;
+        gk20a_dbg_fn("");
+        nvgpu_timeout_init(g, &timeout, duration_ms, NVGPU_TIMER_CPU_TIMER);
+        do {
+                /* fmodel: host gets fifo_engine_status(gr) from gr
+                   only when gr_status is read */
+                status = gk20a_readl(g, gr_status_r());
+                pgraph_on = (gk20a_readl(g, mc_enable_r()) &
+                             mc_enable_pgraph_enabled_f()) != 0;
+                ctxsw_busy = (status & (1 << 7)) != 0;
+                act0 = gk20a_readl(g, gr_activity_0_r());
+                act1 = gk20a_readl(g, gr_activity_1_r());
+                act2 = gk20a_readl(g, gr_activity_2_r());
+                act4 = gk20a_readl(g, gr_activity_4_r());
+                gr_idle = gr_activity_empty_or_preempted(act0) &&
+                          gr_activity_empty_or_preempted(act1) &&
+                          act2 == 0 &&
+                          gr_activity_empty_or_preempted(act4);
+                gr_busy = !gr_idle;
+                if (!pgraph_on || (gr_idle && !ctxsw_busy)) {
+                        gk20a_dbg_fn("done");
+                        return 0;
+                }
+                /* back off: sleep, then double the delay up to the cap */
+                nvgpu_usleep_range(poll_delay, poll_delay * 2);
+                poll_delay = min_t(u32, poll_delay << 1, GR_IDLE_CHECK_MAX);
+        } while (!nvgpu_timeout_expired(&timeout));
+        nvgpu_err(g,
+                "timeout, ctxsw busy : %d, gr busy : %d, %08x, %08x, %08x, %08x",
+                ctxsw_busy, gr_busy, act0, act1, act2, act4);
+        return -EAGAIN;
+}
+/*
+ * Commit the global attribute circular buffer for a channel context.
+ *
+ * The buffer size comes from the beta CB ctxsw buffer when a preemption
+ * ctxsw buffer is mapped, otherwise from calc_global_ctx_buffer_size(); it
+ * is then divided by the tex_rm_cb_1 128b granularity value.  The gm20b
+ * commit runs first, followed by patch writes of the MPC VTG base address
+ * and the TEX RM CB base and size registers.  @patch is forwarded to every
+ * write.
+ */
+void gr_gp10b_commit_global_attrib_cb(struct gk20a *g,
+                                             struct channel_ctx_gk20a *ch_ctx,
+                                             u64 addr, bool patch)
+{
+        struct gr_ctx_desc *ctx = ch_ctx->gr_ctx;
+        int cb_size;
+        if (!ctx->t18x.preempt_ctxsw_buffer.gpu_va)
+                cb_size = g->ops.gr.calc_global_ctx_buffer_size(g);
+        else
+                cb_size = ctx->t18x.betacb_ctxsw_buffer.size;
+        cb_size /= gr_gpcs_tpcs_tex_rm_cb_1_size_div_128b_granularity_f();
+        gr_gm20b_commit_global_attrib_cb(g, ch_ctx, addr, patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_gpcs_tpcs_mpc_vtg_cb_global_base_addr_r(),
+                gr_gpcs_tpcs_mpc_vtg_cb_global_base_addr_v_f(addr) |
+                gr_gpcs_tpcs_mpc_vtg_cb_global_base_addr_valid_true_f(),
+                patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_gpcs_tpcs_tex_rm_cb_0_r(),
+                gr_gpcs_tpcs_tex_rm_cb_0_base_addr_43_12_f(addr),
+                patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_gpcs_tpcs_tex_rm_cb_1_r(),
+                gr_gpcs_tpcs_tex_rm_cb_1_size_div_128b_f(cb_size) |
+                gr_gpcs_tpcs_tex_rm_cb_1_valid_true_f(),
+                patch);
+}
+/*
+ * Commit the global bundle circular buffer for a channel context.
+ *
+ * Writes the base address and size to both the SCC and the GPCS SWDX bundle
+ * CB registers, then programs pd_ab_dist_cfg2 with the configured token
+ * limit and a state limit.  The state limit is the default bundle CB size
+ * scaled from 256b units to the state-limit granularity, capped at
+ * min_gpm_fifo_depth.  @patch is forwarded to every write.
+ */
+void gr_gp10b_commit_global_bundle_cb(struct gk20a *g,
+                                            struct channel_ctx_gk20a *ch_ctx,
+                                            u64 addr, u64 size, bool patch)
+{
+        struct gr_gk20a *gr = &g->gr;
+        u32 state_limit;
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_scc_bundle_cb_base_r(),
+                gr_scc_bundle_cb_base_addr_39_8_f(addr),
+                patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_scc_bundle_cb_size_r(),
+                gr_scc_bundle_cb_size_div_256b_f(size) |
+                gr_scc_bundle_cb_size_valid_true_f(),
+                patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_gpcs_swdx_bundle_cb_base_r(),
+                gr_gpcs_swdx_bundle_cb_base_addr_39_8_f(addr),
+                patch);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_gpcs_swdx_bundle_cb_size_r(),
+                gr_gpcs_swdx_bundle_cb_size_div_256b_f(size) |
+                gr_gpcs_swdx_bundle_cb_size_valid_true_f(),
+                patch);
+        /* data for state_limit */
+        state_limit = (gr->bundle_cb_default_size *
+                gr_scc_bundle_cb_size_div_256b_byte_granularity_v()) /
+                gr_pd_ab_dist_cfg2_state_limit_scc_bundle_granularity_v();
+        state_limit = min_t(u32, state_limit, gr->min_gpm_fifo_depth);
+        gk20a_dbg_info("bundle cb token limit : %d, state limit : %d",
+                   gr->bundle_cb_token_limit, state_limit);
+        gr_gk20a_ctx_patch_write(g, ch_ctx,
+                gr_pd_ab_dist_cfg2_r(),
+                gr_pd_ab_dist_cfg2_token_limit_f(gr->bundle_cb_token_limit) |
+                gr_pd_ab_dist_cfg2_state_limit_f(state_limit),
+                patch);
+}
+/*
+ * Program the CWD GPC/TPC-id and SM-id registers from g->gr.sm_to_cluster.
+ *
+ * For every SM id below g->gr.tpc_count the GPC and TPC index are packed,
+ * four entries per register, into gr_cwd_gpc_tpc_id_r(i).  In parallel a
+ * temporary table with gr_cwd_sm_id__size_1_v() entries collects the SM ids
+ * and is written to gr_cwd_sm_id_r(i) afterwards.
+ *
+ * Returns 0 on success, -ENOMEM when the temporary table cannot be
+ * allocated.
+ */
+int gr_gp10b_load_smid_config(struct gk20a *g)
+{
+        u32 *tpc_sm_id;
+        u32 i, j;
+        u32 tpc_index, gpc_index;
+        u32 max_gpcs = nvgpu_get_litter_value(g, GPU_LIT_NUM_GPCS);
+        tpc_sm_id = nvgpu_kcalloc(g, gr_cwd_sm_id__size_1_v(), sizeof(u32));
+        if (!tpc_sm_id)
+                return -ENOMEM;
+        /*
+         * Each NV_PGRAPH_PRI_CWD_GPC_TPC_ID can store 4 TPCs.  The bound is
+         * written as "i * 4 < tpc_count" rather than
+         * "i <= (tpc_count - 1) / 4": both agree for a non-zero count, but
+         * the latter wraps to a huge u32 when tpc_count is 0 and would then
+         * write far beyond the valid register range.
+         */
+        for (i = 0; (i * 4) < g->gr.tpc_count; i++) {
+                u32 reg = 0;
+                u32 bit_stride = gr_cwd_gpc_tpc_id_gpc0_s() +
+                                 gr_cwd_gpc_tpc_id_tpc0_s();
+                for (j = 0; j < 4; j++) {
+                        u32 sm_id = (i * 4) + j;
+                        u32 bits;
+                        /* the last register may be only partially filled */
+                        if (sm_id >= g->gr.tpc_count)
+                                break;
+                        gpc_index = g->gr.sm_to_cluster[sm_id].gpc_index;
+                        tpc_index = g->gr.sm_to_cluster[sm_id].tpc_index;
+                        bits = gr_cwd_gpc_tpc_id_gpc0_f(gpc_index) |
+                               gr_cwd_gpc_tpc_id_tpc0_f(tpc_index);
+                        reg |= bits << (j * bit_stride);
+                        /*
+                         * Table slot: gpc_index, offset by max_gpcs when bit 2
+                         * of tpc_index is set; the low two bits of tpc_index
+                         * pick the field inside the slot.
+                         * NOTE(review): the slot is not range-checked against
+                         * gr_cwd_sm_id__size_1_v() - confirm it cannot exceed
+                         * the table for supported configurations.
+                         */
+                        tpc_sm_id[gpc_index + max_gpcs * ((tpc_index & 4) >> 2)]
+                                |= sm_id << (bit_stride * (tpc_index & 3));
+                }
+                gk20a_writel(g, gr_cwd_gpc_tpc_id_r(i), reg);
+        }
+        for (i = 0; i < gr_cwd_sm_id__size_1_v(); i++)
+                gk20a_writel(g, gr_cwd_sm_id_r(i), tpc_sm_id[i]);
+        nvgpu_kfree(g, tpc_sm_id);
+        return 0;
+}
+/*
+ * gp10b floorsweeping-state setup that runs before the gm20b common part.
+ *
+ * Sets the SM TEXIO out-of-range address check mode to arm_63_48_match,
+ * sets the re_suppress field of the SM dispatch control register to
+ * disable, and writes the FECS feature-override ECC register when a
+ * non-zero override value is stored.  Returns whatever
+ * gr_gm20b_init_fs_state() returns.
+ */
+int gr_gp10b_init_fs_state(struct gk20a *g)
+{
+        u32 texio_ctrl;
+        u32 disp_ctrl;
+        u32 ecc_override;
+        gk20a_dbg_fn("");
+        texio_ctrl = gk20a_readl(g, gr_gpcs_tpcs_sm_texio_control_r());
+        texio_ctrl = set_field(texio_ctrl,
+                        gr_gpcs_tpcs_sm_texio_control_oor_addr_check_mode_m(),
+                        gr_gpcs_tpcs_sm_texio_control_oor_addr_check_mode_arm_63_48_match_f());
+        gk20a_writel(g, gr_gpcs_tpcs_sm_texio_control_r(), texio_ctrl);
+        disp_ctrl = gk20a_readl(g, gr_gpcs_tpcs_sm_disp_ctrl_r());
+        disp_ctrl = set_field(disp_ctrl,
+                        gr_gpcs_tpcs_sm_disp_ctrl_re_suppress_m(),
+                        gr_gpcs_tpcs_sm_disp_ctrl_re_suppress_disable_f());
+        gk20a_writel(g, gr_gpcs_tpcs_sm_disp_ctrl_r(), disp_ctrl);
+        /* a stored value of 0 means no ECC override is written */
+        ecc_override = g->gr.t18x.fecs_feature_override_ecc_val;
+        if (ecc_override != 0)
+                gk20a_writel(g, gr_fecs_feature_override_ecc_r(), ecc_override);
+        return gr_gm20b_init_fs_state(g);
+}
+/*
+ * Translate the TPC mask of @gpc_index into the opt_gpu_tpc0_disable fuse
+ * override.  After writing fuse bypass = 1 and access_sw = 0, a mask of 0x1
+ * writes 0x2, a mask of 0x2 writes 0x1, and any other mask writes 0x0.
+ */
+void gr_gp10b_set_gpc_tpc_mask(struct gk20a *g, u32 gpc_index)
+{
+        u32 tpc_disable;
+        nvgpu_tegra_fuse_write_bypass(g, 0x1);
+        nvgpu_tegra_fuse_write_access_sw(g, 0x0);
+        switch (g->gr.gpc_tpc_mask[gpc_index]) {
+        case 0x1:
+                tpc_disable = 0x2;
+                break;
+        case 0x2:
+                tpc_disable = 0x1;
+                break;
+        default:
+                tpc_disable = 0x0;
+                break;
+        }
+        nvgpu_tegra_fuse_write_opt_gpu_tpc0_disable(g, tpc_disable);
+}
+/*
+ * Hand out the gp10b register access map.
+ *
+ * *whitelist is pointed at a function-static table of register offsets and
+ * *num_entries receives the number of entries in that table.  @g is not
+ * used.
+ */
+void gr_gp10b_get_access_map(struct gk20a *g,
+                                   u32 **whitelist, int *num_entries)
+{
+        /* this list must be sorted (low to high) */
+        static u32 gp10b_access_map[] = {
+                0x404468, /* gr_pri_mme_max_instructions       */
+                0x418300, /* gr_pri_gpcs_rasterarb_line_class  */
+                0x418800, /* gr_pri_gpcs_setup_debug           */
+                0x418e00, /* gr_pri_gpcs_swdx_config           */
+                0x418e40, /* gr_pri_gpcs_swdx_tc_bundle_ctrl   */
+                0x418e44, /* gr_pri_gpcs_swdx_tc_bundle_ctrl   */
+                0x418e48, /* gr_pri_gpcs_swdx_tc_bundle_ctrl   */
+                0x418e4c, /* gr_pri_gpcs_swdx_tc_bundle_ctrl   */
+                0x418e50, /* gr_pri_gpcs_swdx_tc_bundle_ctrl   */
+                0x418e58, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e5c, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e60, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e64, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e68, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e6c, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e70, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e74, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e78, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e7c, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e80, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e84, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e88, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e8c, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e90, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x418e94, /* gr_pri_gpcs_swdx_tc_bundle_addr   */
+                0x419864, /* gr_pri_gpcs_tpcs_pe_l2_evict_policy */
+                0x419a04, /* gr_pri_gpcs_tpcs_tex_lod_dbg      */
+                0x419a08, /* gr_pri_gpcs_tpcs_tex_samp_dbg     */
+                0x419e10, /* gr_pri_gpcs_tpcs_sm_dbgr_control0 */
+                0x419f78, /* gr_pri_gpcs_tpcs_sm_disp_ctrl     */
+        };
+        *num_entries = ARRAY_SIZE(gp10b_access_map);
+        *whitelist = gp10b_access_map;
+}
+/*
+ * Disable the faulting channel (or its TSG), update its runlist and issue a
+ * preempt for it.
+ *
+ * After gk20a_disable_channel_tsg() succeeds, the runlist identified by
+ * fault_ch->runlist_id is updated for all channels (~0).  A TSG preempt is
+ * issued when the channel is marked as part of a TSG, a channel preempt
+ * otherwise.
+ *
+ * Returns 0 on success or the error from the disable / runlist update step.
+ */
+static int gr_gp10b_disable_channel_or_tsg(struct gk20a *g, struct channel_gk20a *fault_ch)
+{
+        int ret = 0;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, "");
+        ret = gk20a_disable_channel_tsg(g, fault_ch);
+        if (ret) {
+                nvgpu_err(g,
+                                "CILP: failed to disable channel/TSG!");
+                return ret;
+        }
+        ret = g->ops.fifo.update_runlist(g, fault_ch->runlist_id, ~0, true, false);
+        if (ret) {
+                /* report the runlist that was actually updated, not a fixed 0 */
+                nvgpu_err(g,
+                                "CILP: failed to restart runlist %u!",
+                                fault_ch->runlist_id);
+                return ret;
+        }
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, "CILP: restarted runlist");
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: tsgid: 0x%x", fault_ch->tsgid);
+        if (gk20a_is_channel_marked_as_tsg(fault_ch)) {
+                gk20a_fifo_issue_preempt(g, fault_ch->tsgid, true);
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: preempted tsg");
+        } else {
+                gk20a_fifo_issue_preempt(g, fault_ch->chid, false);
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: preempted channel");
+        }
+        return ret;
+}
+/*
+ * Start a CILP preemption for the faulting channel.
+ *
+ * Steps, in order: return early if a CILP preempt is already pending; look
+ * up and cache the context id if it is not yet valid; submit the FECS
+ * sideband method that configures the interrupt completion option for that
+ * context id; disable the channel or TSG; mark the preempt as pending and
+ * record the channel id; post NVGPU_EVENT_ID_CILP_PREEMPTION_STARTED to the
+ * TSG or the channel.
+ *
+ * Returns 0 on success (including the already-pending case), -EINVAL when
+ * the channel has no gr context, or the error of the failing step.
+ */
+int gr_gp10b_set_cilp_preempt_pending(struct gk20a *g,
+                        struct channel_gk20a *fault_ch)
+{
+        int err;
+        struct gr_ctx_desc *ctx = fault_ch->ch_ctx.gr_ctx;
+        struct fecs_method_op_gk20a op;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, "");
+        if (!ctx)
+                return -EINVAL;
+        if (ctx->t18x.cilp_preempt_pending) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                                "CILP is already pending for chid %d",
+                                fault_ch->chid);
+                return 0;
+        }
+        /* get ctx_id from the ucode image */
+        if (!ctx->t18x.ctx_id_valid) {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                                "CILP: looking up ctx id");
+                err = gr_gk20a_get_ctx_id(g, fault_ch, &ctx->t18x.ctx_id);
+                if (err) {
+                        nvgpu_err(g, "CILP: error looking up ctx id!");
+                        return err;
+                }
+                ctx->t18x.ctx_id_valid = true;
+        }
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: ctx id is 0x%x", ctx->t18x.ctx_id);
+        /* send ucode method to set ctxsw interrupt */
+        op = (struct fecs_method_op_gk20a) {
+                .method.data = ctx->t18x.ctx_id,
+                .method.addr =
+                gr_fecs_method_push_adr_configure_interrupt_completion_option_v(),
+                .mailbox = {
+                        .id = 1 /* sideband */,
+                        .data = 0,
+                        .clr = ~0,
+                        .ret = NULL,
+                        .ok = gr_fecs_ctxsw_mailbox_value_pass_v(),
+                        .fail = 0},
+                .cond.ok = GR_IS_UCODE_OP_EQUAL,
+                .cond.fail = GR_IS_UCODE_OP_SKIP};
+        err = gr_gk20a_submit_fecs_sideband_method_op(g, op);
+        if (err) {
+                nvgpu_err(g, "CILP: failed to enable ctxsw interrupt!");
+                return err;
+        }
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                                "CILP: enabled ctxsw completion interrupt");
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: disabling channel %d",
+                        fault_ch->chid);
+        err = gr_gp10b_disable_channel_or_tsg(g, fault_ch);
+        if (err) {
+                nvgpu_err(g, "CILP: failed to disable channel!!");
+                return err;
+        }
+        /* set cilp_preempt_pending = true and record the channel */
+        ctx->t18x.cilp_preempt_pending = true;
+        g->gr.t18x.cilp_preempt_pending_chid = fault_ch->chid;
+        /* notify whoever owns the channel: the channel itself or its TSG */
+        if (!gk20a_is_channel_marked_as_tsg(fault_ch)) {
+                gk20a_channel_event_id_post_event(fault_ch,
+                                NVGPU_EVENT_ID_CILP_PREEMPTION_STARTED);
+        } else {
+                struct tsg_gk20a *tsg = &g->fifo.tsg[fault_ch->tsgid];
+                gk20a_tsg_event_id_post_event(tsg,
+                                NVGPU_EVENT_ID_CILP_PREEMPTION_STARTED);
+        }
+        return 0;
+}
+/*
+ * Drop the CILP-preempt-pending state of the faulting channel.
+ *
+ * Clears the per-context pending flag and resets the recorded pending
+ * channel id to -1.  If nothing was pending, only a debug message is
+ * emitted.
+ *
+ * Returns -EINVAL when the channel has no gr context, 0 otherwise.
+ */
+static int gr_gp10b_clear_cilp_preempt_pending(struct gk20a *g,
+                                               struct channel_gk20a *fault_ch)
+{
+        struct gr_ctx_desc *ctx = fault_ch->ch_ctx.gr_ctx;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, "");
+        if (!ctx)
+                return -EINVAL;
+        if (ctx->t18x.cilp_preempt_pending) {
+                /* The ucode is self-clearing, so all we need to do here is
+                   to clear cilp_preempt_pending. */
+                ctx->t18x.cilp_preempt_pending = false;
+                g->gr.t18x.cilp_preempt_pending_chid = -1;
+        } else {
+                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                                "CILP is already cleared for chid %d\n",
+                                fault_ch->chid);
+        }
+        return 0;
+}
+/* @brief pre-process work on the SM exceptions to determine if we clear them or not.
+ *
+ * On Pascal, if we are in CILP preemption mode, preempt the channel and handle errors with special processing
+ */
+int gr_gp10b_pre_process_sm_exception(struct gk20a *g,
+                u32 gpc, u32 tpc, u32 sm, u32 global_esr, u32 warp_esr,
+                bool sm_debugger_attached, struct channel_gk20a *fault_ch,
+                bool *early_exit, bool *ignore_debugger)
+{
+        int ret;
+        bool cilp_enabled = false;
+        u32 global_mask = 0, dbgr_control0, global_esr_copy;
+        u32 gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+        u32 tpc_in_gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_TPC_IN_GPC_STRIDE);
+        u32 offset = gpc_stride * gpc + tpc_in_gpc_stride * tpc;
+        *early_exit = false;
+        *ignore_debugger = false;
+        if (fault_ch)
+                cilp_enabled = (fault_ch->ch_ctx.gr_ctx->compute_preempt_mode ==
+                        NVGPU_PREEMPTION_MODE_COMPUTE_CILP);
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg, "SM Exception received on gpc %d tpc %d = %u\n",
+                        gpc, tpc, global_esr);
+        if (cilp_enabled && sm_debugger_attached) {
+                if (global_esr & gr_gpc0_tpc0_sm_hww_global_esr_bpt_int_pending_f())
+                        gk20a_writel(g, gr_gpc0_tpc0_sm_hww_global_esr_r() + offset,
+                                        gr_gpc0_tpc0_sm_hww_global_esr_bpt_int_pending_f());
+                if (global_esr & gr_gpc0_tpc0_sm_hww_global_esr_single_step_complete_pending_f())
+                        gk20a_writel(g, gr_gpc0_tpc0_sm_hww_global_esr_r() + offset,
+                                        gr_gpc0_tpc0_sm_hww_global_esr_single_step_complete_pending_f());
+                global_mask = gr_gpc0_tpc0_sm_hww_global_esr_sm_to_sm_fault_pending_f() |
+                        gr_gpcs_tpcs_sm_hww_global_esr_l1_error_pending_f() |
+                        gr_gpcs_tpcs_sm_hww_global_esr_multiple_warp_errors_pending_f() |
+                        gr_gpcs_tpcs_sm_hww_global_esr_physical_stack_overflow_error_pending_f() |
+                        gr_gpcs_tpcs_sm_hww_global_esr_timeout_error_pending_f() |
+                        gr_gpcs_tpcs_sm_hww_global_esr_bpt_pause_pending_f();
+                if (warp_esr != 0 || (global_esr & global_mask) != 0) {
+                        *ignore_debugger = true;
+                        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                        "CILP: starting wait for LOCKED_DOWN on gpc %d tpc %d\n",
+                                        gpc, tpc);
+                        if (gk20a_dbg_gpu_broadcast_stop_trigger(fault_ch)) {
+                                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                                "CILP: Broadcasting STOP_TRIGGER from gpc %d tpc %d\n",
+                                                gpc, tpc);
+                                g->ops.gr.suspend_all_sms(g, global_mask, false);
+                                gk20a_dbg_gpu_clear_broadcast_stop_trigger(fault_ch);
+                        } else {
+                                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                                "CILP: STOP_TRIGGER from gpc %d tpc %d\n",
+                                                gpc, tpc);
+                                g->ops.gr.suspend_single_sm(g, gpc, tpc, sm, global_mask, true);
+                        }
+                        /* reset the HWW errors after locking down */
+                        global_esr_copy = g->ops.gr.get_sm_hww_global_esr(g,
+                                                        gpc, tpc, sm);
+                        g->ops.gr.clear_sm_hww(g,
+                                                gpc, tpc, sm, global_esr_copy);
+                        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                        "CILP: HWWs cleared for gpc %d tpc %d\n",
+                                        gpc, tpc);
+                        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg, "CILP: Setting CILP preempt pending\n");
+                        ret = gr_gp10b_set_cilp_preempt_pending(g, fault_ch);
+                        if (ret) {
+                                nvgpu_err(g, "CILP: error while setting CILP preempt pending!");
+                                return ret;
+                        }
+                        dbgr_control0 = gk20a_readl(g, gr_gpc0_tpc0_sm_dbgr_control0_r() + offset);
+                        if (dbgr_control0 & gr_gpcs_tpcs_sm_dbgr_control0_single_step_mode_enable_f()) {
+                                gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                                "CILP: clearing SINGLE_STEP_MODE before resume for gpc %d tpc %d\n",
+                                                gpc, tpc);
+                                dbgr_control0 = set_field(dbgr_control0,
+                                                gr_gpcs_tpcs_sm_dbgr_control0_single_step_mode_m(),
+                                                gr_gpcs_tpcs_sm_dbgr_control0_single_step_mode_disable_f());
+                                gk20a_writel(g, gr_gpc0_tpc0_sm_dbgr_control0_r() + offset, dbgr_control0);
+                        }
+                        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg,
+                                        "CILP: resume for gpc %d tpc %d\n",
+                                        gpc, tpc);
+                        g->ops.gr.resume_single_sm(g, gpc, tpc, sm);
+                        *ignore_debugger = true;
+                        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg, "CILP: All done on gpc %d, tpc %d\n", gpc, tpc);
+                }
+                *early_exit = true;
+        }
+        return 0;
+}
+/* Report the channel id stored in g->gr.t18x if its context still has a CILP preempt pending. */
+static int gr_gp10b_get_cilp_preempt_pending_chid(struct gk20a *g, int *__chid)
+{
+        int pending_chid = g->gr.t18x.cilp_preempt_pending_chid;
+        struct channel_gk20a *chan;
+        bool pending;
+        chan = gk20a_channel_get(gk20a_fifo_channel_from_chid(g, pending_chid));
+        if (chan == NULL)
+                return -EINVAL;
+        /* Read the flag between gk20a_channel_get() and gk20a_channel_put(). */
+        pending = chan->ch_ctx.gr_ctx->t18x.cilp_preempt_pending;
+        gk20a_channel_put(chan);
+        /* *__chid is written only when the flag was set; otherwise -EINVAL. */
+        if (!pending)
+                return -EINVAL;
+        *__chid = pending_chid;
+        return 0;
+}
+/*
+ * Handle the CILP ctxsw-save interrupt, then chain to the gk20a FECS handler.
+ */
+int gr_gp10b_handle_fecs_error(struct gk20a *g,
+                                struct channel_gk20a *__ch,
+                                struct gr_gk20a_isr_data *isr_data)
+{
+        u32 fecs_status = gk20a_readl(g, gr_fecs_host_int_status_r());
+        struct channel_gk20a *cilp_ch;
+        struct tsg_gk20a *tsg;
+        int cilp_chid = -1;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr, "");
+        /*
+         * INTR1 (bit 1 of the HOST_INT_STATUS_CTXSW_INTR)
+         * indicates that a CILP ctxsw save has finished; nothing to do without it
+         */
+        if (!(fecs_status & gr_fecs_host_int_status_ctxsw_intr_f(2)))
+                goto clean_up;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                        "CILP: ctxsw save completed!\n");
+        /* clear INTR1 before looking up the channel */
+        gk20a_writel(g, gr_fecs_host_int_clear_r(),
+                        gr_fecs_host_int_clear_ctxsw_intr1_clear_f());
+        if (gr_gp10b_get_cilp_preempt_pending_chid(g, &cilp_chid))
+                goto clean_up;
+        cilp_ch = gk20a_channel_get(gk20a_fifo_channel_from_chid(g, cilp_chid));
+        if (cilp_ch == NULL)
+                goto clean_up;
+        /* unset preempt_pending; on failure no events are posted */
+        if (gr_gp10b_clear_cilp_preempt_pending(g, cilp_ch)) {
+                nvgpu_err(g, "CILP: error while unsetting CILP preempt pending!");
+                goto put_ch;
+        }
+        /* Post events to UMD */
+        gk20a_dbg_gpu_post_events(cilp_ch);
+        if (!gk20a_is_channel_marked_as_tsg(cilp_ch)) {
+                gk20a_channel_event_id_post_event(cilp_ch,
+                        NVGPU_EVENT_ID_CILP_PREEMPTION_COMPLETE);
+        } else {
+                tsg = &g->fifo.tsg[cilp_ch->tsgid];
+                gk20a_tsg_event_id_post_event(tsg,
+                        NVGPU_EVENT_ID_CILP_PREEMPTION_COMPLETE);
+        }
+put_ch:
+        gk20a_channel_put(cilp_ch);
+clean_up:
+        /* handle any remaining interrupts */
+        return gk20a_gr_handle_fecs_error(g, __ch, isr_data);
+}
+/* Read the SM HWW warp ESR for (gpc, tpc); the sm argument is not used here. */
+u32 gp10b_gr_get_sm_hww_warp_esr(struct gk20a *g, u32 gpc, u32 tpc, u32 sm)
+{
+        u32 offset = gk20a_gr_gpc_offset(g, gpc) + gk20a_gr_tpc_offset(g, tpc);
+        u32 esr = gk20a_readl(g, gr_gpc0_tpc0_sm_hww_warp_esr_r() + offset);
+        if (esr & gr_gpc0_tpc0_sm_hww_warp_esr_addr_valid_m())
+                return esr;
+        /* ADDR_VALID is clear: return the value with ADDR_ERROR_TYPE set to NONE */
+        return set_field(esr,
+                        gr_gpc0_tpc0_sm_hww_warp_esr_addr_error_type_m(),
+                        gr_gpc0_tpc0_sm_hww_warp_esr_addr_error_type_none_f());
+}
+/* Return the FECS ECC feature-override register, or 0 when fuse_opt_ecc_en reads 0. */
+u32 get_ecc_override_val(struct gk20a *g)
+{
+        if (gk20a_readl(g, fuse_opt_ecc_en_r()) == 0)
+                return 0;
+        /* fuse register is non-zero: hand back the override register value */
+        return gk20a_readl(g, gr_fecs_feature_override_ecc_r());
+}
+/*
+ * Suspend one channel's context. Returns true if the context was resident.
+ * *cilp_preempt_pending is true only if setting CILP preempt pending succeeded.
+ */
+static bool gr_gp10b_suspend_context(struct channel_gk20a *ch,
+                                bool *cilp_preempt_pending)
+{
+        struct gk20a *g = ch->g;
+        struct gr_ctx_desc *gr_ctx = ch->ch_ctx.gr_ctx;
+        *cilp_preempt_pending = false;
+        if (!gk20a_is_channel_ctx_resident(ch)) {
+                gk20a_disable_channel_tsg(g, ch);
+                return false;
+        }
+        g->ops.gr.suspend_all_sms(g, 0, false);
+        if (gr_ctx->compute_preempt_mode != NVGPU_PREEMPTION_MODE_COMPUTE_CILP)
+                return true;
+        if (gr_gp10b_set_cilp_preempt_pending(g, ch) == 0)
+                *cilp_preempt_pending = true;
+        else
+                nvgpu_err(g, "unable to set CILP preempt pending");
+        /* in CILP mode the SMs are resumed whether or not the call above succeeded */
+        g->ops.gr.resume_all_sms(g);
+        return true;
+}
+/*
+ * Suspend all channels of debug session dbg_s while ctxsw is disabled, then
+ * poll, bounded by the gr idle timeout, until a pending CILP preempt clears.
+ * *ctx_resident_ch_fd is written only if ctxsw was stopped and restarted.
+ */
+int gr_gp10b_suspend_contexts(struct gk20a *g,
+                                struct dbg_session_gk20a *dbg_s,
+                                int *ctx_resident_ch_fd)
+{
+        struct dbg_session_channel_data *entry;
+        struct channel_gk20a *cilp_ch = NULL;
+        struct gr_ctx_desc *gr_ctx;
+        struct nvgpu_timeout timeout;
+        bool cilp_pending = false;
+        u32 poll_us = GR_IDLE_CHECK_DEFAULT;
+        int resident_fd = -1;
+        int err;
+        nvgpu_mutex_acquire(&g->dbg_sessions_lock);
+        err = gr_gk20a_disable_ctxsw(g);
+        if (err) {
+                nvgpu_err(g, "unable to stop gr ctxsw");
+                nvgpu_mutex_release(&g->dbg_sessions_lock);
+                return err;
+        }
+        nvgpu_mutex_acquire(&dbg_s->ch_list_lock);
+        list_for_each_entry(entry, &dbg_s->ch_list, ch_entry) {
+                struct channel_gk20a *ch = &g->fifo.channel[entry->chid];
+                /* the last resident / CILP-pending channel in the list wins */
+                if (gr_gp10b_suspend_context(ch, &cilp_pending))
+                        resident_fd = entry->channel_fd;
+                if (cilp_pending)
+                        cilp_ch = ch;
+        }
+        nvgpu_mutex_release(&dbg_s->ch_list_lock);
+        err = gr_gk20a_enable_ctxsw(g);
+        nvgpu_mutex_release(&g->dbg_sessions_lock);
+        if (err)
+                return err;
+        if (cilp_ch == NULL)
+                goto done;
+        gr_ctx = cilp_ch->ch_ctx.gr_ctx;
+        gk20a_dbg(gpu_dbg_fn | gpu_dbg_gpu_dbg | gpu_dbg_intr,
+                "CILP preempt pending, waiting %lu msecs for preemption",
+                gk20a_get_gr_idle_timeout(g));
+        nvgpu_timeout_init(g, &timeout, gk20a_get_gr_idle_timeout(g),
+                           NVGPU_TIMER_CPU_TIMER);
+        /* sleep between checks, doubling the delay up to GR_IDLE_CHECK_MAX */
+        while (gr_ctx->t18x.cilp_preempt_pending) {
+                nvgpu_usleep_range(poll_us, poll_us * 2);
+                poll_us = min_t(u32, poll_us << 1, GR_IDLE_CHECK_MAX);
+                if (nvgpu_timeout_expired(&timeout))
+                        break;
+        }
+        /* If cilp is still pending at this point, timeout */
+        if (gr_ctx->t18x.cilp_preempt_pending)
+                err = -ETIMEDOUT;
+done:
+        *ctx_resident_ch_fd = resident_fd;
+        return err;
+}
+/* Store the boost flag in the gr context, then apply it via the update_boosted_ctx op. */
+int gr_gp10b_set_boosted_ctx(struct channel_gk20a *ch, bool boost)
+{
+        struct gk20a *g = ch->g;
+        struct gr_ctx_desc *gr_ctx = ch->ch_ctx.gr_ctx;
+        struct nvgpu_mem *ctx_mem = &gr_ctx->mem;
+        int err;
+        gr_ctx->boosted_ctx = boost;
+        if (nvgpu_mem_begin(g, ctx_mem))
+                return -ENOMEM;
+        err = gk20a_disable_channel_tsg(g, ch);
+        if (err)
+                goto unmap_ctx;
+        err = gk20a_fifo_preempt(g, ch);
+        if (err)
+                goto enable_ch;
+        if (!g->ops.gr.update_boosted_ctx)
+                err = -ENOSYS;
+        else
+                g->ops.gr.update_boosted_ctx(g, ctx_mem, gr_ctx);
+enable_ch:
+        gk20a_enable_channel_tsg(g, ch);
+unmap_ctx:
+        nvgpu_mem_end(g, ctx_mem);
+        return err;
+}
+/* Write gr_ctx->boosted_ctx, encoded as the boost_clock_frequencies field, to pmu_options. */
+void gr_gp10b_update_boosted_ctx(struct gk20a *g, struct nvgpu_mem *mem,
+                                       struct gr_ctx_desc *gr_ctx)
+{
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_pmu_options_o(),
+                ctxsw_prog_main_image_pmu_options_boost_clock_frequencies_f(gr_ctx->boosted_ctx));
+}
+/*
+ * Apply new graphics/compute preemption modes to a channel. A mode of 0, or
+ * one equal to the mode already stored in the gr context, is skipped.
+ * Returns 0 or a negative errno (-ENOMEM if either context mapping fails).
+ */
+int gr_gp10b_set_preemption_mode(struct channel_gk20a *ch,
+                                        u32 graphics_preempt_mode,
+                                        u32 compute_preempt_mode)
+{
+        struct gr_ctx_desc *gr_ctx = ch->ch_ctx.gr_ctx;
+        struct channel_ctx_gk20a *ch_ctx = &ch->ch_ctx;
+        struct gk20a *g = ch->g;
+        struct vm_gk20a *vm;
+        struct nvgpu_mem *mem = &gr_ctx->mem;
+        struct nvgpu_mem *ctxheader = &ch->ch_ctx.ctx_header.mem;
+        u32 class = ch->obj_class;
+        int err = 0;
+        if (!class)
+                return -EINVAL;
+        if (gk20a_is_channel_marked_as_tsg(ch))
+                vm = g->fifo.tsg[ch->tsgid].vm;
+        else
+                vm = ch->vm;
+        /* skip setting anything if both modes are already set */
+        if (graphics_preempt_mode &&
+           (graphics_preempt_mode == gr_ctx->graphics_preempt_mode))
+                graphics_preempt_mode = 0;
+        if (compute_preempt_mode &&
+           (compute_preempt_mode == gr_ctx->compute_preempt_mode))
+                compute_preempt_mode = 0;
+        if (graphics_preempt_mode == 0 && compute_preempt_mode == 0)
+                return 0;
+        if (g->ops.gr.set_ctxsw_preemption_mode) {
+                gk20a_dbg(gpu_dbg_sched, "chid=%d tsgid=%d pid=%d "
+                                "graphics_preempt=%d compute_preempt=%d",
+                                ch->chid, ch->tsgid, ch->tgid,
+                                graphics_preempt_mode,
+                                compute_preempt_mode);
+                err = g->ops.gr.set_ctxsw_preemption_mode(g, gr_ctx, vm, class,
+                                                graphics_preempt_mode, compute_preempt_mode);
+                if (err) {
+                        nvgpu_err(g, "set_ctxsw_preemption_mode failed");
+                        return err;
+                }
+        }
+        if (nvgpu_mem_begin(g, mem))
+                return -ENOMEM;
+        if (nvgpu_mem_begin(g, ctxheader)) {
+                /* err is still 0 here; set it so the failure is not reported as success */
+                err = -ENOMEM;
+                goto unmap_ctx;
+        }
+        err = gk20a_disable_channel_tsg(g, ch);
+        if (err)
+                goto unmap_ctx_header;
+        err = gk20a_fifo_preempt(g, ch);
+        if (err)
+                goto enable_ch;
+        if (g->ops.gr.update_ctxsw_preemption_mode) {
+                g->ops.gr.update_ctxsw_preemption_mode(ch->g, ch_ctx, mem);
+                err = gr_gk20a_ctx_patch_write_begin(g, ch_ctx, true);
+                if (err) {
+                        nvgpu_err(g, "can't map patch context");
+                        goto enable_ch;
+                }
+                g->ops.gr.commit_global_cb_manager(g, ch, true);
+                gr_gk20a_ctx_patch_write_end(g, ch_ctx, true);
+        }
+enable_ch:
+        gk20a_enable_channel_tsg(g, ch);
+unmap_ctx_header:
+        nvgpu_mem_end(g, ctxheader);
+unmap_ctx:
+        nvgpu_mem_end(g, mem);
+        return err;
+}
+/* Fill *preemption_modes_rec with GP10B's mode flags and default modes; always returns 0. */
+int gr_gp10b_get_preemption_mode_flags(struct gk20a *g,
+        struct nvgpu_preemption_modes_rec *preemption_modes_rec)
+{
+        struct nvgpu_preemption_modes_rec *rec = preemption_modes_rec;
+        /* defaults: WFI for both graphics and compute */
+        rec->default_graphics_preempt_mode = NVGPU_PREEMPTION_MODE_GRAPHICS_WFI;
+        rec->default_compute_preempt_mode = NVGPU_PREEMPTION_MODE_COMPUTE_WFI;
+        /* mode flag sets, OR-ed together */
+        rec->graphics_preemption_mode_flags =
+                NVGPU_PREEMPTION_MODE_GRAPHICS_WFI | NVGPU_PREEMPTION_MODE_GRAPHICS_GFXP;
+        rec->compute_preemption_mode_flags = NVGPU_PREEMPTION_MODE_COMPUTE_WFI |
+                NVGPU_PREEMPTION_MODE_COMPUTE_CTA |
+                NVGPU_PREEMPTION_MODE_COMPUTE_CILP;
+        return 0;
+}
+/* Program the GFXP WFI timeout count and set DEBUG_2 gfxp_wfi_always_injects_wfi; returns 0. */
+int gr_gp10b_init_preemption_state(struct gk20a *g)
+{
+        u32 timeout_count = g->gr.gfxp_wfi_timeout_count;
+        u32 reg_val;
+        gk20a_writel(g, gr_fe_gfxp_wfi_timeout_r(),
+                        gr_fe_gfxp_wfi_timeout_count_f(timeout_count));
+        reg_val = gk20a_readl(g, gr_debug_2_r());
+        reg_val = set_field(reg_val,
+                        gr_debug_2_gfxp_wfi_always_injects_wfi_m(),
+                        gr_debug_2_gfxp_wfi_always_injects_wfi_enabled_f());
+        gk20a_writel(g, gr_debug_2_r(), reg_val);
+        return 0;
+}
+/* Write u64_lo32(gpu_va >> 8) to the full_preemption_ptr word of the context image. */
+void gr_gp10b_set_preemption_buffer_va(struct gk20a *g,
+                        struct nvgpu_mem *mem, u64 gpu_va)
+{
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_full_preemption_ptr_o(),
+                        u64_lo32(gpu_va >> 8));
+}
+void gr_gp10b_init_czf_bypass(struct gk20a *g)
+{
+        g->gr.czf_bypass = gr_gpc0_prop_debug1_czf_bypass_init_v(); /* later read by gr_gp10b_set_czf_bypass() */
+}
+/* Issue one GR_CTX WRITE_32 reg op on gr_gpc0_prop_debug1 carrying g->gr.czf_bypass. */
+int gr_gp10b_set_czf_bypass(struct gk20a *g, struct channel_gk20a *ch)
+{
+        /* members not named below (incl. value_hi, and_n_mask_hi) are zero-filled */
+        struct nvgpu_dbg_gpu_reg_op ops = {
+                .op = REGOP(WRITE_32),
+                .type = REGOP(TYPE_GR_CTX),
+                .status = REGOP(STATUS_SUCCESS),
+                .offset = gr_gpc0_prop_debug1_r(),
+                .value_lo = gr_gpc0_prop_debug1_czf_bypass_f(g->gr.czf_bypass),
+                .and_n_mask_lo = gr_gpc0_prop_debug1_czf_bypass_m(),
+        };
+        return __gr_gk20a_exec_ctx_ops(ch, &ops, 1, 1, 0, false);
+}
+/*
+ * Run the gk20a ctxsw header init, then clear the per-mode save-op counters.
+ */
+void gr_gp10b_init_ctxsw_hdr_data(struct gk20a *g, struct nvgpu_mem *mem)
+{
+        gk20a_gr_init_ctxsw_hdr_data(g, mem);
+        /* WFI, CTA, GFXP and CILP save-op counts are each written as zero */
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_num_wfi_save_ops_o(), 0);
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_num_cta_save_ops_o(), 0);
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_num_gfxp_save_ops_o(), 0);
+        nvgpu_mem_wr(g, mem, ctxsw_prog_main_image_num_cilp_save_ops_o(), 0);
+}
diff --git a/drivers/gpu/nvgpu/gp10b/gr_gp10b.h b/drivers/gpu/nvgpu/gp10b/gr_gp10b.h
new file mode 100644
index 00000000..45ac5305
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/gr_gp10b.h
@@ -0,0 +1,171 @@
+/*
+ * GP10B GPU GR
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _NVGPU_GR_GP10B_H_
+#define _NVGPU_GR_GP10B_H_
+#include "gk20a/mm_gk20a.h"
+struct gk20a;
+struct gr_gk20a_isr_data;
+struct channel_ctx_gk20a;
+struct zbc_entry;
+struct gr_ctx_desc;
+struct nvgpu_preemption_modes_rec;
+struct gk20a_debug_output;
+enum { /* Pascal class numbers; four are returned by gp10b_get_litter_value() */
+        PASCAL_CHANNEL_GPFIFO_A  = 0xC06F, /* returned for GPU_LIT_GPFIFO_CLASS */
+        PASCAL_A                 = 0xC097, /* returned for GPU_LIT_THREED_CLASS */
+        PASCAL_COMPUTE_A         = 0xC0C0, /* returned for GPU_LIT_COMPUTE_CLASS */
+        PASCAL_DMA_COPY_A        = 0xC0B5, /* returned for GPU_LIT_DMA_COPY_CLASS */
+        PASCAL_DMA_COPY_B        = 0xC1B5,
+};
+#define NVC097_SET_GO_IDLE_TIMEOUT              0x022c /* NVC097_*: prefix matches PASCAL_A (0xC097) */
+#define NVC097_SET_ALPHA_CIRCULAR_BUFFER_SIZE   0x02dc /* NOTE(review): presumably method offsets */
+#define NVC097_SET_COALESCE_BUFFER_SIZE         0x1028 /* for gr_gp10b_handle_sw_method() - confirm */
+#define NVC097_SET_RD_COALESCE                  0x102c
+#define NVC097_SET_CIRCULAR_BUFFER_SIZE         0x1280
+#define NVC097_SET_SHADER_EXCEPTIONS            0x1528
+#define NVC097_SET_BES_CROP_DEBUG3              0x10c4
+#define NVC0C0_SET_SHADER_EXCEPTIONS            0x1528 /* NVC0C0_*: prefix matches PASCAL_COMPUTE_A (0xC0C0) */
+#define NVC0C0_SET_RD_COALESCE                  0x0228
+int gr_gp10b_init_fs_state(struct gk20a *g);
+int gr_gp10b_alloc_buffer(struct vm_gk20a *vm, size_t size,
+                        struct nvgpu_mem *mem);
+void gr_gp10b_create_sysfs(struct gk20a *g);
+int gr_gp10b_handle_fecs_error(struct gk20a *g,
+                        struct channel_gk20a *__ch,
+                        struct gr_gk20a_isr_data *isr_data);
+int gr_gp10b_set_cilp_preempt_pending(struct gk20a *g,
+                struct channel_gk20a *fault_ch);
+bool gr_gp10b_is_valid_class(struct gk20a *g, u32 class_num);
+bool gr_gp10b_is_valid_gfx_class(struct gk20a *g, u32 class_num);
+bool gr_gp10b_is_valid_compute_class(struct gk20a *g, u32 class_num);
+int gr_gp10b_handle_sm_exception(struct gk20a *g,
+                        u32 gpc, u32 tpc, u32 sm,
+                        bool *post_event, struct channel_gk20a *fault_ch,
+                        u32 *hww_global_esr);
+int gr_gp10b_handle_tex_exception(struct gk20a *g, u32 gpc, u32 tpc,
+                bool *post_event);
+int gr_gp10b_commit_global_cb_manager(struct gk20a *g,
+                        struct channel_gk20a *c, bool patch);
+void gr_gp10b_commit_global_pagepool(struct gk20a *g,
+                                            struct channel_ctx_gk20a *ch_ctx,
+                                            u64 addr, u32 size, bool patch);
+int gr_gp10b_add_zbc_color(struct gk20a *g, struct gr_gk20a *gr,
+                                  struct zbc_entry *color_val, u32 index);
+int gr_gp10b_add_zbc_depth(struct gk20a *g, struct gr_gk20a *gr,
+                                struct zbc_entry *depth_val, u32 index);
+u32 gr_gp10b_pagepool_default_size(struct gk20a *g);
+int gr_gp10b_calc_global_ctx_buffer_size(struct gk20a *g);
+void gr_gp10b_set_bes_crop_debug3(struct gk20a *g, u32 data);
+int gr_gp10b_handle_sw_method(struct gk20a *g, u32 addr,
+                                     u32 class_num, u32 offset, u32 data);
+void gr_gp10b_cb_size_default(struct gk20a *g);
+void gr_gp10b_set_alpha_circular_buffer_size(struct gk20a *g, u32 data);
+void gr_gp10b_set_circular_buffer_size(struct gk20a *g, u32 data);
+int gr_gp10b_init_ctx_state(struct gk20a *g);
+int gr_gp10b_set_ctxsw_preemption_mode(struct gk20a *g,
+                                struct gr_ctx_desc *gr_ctx,
+                                struct vm_gk20a *vm, u32 class,
+                                u32 graphics_preempt_mode,
+                                u32 compute_preempt_mode);
+int gr_gp10b_alloc_gr_ctx(struct gk20a *g,
+                          struct gr_ctx_desc **gr_ctx, struct vm_gk20a *vm,
+                          u32 class,
+                          u32 flags);
+void gr_gp10b_free_gr_ctx(struct gk20a *g, struct vm_gk20a *vm,
+                          struct gr_ctx_desc *gr_ctx);
+void gr_gp10b_update_ctxsw_preemption_mode(struct gk20a *g,
+                struct channel_ctx_gk20a *ch_ctx,
+                struct nvgpu_mem *mem);
+int gr_gp10b_dump_gr_status_regs(struct gk20a *g,
+                           struct gk20a_debug_output *o);
+int gr_gp10b_wait_empty(struct gk20a *g, unsigned long duration_ms,
+                               u32 expect_delay);
+void gr_gp10b_commit_global_attrib_cb(struct gk20a *g,
+                                             struct channel_ctx_gk20a *ch_ctx,
+                                             u64 addr, bool patch);
+void gr_gp10b_commit_global_bundle_cb(struct gk20a *g,
+                                            struct channel_ctx_gk20a *ch_ctx,
+                                            u64 addr, u64 size, bool patch);
+int gr_gp10b_load_smid_config(struct gk20a *g);
+void gr_gp10b_set_gpc_tpc_mask(struct gk20a *g, u32 gpc_index);
+void gr_gp10b_get_access_map(struct gk20a *g,
+                                   u32 **whitelist, int *num_entries);
+int gr_gp10b_pre_process_sm_exception(struct gk20a *g,
+                u32 gpc, u32 tpc, u32 sm, u32 global_esr, u32 warp_esr,
+                bool sm_debugger_attached, struct channel_gk20a *fault_ch,
+                bool *early_exit, bool *ignore_debugger);
+u32 gp10b_gr_get_sm_hww_warp_esr(struct gk20a *g,
+                        u32 gpc, u32 tpc, u32 sm);
+u32 get_ecc_override_val(struct gk20a *g);
+int gr_gp10b_suspend_contexts(struct gk20a *g,
+                                struct dbg_session_gk20a *dbg_s,
+                                int *ctx_resident_ch_fd);
+int gr_gp10b_set_boosted_ctx(struct channel_gk20a *ch,
+                                    bool boost);
+void gr_gp10b_update_boosted_ctx(struct gk20a *g, struct nvgpu_mem *mem,
+                                       struct gr_ctx_desc *gr_ctx);
+int gr_gp10b_set_preemption_mode(struct channel_gk20a *ch,
+                                        u32 graphics_preempt_mode,
+                                        u32 compute_preempt_mode);
+int gr_gp10b_get_preemption_mode_flags(struct gk20a *g,
+        struct nvgpu_preemption_modes_rec *preemption_modes_rec);
+int gp10b_gr_fuse_override(struct gk20a *g);
+int gr_gp10b_init_preemption_state(struct gk20a *g);
+void gr_gp10b_set_preemption_buffer_va(struct gk20a *g,
+                        struct nvgpu_mem *mem, u64 gpu_va);
+int gr_gp10b_set_czf_bypass(struct gk20a *g, struct channel_gk20a *ch);
+void gr_gp10b_init_czf_bypass(struct gk20a *g);
+void gr_gp10b_init_ctxsw_hdr_data(struct gk20a *g, struct nvgpu_mem *mem);
+struct gr_t18x { /* accessed as g->gr.t18x in gr_gp10b.c */
+        struct {
+                u32 preempt_image_size;
+                bool force_preemption_gfxp;
+                bool force_preemption_cilp;
+                bool dump_ctxsw_stats_on_channel_close;
+        } ctx_vars;
+        u32 fecs_feature_override_ecc_val; /* NOTE(review): presumably caches get_ecc_override_val() - confirm */
+        int cilp_preempt_pending_chid; /* read by gr_gp10b_get_cilp_preempt_pending_chid() */
+};
+struct gr_ctx_desc_t18x { /* accessed as gr_ctx->t18x in gr_gp10b.c */
+        struct nvgpu_mem preempt_ctxsw_buffer;
+        struct nvgpu_mem spill_ctxsw_buffer;
+        struct nvgpu_mem betacb_ctxsw_buffer;
+        struct nvgpu_mem pagepool_ctxsw_buffer;
+        u32 ctx_id;
+        bool ctx_id_valid;
+        bool cilp_preempt_pending; /* polled by gr_gp10b_suspend_contexts() until it reads false */
+};
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/hal_gp10b.c b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c
new file mode 100644
index 00000000..9b3d1a2c
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c
@@ -0,0 +1,748 @@
+/*
+ * GP10B Tegra HAL interface
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "gk20a/fifo_gk20a.h"
+#include "gk20a/fecs_trace_gk20a.h"
+#include "gk20a/mm_gk20a.h"
+#include "gk20a/dbg_gpu_gk20a.h"
+#include "gk20a/css_gr_gk20a.h"
+#include "gk20a/bus_gk20a.h"
+#include "gk20a/pramin_gk20a.h"
+#include "gk20a/flcn_gk20a.h"
+#include "gk20a/regops_gk20a.h"
+#include "gk20a/mc_gk20a.h"
+#include "gk20a/fb_gk20a.h"
+#include "gk20a/pmu_gk20a.h"
+#include "gk20a/gr_gk20a.h"
+#include "gk20a/tsg_gk20a.h"
+#include "gp10b/gr_gp10b.h"
+#include "gp10b/fecs_trace_gp10b.h"
+#include "gp10b/mc_gp10b.h"
+#include "gp10b/ltc_gp10b.h"
+#include "gp10b/mm_gp10b.h"
+#include "gp10b/ce_gp10b.h"
+#include "gp10b/fb_gp10b.h"
+#include "gp10b/pmu_gp10b.h"
+#include "gp10b/gr_ctx_gp10b.h"
+#include "gp10b/fifo_gp10b.h"
+#include "gp10b/gp10b_gating_reglist.h"
+#include "gp10b/regops_gp10b.h"
+#include "gp10b/therm_gp10b.h"
+#include "gp10b/priv_ring_gp10b.h"
+#include "gm20b/ltc_gm20b.h"
+#include "gm20b/gr_gm20b.h"
+#include "gm20b/fifo_gm20b.h"
+#include "gm20b/acr_gm20b.h"
+#include "gm20b/pmu_gm20b.h"
+#include "gm20b/clk_gm20b.h"
+#include "gm20b/fb_gm20b.h"
+#include "gm20b/mm_gm20b.h"
+#include "gp10b.h"
+#include "hal_gp10b.h"
+#include <nvgpu/debug.h>
+#include <nvgpu/bug.h>
+#include <nvgpu/enabled.h>
+#include <nvgpu/bus.h>
+#include <nvgpu/ctxsw_trace.h>
+#include <nvgpu/hw/gp10b/hw_proj_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fuse_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fifo_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ram_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_top_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_pram_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_pwr_gp10b.h>
+/* Return the GP10B value for litter id 'value'; an unknown id is logged and hits BUG(). */
+int gp10b_get_litter_value(struct gk20a *g, int value)
+{
+        int ret = -EINVAL; /* negative errno; only returned if BUG() below returns */
+        switch (value) {
+        case GPU_LIT_NUM_GPCS:
+                ret = proj_scal_litter_num_gpcs_v();
+                break;
+        case GPU_LIT_NUM_PES_PER_GPC:
+                ret = proj_scal_litter_num_pes_per_gpc_v();
+                break;
+        case GPU_LIT_NUM_ZCULL_BANKS:
+                ret = proj_scal_litter_num_zcull_banks_v();
+                break;
+        case GPU_LIT_NUM_TPC_PER_GPC:
+                ret = proj_scal_litter_num_tpc_per_gpc_v();
+                break;
+        case GPU_LIT_NUM_SM_PER_TPC:
+                ret = proj_scal_litter_num_sm_per_tpc_v();
+                break;
+        case GPU_LIT_NUM_FBPS:
+                ret = proj_scal_litter_num_fbps_v();
+                break;
+        case GPU_LIT_GPC_BASE:
+                ret = proj_gpc_base_v();
+                break;
+        case GPU_LIT_GPC_STRIDE:
+                ret = proj_gpc_stride_v();
+                break;
+        case GPU_LIT_GPC_SHARED_BASE:
+                ret = proj_gpc_shared_base_v();
+                break;
+        case GPU_LIT_TPC_IN_GPC_BASE:
+                ret = proj_tpc_in_gpc_base_v();
+                break;
+        case GPU_LIT_TPC_IN_GPC_STRIDE:
+                ret = proj_tpc_in_gpc_stride_v();
+                break;
+        case GPU_LIT_TPC_IN_GPC_SHARED_BASE:
+                ret = proj_tpc_in_gpc_shared_base_v();
+                break;
+        case GPU_LIT_PPC_IN_GPC_BASE:
+                ret = proj_ppc_in_gpc_base_v();
+                break;
+        case GPU_LIT_PPC_IN_GPC_STRIDE:
+                ret = proj_ppc_in_gpc_stride_v();
+                break;
+        case GPU_LIT_PPC_IN_GPC_SHARED_BASE:
+                ret = proj_ppc_in_gpc_shared_base_v();
+                break;
+        case GPU_LIT_ROP_BASE:
+                ret = proj_rop_base_v();
+                break;
+        case GPU_LIT_ROP_STRIDE:
+                ret = proj_rop_stride_v();
+                break;
+        case GPU_LIT_ROP_SHARED_BASE:
+                ret = proj_rop_shared_base_v();
+                break;
+        case GPU_LIT_HOST_NUM_ENGINES:
+                ret = proj_host_num_engines_v();
+                break;
+        case GPU_LIT_HOST_NUM_PBDMA:
+                ret = proj_host_num_pbdma_v();
+                break;
+        case GPU_LIT_LTC_STRIDE:
+                ret = proj_ltc_stride_v();
+                break;
+        case GPU_LIT_LTS_STRIDE:
+                ret = proj_lts_stride_v();
+                break;
+        /* Even though GP10B doesn't have an FBPA unit, the HW reports one,
+         * and the microcode as a result leaves space in the context buffer
+         * for one, so make sure SW accounts for this also. */
+        case GPU_LIT_NUM_FBPAS:
+                ret = proj_scal_litter_num_fbpas_v();
+                break;
+        /* Hardcode FBPA values other than NUM_FBPAS to 0. */
+        case GPU_LIT_FBPA_STRIDE:
+        case GPU_LIT_FBPA_BASE:
+        case GPU_LIT_FBPA_SHARED_BASE:
+                ret = 0;
+                break;
+        case GPU_LIT_TWOD_CLASS:
+                ret = FERMI_TWOD_A;
+                break;
+        case GPU_LIT_THREED_CLASS:
+                ret = PASCAL_A;
+                break;
+        case GPU_LIT_COMPUTE_CLASS:
+                ret = PASCAL_COMPUTE_A;
+                break;
+        case GPU_LIT_GPFIFO_CLASS:
+                ret = PASCAL_CHANNEL_GPFIFO_A;
+                break;
+        case GPU_LIT_I2M_CLASS:
+                ret = KEPLER_INLINE_TO_MEMORY_B;
+                break;
+        case GPU_LIT_DMA_COPY_CLASS:
+                ret = PASCAL_DMA_COPY_A;
+                break;
+        default:
+                nvgpu_err(g, "Missing definition %d", value);
+                BUG();
+                break;
+        }
+        return ret;
+}
+static const struct gpu_ops gp10b_ops = {      /* GP10B HAL; copied member by member into g->ops by gp10b_init_hal() */
+        .ltc = {       /* L2 cache hooks: gm20b code reused next to gp10b-specific entries */
+                .determine_L2_size_bytes = gp10b_determine_L2_size_bytes,
+                .set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry,
+                .set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry,
+                .init_cbc = gm20b_ltc_init_cbc,
+                .init_fs_state = gp10b_ltc_init_fs_state,
+                .init_comptags = gp10b_ltc_init_comptags,
+                .cbc_ctrl = gm20b_ltc_cbc_ctrl,
+                .isr = gp10b_ltc_isr,
+                .cbc_fix_config = gm20b_ltc_cbc_fix_config,
+                .flush = gm20b_flush_ltc,
+                .set_enabled = gp10b_ltc_set_enabled,
+        },
+        .ce2 = {       /* copy engine stalling / non-stalling interrupt handlers */
+                .isr_stall = gp10b_ce_isr,
+                .isr_nonstall = gp10b_ce_nonstall_isr,
+        },
+        .gr = {        /* gr hooks: gk20a/gm20b implementations mixed with gp10b ones */
+                .get_patch_slots = gr_gk20a_get_patch_slots,
+                .init_gpc_mmu = gr_gm20b_init_gpc_mmu,
+                .bundle_cb_defaults = gr_gm20b_bundle_cb_defaults,
+                .cb_size_default = gr_gp10b_cb_size_default,
+                .calc_global_ctx_buffer_size =
+                        gr_gp10b_calc_global_ctx_buffer_size,
+                .commit_global_attrib_cb = gr_gp10b_commit_global_attrib_cb,
+                .commit_global_bundle_cb = gr_gp10b_commit_global_bundle_cb,
+                .commit_global_cb_manager = gr_gp10b_commit_global_cb_manager,
+                .commit_global_pagepool = gr_gp10b_commit_global_pagepool,
+                .handle_sw_method = gr_gp10b_handle_sw_method,
+                .set_alpha_circular_buffer_size =
+                        gr_gp10b_set_alpha_circular_buffer_size,
+                .set_circular_buffer_size = gr_gp10b_set_circular_buffer_size,
+                .enable_hww_exceptions = gr_gk20a_enable_hww_exceptions,
+                .is_valid_class = gr_gp10b_is_valid_class,
+                .is_valid_gfx_class = gr_gp10b_is_valid_gfx_class,
+                .is_valid_compute_class = gr_gp10b_is_valid_compute_class,
+                .get_sm_dsm_perf_regs = gr_gm20b_get_sm_dsm_perf_regs,
+                .get_sm_dsm_perf_ctrl_regs = gr_gm20b_get_sm_dsm_perf_ctrl_regs,
+                .init_fs_state = gr_gp10b_init_fs_state,
+                .set_hww_esr_report_mask = gr_gm20b_set_hww_esr_report_mask,
+                .falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments,
+                .load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode, /* reassigned in gp10b_init_hal() per priv security */
+                .set_gpc_tpc_mask = gr_gp10b_set_gpc_tpc_mask,
+                .get_gpc_tpc_mask = gr_gm20b_get_gpc_tpc_mask,
+                .free_channel_ctx = gk20a_free_channel_ctx,
+                .alloc_obj_ctx = gk20a_alloc_obj_ctx,
+                .bind_ctxsw_zcull = gr_gk20a_bind_ctxsw_zcull,
+                .get_zcull_info = gr_gk20a_get_zcull_info,
+                .is_tpc_addr = gr_gm20b_is_tpc_addr,
+                .get_tpc_num = gr_gm20b_get_tpc_num,
+                .detect_sm_arch = gr_gm20b_detect_sm_arch,
+                .add_zbc_color = gr_gp10b_add_zbc_color,
+                .add_zbc_depth = gr_gp10b_add_zbc_depth,
+                .zbc_set_table = gk20a_gr_zbc_set_table,
+                .zbc_query_table = gr_gk20a_query_zbc,
+                .pmu_save_zbc = gk20a_pmu_save_zbc,
+                .add_zbc = gr_gk20a_add_zbc,
+                .pagepool_default_size = gr_gp10b_pagepool_default_size,
+                .init_ctx_state = gr_gp10b_init_ctx_state,
+                .alloc_gr_ctx = gr_gp10b_alloc_gr_ctx,
+                .free_gr_ctx = gr_gp10b_free_gr_ctx,
+                .update_ctxsw_preemption_mode =
+                        gr_gp10b_update_ctxsw_preemption_mode,
+                .dump_gr_regs = gr_gp10b_dump_gr_status_regs,
+                .update_pc_sampling = gr_gm20b_update_pc_sampling,
+                .get_fbp_en_mask = gr_gm20b_get_fbp_en_mask,
+                .get_max_ltc_per_fbp = gr_gm20b_get_max_ltc_per_fbp,
+                .get_max_lts_per_ltc = gr_gm20b_get_max_lts_per_ltc,
+                .get_rop_l2_en_mask = gr_gm20b_rop_l2_en_mask,
+                .get_max_fbps_count = gr_gm20b_get_max_fbps_count,
+                .init_sm_dsm_reg_info = gr_gm20b_init_sm_dsm_reg_info,
+                .wait_empty = gr_gp10b_wait_empty,
+                .init_cyclestats = gr_gm20b_init_cyclestats,
+                .set_sm_debug_mode = gr_gk20a_set_sm_debug_mode,
+                .enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs,
+                .bpt_reg_info = gr_gm20b_bpt_reg_info,
+                .get_access_map = gr_gp10b_get_access_map,
+                .handle_fecs_error = gr_gp10b_handle_fecs_error,
+                .handle_sm_exception = gr_gp10b_handle_sm_exception,
+                .handle_tex_exception = gr_gp10b_handle_tex_exception,
+                .enable_gpc_exceptions = gk20a_gr_enable_gpc_exceptions,
+                .enable_exceptions = gk20a_gr_enable_exceptions,
+                .get_lrf_tex_ltc_dram_override = get_ecc_override_val,
+                .update_smpc_ctxsw_mode = gr_gk20a_update_smpc_ctxsw_mode,
+                .update_hwpm_ctxsw_mode = gr_gk20a_update_hwpm_ctxsw_mode,
+                .record_sm_error_state = gm20b_gr_record_sm_error_state,
+                .update_sm_error_state = gm20b_gr_update_sm_error_state,
+                .clear_sm_error_state = gm20b_gr_clear_sm_error_state,
+                .suspend_contexts = gr_gp10b_suspend_contexts,
+                .resume_contexts = gr_gk20a_resume_contexts,
+                .get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
+                .init_sm_id_table = gr_gk20a_init_sm_id_table,
+                .load_smid_config = gr_gp10b_load_smid_config,
+                .program_sm_id_numbering = gr_gm20b_program_sm_id_numbering,
+                .is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr,
+                .is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr,
+                .split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr,
+                .split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr,
+                .setup_rop_mapping = gr_gk20a_setup_rop_mapping,
+                .program_zcull_mapping = gr_gk20a_program_zcull_mapping,
+                .commit_global_timeslice = gr_gk20a_commit_global_timeslice,
+                .commit_inst = gr_gk20a_commit_inst,
+                .write_zcull_ptr = gr_gk20a_write_zcull_ptr,
+                .write_pm_ptr = gr_gk20a_write_pm_ptr,
+                .init_elcg_mode = gr_gk20a_init_elcg_mode,
+                .load_tpc_mask = gr_gm20b_load_tpc_mask,
+                .inval_icache = gr_gk20a_inval_icache,
+                .trigger_suspend = gr_gk20a_trigger_suspend,
+                .wait_for_pause = gr_gk20a_wait_for_pause,
+                .resume_from_pause = gr_gk20a_resume_from_pause,
+                .clear_sm_errors = gr_gk20a_clear_sm_errors,
+                .tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions,
+                .get_esr_sm_sel = gk20a_gr_get_esr_sm_sel,
+                .sm_debugger_attached = gk20a_gr_sm_debugger_attached,
+                .suspend_single_sm = gk20a_gr_suspend_single_sm,
+                .suspend_all_sms = gk20a_gr_suspend_all_sms,
+                .resume_single_sm = gk20a_gr_resume_single_sm,
+                .resume_all_sms = gk20a_gr_resume_all_sms,
+                .get_sm_hww_warp_esr = gp10b_gr_get_sm_hww_warp_esr,
+                .get_sm_hww_global_esr = gk20a_gr_get_sm_hww_global_esr,
+                .get_sm_no_lock_down_hww_global_esr_mask =
+                        gk20a_gr_get_sm_no_lock_down_hww_global_esr_mask,
+                .lock_down_sm = gk20a_gr_lock_down_sm,
+                .wait_for_sm_lock_down = gk20a_gr_wait_for_sm_lock_down,
+                .clear_sm_hww = gm20b_gr_clear_sm_hww,
+                .init_ovr_sm_dsm_perf =  gk20a_gr_init_ovr_sm_dsm_perf,
+                .get_ovr_perf_regs = gk20a_gr_get_ovr_perf_regs,
+                .disable_rd_coalesce = gm20a_gr_disable_rd_coalesce,
+                .set_boosted_ctx = gr_gp10b_set_boosted_ctx,
+                .set_preemption_mode = gr_gp10b_set_preemption_mode,
+                .set_czf_bypass = gr_gp10b_set_czf_bypass,
+                .init_czf_bypass = gr_gp10b_init_czf_bypass,
+                .pre_process_sm_exception = gr_gp10b_pre_process_sm_exception,
+                .set_preemption_buffer_va = gr_gp10b_set_preemption_buffer_va,
+                .init_preemption_state = gr_gp10b_init_preemption_state,
+                .update_boosted_ctx = gr_gp10b_update_boosted_ctx,
+                .set_bes_crop_debug3 = gr_gp10b_set_bes_crop_debug3,
+                .create_gr_sysfs = gr_gp10b_create_sysfs,
+                .set_ctxsw_preemption_mode = gr_gp10b_set_ctxsw_preemption_mode,
+                .init_ctxsw_hdr_data = gr_gp10b_init_ctxsw_hdr_data,
+        },
+        .fb = {        /* fb hooks: mostly gk20a/gm20b, gp10b compression page sizes */
+                .reset = fb_gk20a_reset,
+                .init_hw = gk20a_fb_init_hw,
+                .init_fs_state = fb_gm20b_init_fs_state,
+                .set_mmu_page_size = gm20b_fb_set_mmu_page_size,
+                .set_use_full_comp_tag_line =
+                        gm20b_fb_set_use_full_comp_tag_line,
+                .compression_page_size = gp10b_fb_compression_page_size,
+                .compressible_page_size = gp10b_fb_compressible_page_size,
+                .vpr_info_fetch = gm20b_fb_vpr_info_fetch,
+                .dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info,
+                .read_wpr_info = gm20b_fb_read_wpr_info,
+                .is_debug_mode_enabled = gm20b_fb_debug_mode_enabled,
+                .set_debug_mode = gm20b_fb_set_debug_mode,
+                .tlb_invalidate = gk20a_fb_tlb_invalidate,
+                .mem_unlock = NULL,    /* no mem_unlock hook is installed by this table */
+        },
+        .clock_gating = {      /* slcg_*, blcg_* and pg_* load_gating_prod hooks, all gp10b variants */
+                .slcg_bus_load_gating_prod =
+                        gp10b_slcg_bus_load_gating_prod,
+                .slcg_ce2_load_gating_prod =
+                        gp10b_slcg_ce2_load_gating_prod,
+                .slcg_chiplet_load_gating_prod =
+                        gp10b_slcg_chiplet_load_gating_prod,
+                .slcg_ctxsw_firmware_load_gating_prod =
+                        gp10b_slcg_ctxsw_firmware_load_gating_prod,
+                .slcg_fb_load_gating_prod =
+                        gp10b_slcg_fb_load_gating_prod,
+                .slcg_fifo_load_gating_prod =
+                        gp10b_slcg_fifo_load_gating_prod,
+                .slcg_gr_load_gating_prod =
+                        gr_gp10b_slcg_gr_load_gating_prod,
+                .slcg_ltc_load_gating_prod =
+                        ltc_gp10b_slcg_ltc_load_gating_prod,
+                .slcg_perf_load_gating_prod =
+                        gp10b_slcg_perf_load_gating_prod,
+                .slcg_priring_load_gating_prod =
+                        gp10b_slcg_priring_load_gating_prod,
+                .slcg_pmu_load_gating_prod =
+                        gp10b_slcg_pmu_load_gating_prod,
+                .slcg_therm_load_gating_prod =
+                        gp10b_slcg_therm_load_gating_prod,
+                .slcg_xbar_load_gating_prod =
+                        gp10b_slcg_xbar_load_gating_prod,
+                .blcg_bus_load_gating_prod =
+                        gp10b_blcg_bus_load_gating_prod,
+                .blcg_ce_load_gating_prod =
+                        gp10b_blcg_ce_load_gating_prod,
+                .blcg_ctxsw_firmware_load_gating_prod =
+                        gp10b_blcg_ctxsw_firmware_load_gating_prod,
+                .blcg_fb_load_gating_prod =
+                        gp10b_blcg_fb_load_gating_prod,
+                .blcg_fifo_load_gating_prod =
+                        gp10b_blcg_fifo_load_gating_prod,
+                .blcg_gr_load_gating_prod =
+                        gp10b_blcg_gr_load_gating_prod,
+                .blcg_ltc_load_gating_prod =
+                        gp10b_blcg_ltc_load_gating_prod,
+                .blcg_pwr_csb_load_gating_prod =
+                        gp10b_blcg_pwr_csb_load_gating_prod,
+                .blcg_pmu_load_gating_prod =
+                        gp10b_blcg_pmu_load_gating_prod,
+                .blcg_xbar_load_gating_prod =
+                        gp10b_blcg_xbar_load_gating_prod,
+                .pg_gr_load_gating_prod =
+                        gr_gp10b_pg_gr_load_gating_prod,
+        },
+        .fifo = {      /* fifo hooks: gk20a defaults with gm20b/gp10b replacements */
+                .init_fifo_setup_hw = gk20a_init_fifo_setup_hw,
+                .bind_channel = channel_gm20b_bind,
+                .unbind_channel = gk20a_fifo_channel_unbind,
+                .disable_channel = gk20a_fifo_disable_channel,
+                .enable_channel = gk20a_fifo_enable_channel,
+                .alloc_inst = gk20a_fifo_alloc_inst,
+                .free_inst = gk20a_fifo_free_inst,
+                .setup_ramfc = channel_gp10b_setup_ramfc,
+                .channel_set_timeslice = gk20a_fifo_set_timeslice,
+                .default_timeslice_us = gk20a_fifo_default_timeslice_us,
+                .setup_userd = gk20a_fifo_setup_userd,
+                .userd_gp_get = gk20a_fifo_userd_gp_get,
+                .userd_gp_put = gk20a_fifo_userd_gp_put,
+                .userd_pb_get = gk20a_fifo_userd_pb_get,
+                .pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val,
+                .preempt_channel = gk20a_fifo_preempt_channel,
+                .preempt_tsg = gk20a_fifo_preempt_tsg,
+                .enable_tsg = gk20a_enable_tsg,
+                .disable_tsg = gk20a_disable_tsg,
+                .tsg_verify_channel_status = gk20a_fifo_tsg_unbind_channel_verify_status,
+                .tsg_verify_status_ctx_reload = gm20b_fifo_tsg_verify_status_ctx_reload,
+                .reschedule_runlist = gk20a_fifo_reschedule_runlist,
+                .update_runlist = gk20a_fifo_update_runlist,
+                .trigger_mmu_fault = gm20b_fifo_trigger_mmu_fault,
+                .get_mmu_fault_info = gp10b_fifo_get_mmu_fault_info,
+                .wait_engine_idle = gk20a_fifo_wait_engine_idle,
+                .get_num_fifos = gm20b_fifo_get_num_fifos,
+                .get_pbdma_signature = gp10b_fifo_get_pbdma_signature,
+                .set_runlist_interleave = gk20a_fifo_set_runlist_interleave,
+                .tsg_set_timeslice = gk20a_fifo_tsg_set_timeslice,
+                .force_reset_ch = gk20a_fifo_force_reset_ch,
+                .engine_enum_from_type = gp10b_fifo_engine_enum_from_type,
+                .device_info_data_parse = gp10b_device_info_data_parse,
+                .eng_runlist_base_size = fifo_eng_runlist_base__size_1_v,
+                .init_engine_info = gk20a_fifo_init_engine_info,
+                .runlist_entry_size = ram_rl_entry_size_v,
+                .get_tsg_runlist_entry = gk20a_get_tsg_runlist_entry,
+                .get_ch_runlist_entry = gk20a_get_ch_runlist_entry,
+                .is_fault_engine_subid_gpc = gk20a_is_fault_engine_subid_gpc,
+                .dump_pbdma_status = gk20a_dump_pbdma_status,
+                .dump_eng_status = gk20a_dump_eng_status,
+                .dump_channel_status_ramfc = gk20a_dump_channel_status_ramfc,
+                .intr_0_error_mask = gk20a_fifo_intr_0_error_mask,
+                .is_preempt_pending = gk20a_fifo_is_preempt_pending,
+                .init_pbdma_intr_descs = gp10b_fifo_init_pbdma_intr_descs,
+                .reset_enable_hw = gk20a_init_fifo_reset_enable_hw,
+                .teardown_ch_tsg = gk20a_fifo_teardown_ch_tsg,
+                .handle_sched_error = gk20a_fifo_handle_sched_error,
+                .handle_pbdma_intr_0 = gk20a_fifo_handle_pbdma_intr_0,
+                .handle_pbdma_intr_1 = gk20a_fifo_handle_pbdma_intr_1,
+                .tsg_bind_channel = gk20a_tsg_bind_channel,
+                .tsg_unbind_channel = gk20a_tsg_unbind_channel,
+#ifdef CONFIG_TEGRA_GK20A_NVHOST /* syncpt helpers are only installed in NVHOST builds */
+                .alloc_syncpt_buf = gk20a_fifo_alloc_syncpt_buf,
+                .free_syncpt_buf = gk20a_fifo_free_syncpt_buf,
+                .add_syncpt_wait_cmd = gk20a_fifo_add_syncpt_wait_cmd,
+                .get_syncpt_wait_cmd_size = gk20a_fifo_get_syncpt_wait_cmd_size,
+                .add_syncpt_incr_cmd = gk20a_fifo_add_syncpt_incr_cmd,
+                .get_syncpt_incr_cmd_size = gk20a_fifo_get_syncpt_incr_cmd_size,
+#endif /* CONFIG_TEGRA_GK20A_NVHOST */
+                .resetup_ramfc = gp10b_fifo_resetup_ramfc,
+                .device_info_fault_id = top_device_info_data_fault_id_enum_v,
+        },
+        .gr_ctx = {    /* netlist name lookup and firmware-defined check */
+                .get_netlist_name = gr_gp10b_get_netlist_name,
+                .is_fw_defined = gr_gp10b_is_firmware_defined,
+        },
+#ifdef CONFIG_GK20A_CTXSW_TRACE
+        .fecs_trace = {        /* gk20a trace hooks; only .flush is gp10b-specific */
+                .alloc_user_buffer = gk20a_ctxsw_dev_ring_alloc,
+                .free_user_buffer = gk20a_ctxsw_dev_ring_free,
+                .mmap_user_buffer = gk20a_ctxsw_dev_mmap_buffer,
+                .init = gk20a_fecs_trace_init,
+                .deinit = gk20a_fecs_trace_deinit,
+                .enable = gk20a_fecs_trace_enable,
+                .disable = gk20a_fecs_trace_disable,
+                .is_enabled = gk20a_fecs_trace_is_enabled,
+                .reset = gk20a_fecs_trace_reset,
+                .flush = gp10b_fecs_trace_flush,
+                .poll = gk20a_fecs_trace_poll,
+                .bind_channel = gk20a_fecs_trace_bind_channel,
+                .unbind_channel = gk20a_fecs_trace_unbind_channel,
+                .max_entries = gk20a_gr_max_entries,
+        },
+#endif /* CONFIG_GK20A_CTXSW_TRACE */
+        .mm = {        /* mm hooks: gk20a/gm20b base with gp10b page-table and BAR2 entries */
+                .support_sparse = gm20b_mm_support_sparse,
+                .gmmu_map = gk20a_locked_gmmu_map,
+                .gmmu_unmap = gk20a_locked_gmmu_unmap,
+                .vm_bind_channel = gk20a_vm_bind_channel,
+                .fb_flush = gk20a_mm_fb_flush,
+                .l2_invalidate = gk20a_mm_l2_invalidate,
+                .l2_flush = gk20a_mm_l2_flush,
+                .cbc_clean = gk20a_mm_cbc_clean,
+                .set_big_page_size = gm20b_mm_set_big_page_size,
+                .get_big_page_sizes = gm20b_mm_get_big_page_sizes,
+                .get_default_big_page_size = gp10b_mm_get_default_big_page_size,
+                .gpu_phys_addr = gm20b_gpu_phys_addr,
+                .get_iommu_bit = gp10b_mm_get_iommu_bit,
+                .get_mmu_levels = gp10b_mm_get_mmu_levels,
+                .init_pdb = gp10b_mm_init_pdb,
+                .init_mm_setup_hw = gp10b_init_mm_setup_hw,
+                .is_bar1_supported = gm20b_mm_is_bar1_supported,
+                .alloc_inst_block = gk20a_alloc_inst_block,
+                .init_inst_block = gk20a_init_inst_block,
+                .mmu_fault_pending = gk20a_fifo_mmu_fault_pending,
+                .init_bar2_vm = gb10b_init_bar2_vm, /* NOTE(review): "gb10b_" (here and next line) looks like a typo of "gp10b_"; must match the definition - confirm */
+                .init_bar2_mm_hw_setup = gb10b_init_bar2_mm_hw_setup,
+                .remove_bar2_vm = gp10b_remove_bar2_vm,
+                .get_kind_invalid = gm20b_get_kind_invalid,
+                .get_kind_pitch = gm20b_get_kind_pitch,
+        },
+        .pramin = {
+                .enter = gk20a_pramin_enter,
+                .exit = gk20a_pramin_exit,
+                .data032_r = pram_data032_r,
+        },
+        .therm = {
+                .init_therm_setup_hw = gp10b_init_therm_setup_hw,
+                .elcg_init_idle_filters = gp10b_elcg_init_idle_filters,
+        },
+        .pmu = {       /* static part only; gp10b_init_hal() adds the priv-security dependent pmu hooks */
+                .pmu_setup_elpg = gp10b_pmu_setup_elpg,
+                .pmu_get_queue_head = pwr_pmu_queue_head_r,
+                .pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v,
+                .pmu_get_queue_tail = pwr_pmu_queue_tail_r,
+                .pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v,
+                .pmu_queue_head = gk20a_pmu_queue_head,
+                .pmu_queue_tail = gk20a_pmu_queue_tail,
+                .pmu_msgq_tail = gk20a_pmu_msgq_tail,
+                .pmu_mutex_size = pwr_pmu_mutex__size_1_v,
+                .pmu_mutex_acquire = gk20a_pmu_mutex_acquire,
+                .pmu_mutex_release = gk20a_pmu_mutex_release,
+                .write_dmatrfbase = gp10b_write_dmatrfbase,
+                .pmu_elpg_statistics = gp10b_pmu_elpg_statistics,
+                .pmu_pg_init_param = gp10b_pg_gr_init,
+                .pmu_pg_supported_engines_list = gk20a_pmu_pg_engines_list,
+                .pmu_pg_engines_feature_list = gk20a_pmu_pg_feature_list,
+                .dump_secure_fuses = pmu_dump_security_fuses_gp10b,
+                .reset_engine = gk20a_pmu_engine_reset,
+                .is_engine_in_reset = gk20a_pmu_is_engine_in_reset,
+        },
+        .regops = {    /* whitelist accessors (table/range getters plus their counts) and the SMPC WAR */
+                .get_global_whitelist_ranges =
+                        gp10b_get_global_whitelist_ranges,
+                .get_global_whitelist_ranges_count =
+                        gp10b_get_global_whitelist_ranges_count,
+                .get_context_whitelist_ranges =
+                        gp10b_get_context_whitelist_ranges,
+                .get_context_whitelist_ranges_count =
+                        gp10b_get_context_whitelist_ranges_count,
+                .get_runcontrol_whitelist = gp10b_get_runcontrol_whitelist,
+                .get_runcontrol_whitelist_count =
+                        gp10b_get_runcontrol_whitelist_count,
+                .get_runcontrol_whitelist_ranges =
+                        gp10b_get_runcontrol_whitelist_ranges,
+                .get_runcontrol_whitelist_ranges_count =
+                        gp10b_get_runcontrol_whitelist_ranges_count,
+                .get_qctl_whitelist = gp10b_get_qctl_whitelist,
+                .get_qctl_whitelist_count = gp10b_get_qctl_whitelist_count,
+                .get_qctl_whitelist_ranges = gp10b_get_qctl_whitelist_ranges,
+                .get_qctl_whitelist_ranges_count =
+                        gp10b_get_qctl_whitelist_ranges_count,
+                .apply_smpc_war = gp10b_apply_smpc_war,
+        },
+        .mc = {        /* interrupt hooks are gp10b-specific; enable/disable/reset/boot_0 come from gk20a */
+                .intr_enable = mc_gp10b_intr_enable,
+                .intr_unit_config = mc_gp10b_intr_unit_config,
+                .isr_stall = mc_gp10b_isr_stall,
+                .intr_stall = mc_gp10b_intr_stall,
+                .intr_stall_pause = mc_gp10b_intr_stall_pause,
+                .intr_stall_resume = mc_gp10b_intr_stall_resume,
+                .intr_nonstall = mc_gp10b_intr_nonstall,
+                .intr_nonstall_pause = mc_gp10b_intr_nonstall_pause,
+                .intr_nonstall_resume = mc_gp10b_intr_nonstall_resume,
+                .enable = gk20a_mc_enable,
+                .disable = gk20a_mc_disable,
+                .reset = gk20a_mc_reset,
+                .boot_0 = gk20a_mc_boot_0,
+                .is_intr1_pending = mc_gp10b_is_intr1_pending,
+        },
+        .debug = {
+                .show_dump = gk20a_debug_show_dump,
+        },
+        .dbg_session_ops = {
+                .exec_reg_ops = exec_regops_gk20a,
+                .dbg_set_powergate = dbg_set_powergate,
+                .check_and_set_global_reservation =
+                        nvgpu_check_and_set_global_reservation,
+                .check_and_set_context_reservation =
+                        nvgpu_check_and_set_context_reservation,
+                .release_profiler_reservation =
+                        nvgpu_release_profiler_reservation,
+                .perfbuffer_enable = gk20a_perfbuf_enable_locked,
+                .perfbuffer_disable = gk20a_perfbuf_disable_locked,
+        },
+        .bus = {
+                .init_hw = gk20a_bus_init_hw,
+                .isr = gk20a_bus_isr,
+                .read_ptimer = gk20a_read_ptimer,
+                .get_timestamps_zipper = nvgpu_get_timestamps_zipper,
+                .bar1_bind = gk20a_bus_bar1_bind,
+        },
+#if defined(CONFIG_GK20A_CYCLE_STATS)
+        .css = {       /* snapshot and perfmon-id hooks, present only with cycle stats enabled */
+                .enable_snapshot = css_hw_enable_snapshot,
+                .disable_snapshot = css_hw_disable_snapshot,
+                .check_data_available = css_hw_check_data_available,
+                .set_handled_snapshots = css_hw_set_handled_snapshots,
+                .allocate_perfmon_ids = css_gr_allocate_perfmon_ids,
+                .release_perfmon_ids = css_gr_release_perfmon_ids,
+        },
+#endif /* CONFIG_GK20A_CYCLE_STATS */
+        .falcon = {
+                .falcon_hal_sw_init = gk20a_falcon_hal_sw_init,
+        },
+        .priv_ring = {
+                .isr = gp10b_priv_ring_isr,
+        },
+        .chip_init_gpu_characteristics = gp10b_init_gpu_characteristics, /* top-level hooks, not grouped in a sub-struct */
+        .get_litter_value = gp10b_get_litter_value,
+};
+/* Install the GP10B HAL into g->ops and derive the priv-security flags.
+ * Returns 0, or -EPERM if priv security is fused on without CONFIG_TEGRA_ACR.
+ */
+int gp10b_init_hal(struct gk20a *g)
+{
+        struct gpu_ops *gops = &g->ops;
+        u32 val;
+        gops->ltc = gp10b_ops.ltc;
+        gops->ce2 = gp10b_ops.ce2;
+        gops->gr = gp10b_ops.gr;
+        gops->fb = gp10b_ops.fb;
+        gops->clock_gating = gp10b_ops.clock_gating;
+        gops->fifo = gp10b_ops.fifo;
+        gops->gr_ctx = gp10b_ops.gr_ctx;
+#ifdef CONFIG_GK20A_CTXSW_TRACE
+        gops->fecs_trace = gp10b_ops.fecs_trace;
+#endif
+        gops->mm = gp10b_ops.mm;
+        gops->pramin = gp10b_ops.pramin;
+        gops->therm = gp10b_ops.therm;
+        gops->pmu = gp10b_ops.pmu;
+        gops->regops = gp10b_ops.regops;
+        gops->mc = gp10b_ops.mc;
+        gops->debug = gp10b_ops.debug;
+        gops->dbg_session_ops = gp10b_ops.dbg_session_ops;
+        gops->bus = gp10b_ops.bus;
+#if defined(CONFIG_GK20A_CYCLE_STATS)
+        gops->css = gp10b_ops.css;
+#endif
+        gops->falcon = gp10b_ops.falcon;
+        gops->priv_ring = gp10b_ops.priv_ring;
+        /* Lone Functions */
+        gops->chip_init_gpu_characteristics =
+                gp10b_ops.chip_init_gpu_characteristics;
+        gops->get_litter_value = gp10b_ops.get_litter_value;
+        __nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true);
+        __nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false);
+#ifdef CONFIG_TEGRA_ACR
+        if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) {
+                __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false);
+                __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false);
+        } else if (g->is_virtual) {
+                __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
+                __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
+        } else {
+                val = gk20a_readl(g, fuse_opt_priv_sec_en_r());
+                if (val) {
+                        __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
+                        __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
+                } else {
+                        gk20a_dbg_info("priv security is disabled in HW");
+                        __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false);
+                        __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false);
+                }
+        }
+#else
+        if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) {
+                gk20a_dbg_info("running simulator with PRIV security disabled");
+                __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false);
+                __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false);
+        } else {
+                val = gk20a_readl(g, fuse_opt_priv_sec_en_r());
+                if (val) {
+                        gk20a_dbg_info("priv security is not supported but enabled");
+                        __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
+                        __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
+                        return -EPERM;
+                } else {
+                        __nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, false);
+                        __nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, false);
+                }
+        }
+#endif
+        /* priv security dependent ops */
+        if (nvgpu_is_enabled(g, NVGPU_SEC_PRIVSECURITY)) {
+                /* Add in ops from gm20b acr, then the gp10b-specific hooks */
+                gops->pmu.is_pmu_supported = gm20b_is_pmu_supported;
+                gops->pmu.prepare_ucode = prepare_ucode_blob;
+                gops->pmu.pmu_setup_hw_and_bootstrap = gm20b_bootstrap_hs_flcn;
+                gops->pmu.get_wpr = gm20b_wpr_info;
+                gops->pmu.alloc_blob_space = gm20b_alloc_blob_space;
+                gops->pmu.pmu_populate_loader_cfg =
+                        gm20b_pmu_populate_loader_cfg;
+                gops->pmu.flcn_populate_bl_dmem_desc =
+                        gm20b_flcn_populate_bl_dmem_desc;
+                gops->pmu.falcon_wait_for_halt = pmu_wait_for_halt;
+                gops->pmu.falcon_clear_halt_interrupt_status =
+                        clear_halt_interrupt_status;
+                gops->pmu.init_falcon_setup_hw = gm20b_init_pmu_setup_hw1;
+                gops->pmu.init_wpr_region = gm20b_pmu_init_acr;
+                gops->pmu.load_lsfalcon_ucode = gp10b_load_falcon_ucode;
+                gops->pmu.is_lazy_bootstrap = gp10b_is_lazy_bootstrap;
+                gops->pmu.is_priv_load = gp10b_is_priv_load;
+                gops->gr.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode;
+        } else {
+                /* Inherit from gk20a, except for the gp10b PMU HW setup */
+                gops->pmu.is_pmu_supported = gk20a_is_pmu_supported;
+                gops->pmu.prepare_ucode = nvgpu_pmu_prepare_ns_ucode_blob;
+                gops->pmu.pmu_setup_hw_and_bootstrap = gp10b_init_pmu_setup_hw1;
+                gops->pmu.pmu_nsbootstrap = pmu_bootstrap;
+                gops->pmu.load_lsfalcon_ucode = NULL;
+                gops->pmu.init_wpr_region = NULL;
+                gops->gr.load_ctxsw_ucode = gr_gk20a_load_ctxsw_ucode;
+        }
+        __nvgpu_set_enabled(g, NVGPU_PMU_FECS_BOOTSTRAP_DONE, false);
+        g->pmu_lsf_pmu_wpr_init_done = 0;
+        g->bootstrap_owner = LSF_BOOTSTRAP_OWNER_DEFAULT;
+        g->name = "gp10b";
+        return 0;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/hal_gp10b.h b/drivers/gpu/nvgpu/gp10b/hal_gp10b.h
new file mode 100644
index 00000000..cf3c295d
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/hal_gp10b.h
@@ -0,0 +1,31 @@
+/*
+ * GP10B Tegra HAL interface
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _NVGPU_HAL_GP10B_H
+#define _NVGPU_HAL_GP10B_H
+struct gk20a;  /* only used through pointers here, so a forward declaration suffices */
+int gp10b_init_hal(struct gk20a *g);   /* fills g->ops; returns 0 or -EPERM */
+int gp10b_get_litter_value(struct gk20a *g, int value); /* value is a GPU_LIT_* id */
+#endif /* _NVGPU_HAL_GP10B_H */
diff --git a/drivers/gpu/nvgpu/gp10b/ltc_gp10b.c b/drivers/gpu/nvgpu/gp10b/ltc_gp10b.c
new file mode 100644
index 00000000..92a899b8
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/ltc_gp10b.c
@@ -0,0 +1,226 @@
+/*
+ * GP10B L2
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <dt-bindings/memory/tegra-swgroup.h>
+#include <nvgpu/ltc.h>
+#include <nvgpu/log.h>
+#include <nvgpu/enabled.h>
+#include <nvgpu/hw/gp10b/hw_mc_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ltc_gp10b.h>
+#include "gk20a/gk20a.h"
+#include "gm20b/ltc_gm20b.h"
+#include "ltc_gp10b.h"
+/*
+ * Compute the total L2 size in bytes.
+ *
+ * The slice size (in KB) and the number of slices per L2 are decoded from
+ * the ltc0/lts0 TSTG info_1 register and scaled by g->ltc_count.
+ *
+ * Returns the computed size as an int.
+ */
+int gp10b_determine_L2_size_bytes(struct gk20a *g)
+{
+        u32 tstg_info;
+        int l2_bytes;
+        gk20a_dbg_fn("");
+        tstg_info = gk20a_readl(g, ltc_ltc0_lts0_tstg_info_1_r());
+        /* ltc_count * (slice size in KB * 1024) * slices per L2 */
+        l2_bytes = g->ltc_count *
+                ltc_ltc0_lts0_tstg_info_1_slice_size_in_kb_v(tstg_info)*1024 *
+                ltc_ltc0_lts0_tstg_info_1_slices_per_l2_v(tstg_info);
+        gk20a_dbg(gpu_dbg_info, "L2 size: %d\n", l2_bytes);
+        gk20a_dbg_fn("done");
+        return l2_bytes;
+}
+/*
+ * Size and allocate the compression bit backing store (CBC) and set up the
+ * comptag allocator.
+ *
+ * @g:  GPU instance.
+ * @gr: graphics state; supplies max_comptag_mem and receives the decoded
+ *      cache geometry on success.
+ *
+ * Returns 0 when no comptag lines are requested or on success; otherwise the
+ * error returned by nvgpu_ltc_alloc_cbc() or gk20a_comptag_allocator_init().
+ */
+int gp10b_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr)
+{
+        /* max memory size (MB) to cover */
+        u32 max_size = gr->max_comptag_mem;
+        /* one tag line covers 64KB */
+        u32 max_comptag_lines = max_size << 4;
+        u32 hw_max_comptag_lines =
+                ltc_ltcs_ltss_cbc_ctrl3_clear_upper_bound_init_v();
+        /* Cache geometry is decoded from the CBC param registers. */
+        u32 cbc_param =
+                gk20a_readl(g, ltc_ltcs_ltss_cbc_param_r());
+        u32 comptags_per_cacheline =
+                ltc_ltcs_ltss_cbc_param_comptags_per_cache_line_v(cbc_param);
+        u32 cacheline_size =
+                512 << ltc_ltcs_ltss_cbc_param_cache_line_size_v(cbc_param);
+        u32 slices_per_ltc =
+                ltc_ltcs_ltss_cbc_param_slices_per_ltc_v(cbc_param);
+        u32 cbc_param2 =
+                gk20a_readl(g, ltc_ltcs_ltss_cbc_param2_r());
+        u32 gobs_per_comptagline_per_slice =
+                ltc_ltcs_ltss_cbc_param2_gobs_per_comptagline_per_slice_v(cbc_param2);
+        u32 compbit_backing_size;
+        int err;
+        gk20a_dbg_fn("");
+        /* Nothing to allocate when no comptag memory is configured. */
+        if (max_comptag_lines == 0)
+                return 0;
+        /* Clamp to the hardware upper bound. */
+        if (max_comptag_lines > hw_max_comptag_lines)
+                max_comptag_lines = hw_max_comptag_lines;
+        /* Per-slice size, rounded up to a whole cache line. */
+        compbit_backing_size =
+                roundup(max_comptag_lines * gobs_per_comptagline_per_slice,
+                        cacheline_size);
+        /* Scale to all slices of all LTCs, rounded to the compressible page. */
+        compbit_backing_size =
+                roundup(compbit_backing_size * slices_per_ltc * g->ltc_count,
+                        g->ops.fb.compressible_page_size(g));
+        /* aligned to 2KB * ltc_count */
+        compbit_backing_size +=
+                g->ltc_count << ltc_ltcs_ltss_cbc_base_alignment_shift_v();
+        /* must be a multiple of 64KB */
+        compbit_backing_size = roundup(compbit_backing_size, 64*1024);
+        gk20a_dbg_info("compbit backing store size : %d",
+                compbit_backing_size);
+        gk20a_dbg_info("max comptag lines : %d",
+                max_comptag_lines);
+        gk20a_dbg_info("gobs_per_comptagline_per_slice: %d",
+                gobs_per_comptagline_per_slice);
+        err = nvgpu_ltc_alloc_cbc(g, compbit_backing_size);
+        if (err)
+                return err;
+        /*
+         * NOTE(review): on failure below the CBC allocated above is not
+         * released here - confirm that the caller cleans it up.
+         */
+        err = gk20a_comptag_allocator_init(g, &gr->comp_tags, max_comptag_lines);
+        if (err)
+                return err;
+        /* Publish the decoded geometry only once everything succeeded. */
+        gr->comptags_per_cacheline = comptags_per_cacheline;
+        gr->slices_per_ltc = slices_per_ltc;
+        gr->cacheline_size = cacheline_size;
+        gr->gobs_per_comptagline_per_slice = gobs_per_comptagline_per_slice;
+        return 0;
+}
+/*
+ * LTC interrupt service routine.
+ *
+ * Reads the MC LTC interrupt register, then for every LTC whose bit is set
+ * walks all of its slices: ECC single-bit (SEC) and double-bit (DED) errors
+ * are accumulated into the per-LTC counters in g->ecc and the matching
+ * hardware count field is cleared. Finally the slice interrupt register is
+ * written back with the value that was read.
+ */
+void gp10b_ltc_isr(struct gk20a *g)
+{
+        u32 mc_intr, ltc_intr;
+        unsigned int ltc, slice;
+        u32 ltc_stride = nvgpu_get_litter_value(g, GPU_LIT_LTC_STRIDE);
+        u32 lts_stride = nvgpu_get_litter_value(g, GPU_LIT_LTS_STRIDE);
+        mc_intr = gk20a_readl(g, mc_intr_ltc_r());
+        nvgpu_err(g, "mc_ltc_intr: %08x", mc_intr);
+        for (ltc = 0; ltc < g->ltc_count; ltc++) {
+                /* Skip LTCs with no bit set; parses as mc_intr & (1 << ltc). */
+                if ((mc_intr & 1 << ltc) == 0)
+                        continue;
+                for (slice = 0; slice < g->gr.slices_per_ltc; slice++) {
+                        /* Register offset of this slice relative to ltc0/lts0. */
+                        u32 offset = ltc_stride * ltc + lts_stride * slice;
+                        ltc_intr = gk20a_readl(g, ltc_ltc0_lts0_intr_r() + offset);
+                        /* Detect and handle ECC errors */
+                        if (ltc_intr &
+                                ltc_ltcs_ltss_intr_ecc_sec_error_pending_f()) {
+                                u32 ecc_stats_reg_val;
+                                nvgpu_err(g,
+                                        "Single bit error detected in GPU L2!");
+                                ecc_stats_reg_val =
+                                        gk20a_readl(g,
+                                                ltc_ltc0_lts0_dstg_ecc_report_r() + offset);
+                                g->ecc.gr.t18x.l2_sec_count.counters[ltc] +=
+                                        ltc_ltc0_lts0_dstg_ecc_report_sec_count_v(ecc_stats_reg_val);
+                                /* Zero only the SEC count field in hardware. */
+                                ecc_stats_reg_val &=
+                                        ~(ltc_ltc0_lts0_dstg_ecc_report_sec_count_m());
+                                gk20a_writel(g,
+                                        ltc_ltc0_lts0_dstg_ecc_report_r() + offset,
+                                        ecc_stats_reg_val);
+                                /* An L2 flush is issued only for the SEC case. */
+                                g->ops.mm.l2_flush(g, true);
+                        }
+                        if (ltc_intr &
+                                ltc_ltcs_ltss_intr_ecc_ded_error_pending_f()) {
+                                u32 ecc_stats_reg_val;
+                                nvgpu_err(g,
+                                        "Double bit error detected in GPU L2!");
+                                ecc_stats_reg_val =
+                                        gk20a_readl(g,
+                                                ltc_ltc0_lts0_dstg_ecc_report_r() + offset);
+                                g->ecc.gr.t18x.l2_ded_count.counters[ltc] +=
+                                        ltc_ltc0_lts0_dstg_ecc_report_ded_count_v(ecc_stats_reg_val);
+                                /* Zero only the DED count field in hardware. */
+                                ecc_stats_reg_val &=
+                                        ~(ltc_ltc0_lts0_dstg_ecc_report_ded_count_m());
+                                gk20a_writel(g,
+                                        ltc_ltc0_lts0_dstg_ecc_report_r() + offset,
+                                        ecc_stats_reg_val);
+                        }
+                        nvgpu_err(g, "ltc%d, slice %d: %08x",
+                                  ltc, slice, ltc_intr);
+                        /* Write the read value back (same address as offset above). */
+                        gk20a_writel(g, ltc_ltc0_lts0_intr_r() +
+                                           ltc_stride * ltc + lts_stride * slice,
+                                     ltc_intr);
+                }
+        }
+}
+/*
+ * GP10B LTC fs-state init: run the GM20B init, program the AXI user stream
+ * ID, then OR the ECC SEC/DED interrupt enable bits into the broadcast LTC
+ * interrupt register.
+ */
+void gp10b_ltc_init_fs_state(struct gk20a *g)
+{
+        u32 ecc_intr_en;
+        u32 intr_reg;
+        /* The GM20B setup runs first; GP10B only adds to it. */
+        gm20b_ltc_init_fs_state(g);
+        gk20a_writel(g, ltc_ltca_g_axi_pctrl_r(),
+                     ltc_ltca_g_axi_pctrl_user_sid_f(TEGRA_SID_GPUB));
+        /* Enable ECC interrupts (read-modify-write) */
+        intr_reg = gk20a_readl(g, ltc_ltcs_ltss_intr_r());
+        ecc_intr_en = ltc_ltcs_ltss_intr_en_ecc_sec_error_enabled_f() |
+                      ltc_ltcs_ltss_intr_en_ecc_ded_error_enabled_f();
+        intr_reg |= ecc_intr_en;
+        gk20a_writel(g, ltc_ltcs_ltss_intr_r(), intr_reg);
+}
+/*
+ * Enable or disable L2 caching by toggling the L2 bypass-mode bit.
+ *
+ * @enabled: true clears bypass (normal caching), false sets bypass
+ *           (no caching).
+ */
+void gp10b_ltc_set_enabled(struct gk20a *g, bool enabled)
+{
+        const u32 bypass_bit =
+                ltc_ltcs_ltss_tstg_set_mgmt_2_l2_bypass_mode_enabled_f();
+        u32 mgmt2 = gk20a_readl(g, ltc_ltcs_ltss_tstg_set_mgmt_2_r());
+        /* Bypass is the inverse of "enabled". */
+        mgmt2 = enabled ? (mgmt2 & ~bypass_bit) : (mgmt2 | bypass_bit);
+        gk20a_writel(g, ltc_ltcs_ltss_tstg_set_mgmt_2_r(), mgmt2);
+}
diff --git a/drivers/gpu/nvgpu/gp10b/ltc_gp10b.h b/drivers/gpu/nvgpu/gp10b/ltc_gp10b.h
new file mode 100644
index 00000000..825204cb
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/ltc_gp10b.h
@@ -0,0 +1,33 @@
+/*
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef LTC_GP10B_H
+#define LTC_GP10B_H
+struct gpu_ops;
+void gp10b_ltc_isr(struct gk20a *g);
+int gp10b_determine_L2_size_bytes(struct gk20a *g);
+int gp10b_ltc_init_comptags(struct gk20a *g, struct gr_gk20a *gr);
+void gp10b_ltc_init_fs_state(struct gk20a *g);
+void gp10b_ltc_set_enabled(struct gk20a *g, bool enabled);
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/mc_gp10b.c b/drivers/gpu/nvgpu/gp10b/mc_gp10b.c
new file mode 100644
index 00000000..9aea76f9
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/mc_gp10b.c
@@ -0,0 +1,185 @@
+/*
+ * GP10B master
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "gk20a/mc_gk20a.h"
+#include "mc_gp10b.h"
+#include <nvgpu/atomic.h>
+#include <nvgpu/unit.h>
+#include <nvgpu/hw/gp10b/hw_mc_gp10b.h>
+/*
+ * Program the stalling and non-stalling interrupt enables.
+ *
+ * For each interrupt tree, all enables are cleared first; the selected unit
+ * mask is then saved in g->mc_intr_mask_restore[] and written to the
+ * enable-set register.
+ */
+void mc_gp10b_intr_enable(struct gk20a *g)
+{
+        u32 engine_mask = gk20a_fifo_engine_interrupt_mask(g);
+        u32 stall_mask;
+        u32 nonstall_mask;
+        /* Stalling tree */
+        gk20a_writel(g, mc_intr_en_clear_r(NVGPU_MC_INTR_STALLING),
+                     0xffffffff);
+        stall_mask = mc_intr_pfifo_pending_f() |
+                     mc_intr_priv_ring_pending_f() |
+                     mc_intr_pbus_pending_f() |
+                     mc_intr_ltc_pending_f() |
+                     mc_intr_replayable_fault_pending_f() |
+                     engine_mask;
+        g->mc_intr_mask_restore[NVGPU_MC_INTR_STALLING] = stall_mask;
+        gk20a_writel(g, mc_intr_en_set_r(NVGPU_MC_INTR_STALLING),
+                     g->mc_intr_mask_restore[NVGPU_MC_INTR_STALLING]);
+        /* Non-stalling tree */
+        gk20a_writel(g, mc_intr_en_clear_r(NVGPU_MC_INTR_NONSTALLING),
+                     0xffffffff);
+        nonstall_mask = mc_intr_pfifo_pending_f() | engine_mask;
+        g->mc_intr_mask_restore[NVGPU_MC_INTR_NONSTALLING] = nonstall_mask;
+        gk20a_writel(g, mc_intr_en_set_r(NVGPU_MC_INTR_NONSTALLING),
+                     g->mc_intr_mask_restore[NVGPU_MC_INTR_NONSTALLING]);
+}
+/*
+ * Enable or disable the interrupt bits in @mask on one interrupt tree.
+ *
+ * @enable:      true writes @mask to the enable-set register, false to the
+ *               enable-clear register.
+ * @is_stalling: selects the stalling or the non-stalling tree.
+ * @mask:        interrupt bits to change.
+ *
+ * The saved restore mask for the tree is updated to match.
+ */
+void mc_gp10b_intr_unit_config(struct gk20a *g, bool enable,
+                bool is_stalling, u32 mask)
+{
+        u32 tree;
+        u32 en_reg;
+        if (is_stalling)
+                tree = NVGPU_MC_INTR_STALLING;
+        else
+                tree = NVGPU_MC_INTR_NONSTALLING;
+        if (!enable) {
+                en_reg = mc_intr_en_clear_r(tree);
+                g->mc_intr_mask_restore[tree] &= ~mask;
+        } else {
+                en_reg = mc_intr_en_set_r(tree);
+                g->mc_intr_mask_restore[tree] |= mask;
+        }
+        gk20a_writel(g, en_reg, mask);
+}
+/*
+ * Stalling interrupt dispatcher.
+ *
+ * Reads mc_intr_r(0) once and dispatches on that snapshot: first to the
+ * engine handlers (GR and CE) of every active engine whose intr_mask is
+ * set, then to the hub, FIFO, PMU, priv ring, LTC and bus handlers.
+ */
+void mc_gp10b_isr_stall(struct gk20a *g)
+{
+        u32 mc_intr_0;
+        u32 engine_id_idx;
+        u32 active_engine_id = 0;
+        u32 engine_enum = ENGINE_INVAL_GK20A;
+        mc_intr_0 = gk20a_readl(g, mc_intr_r(0));
+        gk20a_dbg(gpu_dbg_intr, "stall intr 0x%08x\n", mc_intr_0);
+        for (engine_id_idx = 0; engine_id_idx < g->fifo.num_engines; engine_id_idx++) {
+                active_engine_id = g->fifo.active_engines_list[engine_id_idx];
+                if (mc_intr_0 & g->fifo.engine_info[active_engine_id].intr_mask) {
+                        engine_enum = g->fifo.engine_info[active_engine_id].engine_enum;
+                        /* GR Engine */
+                        if (engine_enum == ENGINE_GR_GK20A) {
+                                gr_gk20a_elpg_protected_call(g, gk20a_gr_isr(g));
+                        }
+                        /* CE Engine */
+                        /* The CE stall handler is optional; skip when NULL. */
+                        if (((engine_enum == ENGINE_GRCE_GK20A) ||
+                                (engine_enum == ENGINE_ASYNC_CE_GK20A)) &&
+                                g->ops.ce2.isr_stall){
+                                        g->ops.ce2.isr_stall(g,
+                                        g->fifo.engine_info[active_engine_id].inst_id,
+                                        g->fifo.engine_info[active_engine_id].pri_base);
+                        }
+                }
+        }
+        /*
+         * The hub ISR runs only when the optional is_intr_hub_pending op
+         * exists and reports a pending hub interrupt; fb.hub_isr itself is
+         * not NULL-checked here.
+         */
+        if (g->ops.mc.is_intr_hub_pending &&
+                 g->ops.mc.is_intr_hub_pending(g, mc_intr_0))
+                g->ops.fb.hub_isr(g);
+        if (mc_intr_0 & mc_intr_pfifo_pending_f())
+                gk20a_fifo_isr(g);
+        if (mc_intr_0 & mc_intr_pmu_pending_f())
+                gk20a_pmu_isr(g);
+        if (mc_intr_0 & mc_intr_priv_ring_pending_f())
+                g->ops.priv_ring.isr(g);
+        if (mc_intr_0 & mc_intr_ltc_pending_f())
+                g->ops.ltc.isr(g);
+        if (mc_intr_0 & mc_intr_pbus_pending_f())
+                g->ops.bus.isr(g);
+        gk20a_dbg(gpu_dbg_intr, "stall intr done 0x%08x\n", mc_intr_0);
+}
+/* Return the current value of the stalling interrupt register. */
+u32 mc_gp10b_intr_stall(struct gk20a *g)
+{
+        u32 stall_intr = gk20a_readl(g, mc_intr_r(NVGPU_MC_INTR_STALLING));
+        return stall_intr;
+}
+/* Mask all stalling interrupts by writing all-ones to enable-clear. */
+void mc_gp10b_intr_stall_pause(struct gk20a *g)
+{
+        u32 en_clear_reg = mc_intr_en_clear_r(NVGPU_MC_INTR_STALLING);
+        gk20a_writel(g, en_clear_reg, 0xffffffff);
+}
+/* Re-enable the stalling interrupts recorded in the saved restore mask. */
+void mc_gp10b_intr_stall_resume(struct gk20a *g)
+{
+        u32 en_set_reg = mc_intr_en_set_r(NVGPU_MC_INTR_STALLING);
+        gk20a_writel(g, en_set_reg,
+                     g->mc_intr_mask_restore[NVGPU_MC_INTR_STALLING]);
+}
+/* Return the current value of the non-stalling interrupt register. */
+u32 mc_gp10b_intr_nonstall(struct gk20a *g)
+{
+        u32 nonstall_intr = gk20a_readl(g, mc_intr_r(NVGPU_MC_INTR_NONSTALLING));
+        return nonstall_intr;
+}
+/* Mask all non-stalling interrupts by writing all-ones to enable-clear. */
+void mc_gp10b_intr_nonstall_pause(struct gk20a *g)
+{
+        u32 en_clear_reg = mc_intr_en_clear_r(NVGPU_MC_INTR_NONSTALLING);
+        gk20a_writel(g, en_clear_reg, 0xffffffff);
+}
+/* Re-enable the non-stalling interrupts recorded in the saved restore mask. */
+void mc_gp10b_intr_nonstall_resume(struct gk20a *g)
+{
+        u32 en_set_reg = mc_intr_en_set_r(NVGPU_MC_INTR_NONSTALLING);
+        gk20a_writel(g, en_set_reg,
+                     g->mc_intr_mask_restore[NVGPU_MC_INTR_NONSTALLING]);
+}
+/*
+ * Report whether @unit has an interrupt pending in @mc_intr_1.
+ *
+ * Only NVGPU_UNIT_FIFO is recognised; any other unit is logged as unknown
+ * and reported as not pending.
+ */
+bool mc_gp10b_is_intr1_pending(struct gk20a *g,
+                                      enum nvgpu_unit unit, u32 mc_intr_1)
+{
+        u32 unit_mask;
+        switch (unit) {
+        case NVGPU_UNIT_FIFO:
+                unit_mask = mc_intr_pfifo_pending_f();
+                break;
+        default:
+                unit_mask = 0;
+                break;
+        }
+        /* A zero mask means the unit has no known pending bit. */
+        if (unit_mask == 0) {
+                nvgpu_err(g, "unknown unit %d", unit);
+                return false;
+        }
+        return (mc_intr_1 & unit_mask) != 0;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/mc_gp10b.h b/drivers/gpu/nvgpu/gp10b/mc_gp10b.h
new file mode 100644
index 00000000..0eb4dd16
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/mc_gp10b.h
@@ -0,0 +1,46 @@
+/*
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+/*
+ * NOTE(review): the guard is spelled MC_GP20B_H although this file is
+ * mc_gp10b.h - confirm no other header uses the same guard name.
+ */
+#ifndef MC_GP20B_H
+#define MC_GP20B_H
+struct gk20a;
+/* Index of an interrupt tree; used with g->mc_intr_mask_restore[]. */
+enum MC_INTERRUPT_REGLIST {
+        NVGPU_MC_INTR_STALLING = 0,
+        NVGPU_MC_INTR_NONSTALLING,
+};
+/* Program the initial stalling and non-stalling interrupt enables. */
+void mc_gp10b_intr_enable(struct gk20a *g);
+/* Enable or disable the bits in @mask on the selected interrupt tree. */
+void mc_gp10b_intr_unit_config(struct gk20a *g, bool enable,
+                bool is_stalling, u32 mask);
+/* Dispatch pending stalling interrupts to the unit handlers. */
+void mc_gp10b_isr_stall(struct gk20a *g);
+/* True when @unit has its pending bit set in @mc_intr_1. */
+bool mc_gp10b_is_intr1_pending(struct gk20a *g,
+                                      enum nvgpu_unit unit, u32 mc_intr_1);
+/* Read / mask / restore the stalling interrupt tree. */
+u32 mc_gp10b_intr_stall(struct gk20a *g);
+void mc_gp10b_intr_stall_pause(struct gk20a *g);
+void mc_gp10b_intr_stall_resume(struct gk20a *g);
+/* Read / mask / restore the non-stalling interrupt tree. */
+u32 mc_gp10b_intr_nonstall(struct gk20a *g);
+void mc_gp10b_intr_nonstall_pause(struct gk20a *g);
+void mc_gp10b_intr_nonstall_resume(struct gk20a *g);
+#endif
diff --git a/drivers/gpu/nvgpu/gp10b/mm_gp10b.c b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
new file mode 100644
index 00000000..4b985af4
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
@@ -0,0 +1,446 @@
+/*
+ * GP10B MMU
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <nvgpu/mm.h>
+#include <nvgpu/dma.h>
+#include <nvgpu/gmmu.h>
+#include "gk20a/gk20a.h"
+#include "gm20b/mm_gm20b.h"
+#include "mm_gp10b.h"
+#include "rpfb_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_fb_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_ram_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_bus_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_gmmu_gp10b.h>
+/* Default big page size for GP10B: 64KB. */
+u32 gp10b_mm_get_default_big_page_size(void)
+{
+        const u32 default_big_page_size = SZ_64K;
+        return default_big_page_size;
+}
+/* Return the IOMMU bit position for GP10B (constant 36; @g is unused). */
+u32 gp10b_mm_get_iommu_bit(struct gk20a *g)
+{
+        const u32 iommu_bit = 36;
+        return iommu_bit;
+}
+/*
+ * Program the MM-related hardware state for GP10B.
+ *
+ * Sets the MMU page size, programs the sysmem flush address, binds the BAR1
+ * instance block, optionally sets up BAR2, flushes the FB and finally
+ * initialises the replayable page fault buffer.
+ *
+ * Returns 0 on success, the BAR2 setup error, -EBUSY when an FB flush
+ * fails, or the result of gp10b_replayable_pagefault_buffer_init().
+ */
+int gp10b_init_mm_setup_hw(struct gk20a *g)
+{
+        struct mm_gk20a *mm = &g->mm;
+        struct nvgpu_mem *inst_block = &mm->bar1.inst_block;
+        int err = 0;
+        gk20a_dbg_fn("");
+        g->ops.fb.set_mmu_page_size(g);
+        /* The register takes the sysmem flush address shifted right by 8. */
+        gk20a_writel(g, fb_niso_flush_sysmem_addr_r(),
+                     nvgpu_mem_get_addr(g, &g->mm.sysmem_flush) >> 8ULL);
+        g->ops.bus.bar1_bind(g, inst_block);
+        /* BAR2 setup is an optional HAL op. */
+        if (g->ops.mm.init_bar2_mm_hw_setup) {
+                err = g->ops.mm.init_bar2_mm_hw_setup(g);
+                if (err)
+                        return err;
+        }
+        /*
+         * Two back-to-back FB flushes: the second is issued only when the
+         * first returned 0, and a nonzero result from either aborts.
+         */
+        if (gk20a_mm_fb_flush(g) || gk20a_mm_fb_flush(g))
+                return -EBUSY;
+        err = gp10b_replayable_pagefault_buffer_init(g);
+        gk20a_dbg_fn("done");
+        return err;
+}
+/*
+ * Create the BAR2 VM and its instance block.
+ *
+ * Sets the BAR2 aperture size to 32MB, creates the "bar2" VM, allocates an
+ * instance block for it and initialises that block.
+ *
+ * Returns 0 on success, -ENOMEM when the VM cannot be created, or the
+ * error from alloc_inst_block (the VM reference is dropped in that case).
+ */
+int gb10b_init_bar2_vm(struct gk20a *g)
+{
+        struct mm_gk20a *mm = &g->mm;
+        struct nvgpu_mem *bar2_inst = &mm->bar2.inst_block;
+        u32 big_pgsz = g->ops.mm.get_default_big_page_size();
+        int ret;
+        /* BAR2 aperture size is 32MB */
+        mm->bar2.aperture_size = 32 << 20;
+        gk20a_dbg_info("bar2 vm size = 0x%x", mm->bar2.aperture_size);
+        mm->bar2.vm = nvgpu_vm_init(g, big_pgsz, SZ_4K,
+                                    mm->bar2.aperture_size - SZ_4K,
+                                    mm->bar2.aperture_size,
+                                    false, false, "bar2");
+        if (!mm->bar2.vm)
+                return -ENOMEM;
+        /* allocate instance mem for bar2 */
+        ret = g->ops.mm.alloc_inst_block(g, bar2_inst);
+        if (ret) {
+                /* Undo the VM creation before reporting the failure. */
+                nvgpu_vm_put(mm->bar2.vm);
+                return ret;
+        }
+        g->ops.mm.init_inst_block(bar2_inst, mm->bar2.vm, big_pgsz);
+        return 0;
+}
+/*
+ * Point the BAR2 block register at the BAR2 instance block.
+ *
+ * The instance block address is shifted by the BAR2 block pointer shift and
+ * truncated to 32 bits, then combined with the aperture target and the
+ * virtual-mode flag. Always returns 0.
+ */
+int gb10b_init_bar2_mm_hw_setup(struct gk20a *g)
+{
+        struct nvgpu_mem *bar2_inst = &g->mm.bar2.inst_block;
+        u64 block_ptr = nvgpu_inst_block_addr(g, bar2_inst);
+        gk20a_dbg_fn("");
+        g->ops.fb.set_mmu_page_size(g);
+        /* Keep only the low 32 bits of the shifted address. */
+        block_ptr = (u32)(block_ptr >> bus_bar2_block_ptr_shift_v());
+        gk20a_dbg_info("bar2 inst block ptr: 0x%08x",  (u32)block_ptr);
+        gk20a_writel(g, bus_bar2_block_r(),
+                     nvgpu_aperture_mask(g, bar2_inst,
+                                         bus_bar2_block_target_sys_mem_ncoh_f(),
+                                         bus_bar2_block_target_vid_mem_f()) |
+                     bus_bar2_block_mode_virtual_f() |
+                     bus_bar2_block_ptr_f(block_ptr));
+        gk20a_dbg_fn("done");
+        return 0;
+}
+/*
+ * Write one two-word PDE at index @pd_idx of @pd.
+ *
+ * @l:         page table level; supplies the entry size/offset.
+ * @phys_addr: physical address stored in the PDE (shifted by the PDE
+ *             address shift before being encoded).
+ * @virt_addr, @attrs: only used for the debug print.
+ */
+static void update_gmmu_pde3_locked(struct vm_gk20a *vm,
+                                    const struct gk20a_mmu_level *l,
+                                    struct nvgpu_gmmu_pd *pd,
+                                    u32 pd_idx,
+                                    u64 virt_addr,
+                                    u64 phys_addr,
+                                    struct nvgpu_gmmu_attrs *attrs)
+{
+        struct gk20a *g = gk20a_from_vm(vm);
+        u32 pd_offset = pd_offset_from_index(l, pd_idx);
+        u32 pde_v[2] = {0, 0};
+        /* From here on phys_addr holds the shifted value (also in the log). */
+        phys_addr >>= gmmu_new_pde_address_shift_v();
+        pde_v[0] |= nvgpu_aperture_mask(g, pd->mem,
+                        gmmu_new_pde_aperture_sys_mem_ncoh_f(),
+                        gmmu_new_pde_aperture_video_memory_f());
+        pde_v[0] |= gmmu_new_pde_address_sys_f(u64_lo32(phys_addr));
+        pde_v[0] |= gmmu_new_pde_vol_true_f();
+        /* Remaining upper bits of the shifted address go in word 1. */
+        pde_v[1] |= phys_addr >> 24;
+        pd_write(g, pd, pd_offset + 0, pde_v[0]);
+        pd_write(g, pd, pd_offset + 1, pde_v[1]);
+        pte_dbg(g, attrs,
+                "PDE: i=%-4u size=%-2u offs=%-4u pgsz: -- | "
+                "GPU %#-12llx  phys %#-12llx "
+                "[0x%08x, 0x%08x]",
+                pd_idx, l->entry_size, pd_offset,
+                virt_addr, phys_addr,
+                pde_v[1], pde_v[0]);
+}
+/*
+ * Write one four-word dual PDE at index @pd_idx of @pd.
+ *
+ * Words 0-1 describe the big-page table and words 2-3 the small-page table.
+ * Only the half matching attrs->pgsz is filled in; the other half is
+ * written as zero.
+ */
+static void update_gmmu_pde0_locked(struct vm_gk20a *vm,
+                                    const struct gk20a_mmu_level *l,
+                                    struct nvgpu_gmmu_pd *pd,
+                                    u32 pd_idx,
+                                    u64 virt_addr,
+                                    u64 phys_addr,
+                                    struct nvgpu_gmmu_attrs *attrs)
+{
+        struct gk20a *g = gk20a_from_vm(vm);
+        bool small_valid, big_valid;
+        u32 small_addr = 0, big_addr = 0;
+        u32 pd_offset = pd_offset_from_index(l, pd_idx);
+        u32 pde_v[4] = {0, 0, 0, 0};
+        small_valid = attrs->pgsz == gmmu_page_size_small;
+        big_valid   = attrs->pgsz == gmmu_page_size_big;
+        /* The shifted address is truncated to 32 bits by these assignments. */
+        if (small_valid)
+                small_addr = phys_addr >> gmmu_new_dual_pde_address_shift_v();
+        if (big_valid)
+                big_addr = phys_addr >> gmmu_new_dual_pde_address_big_shift_v();
+        if (small_valid) {
+                pde_v[2] |=
+                        gmmu_new_dual_pde_address_small_sys_f(small_addr);
+                pde_v[2] |= nvgpu_aperture_mask(g, pd->mem,
+                        gmmu_new_dual_pde_aperture_small_sys_mem_ncoh_f(),
+                        gmmu_new_dual_pde_aperture_small_video_memory_f());
+                pde_v[2] |= gmmu_new_dual_pde_vol_small_true_f();
+                pde_v[3] |= small_addr >> 24;
+        }
+        if (big_valid) {
+                pde_v[0] |= gmmu_new_dual_pde_address_big_sys_f(big_addr);
+                pde_v[0] |= gmmu_new_dual_pde_vol_big_true_f();
+                pde_v[0] |= nvgpu_aperture_mask(g, pd->mem,
+                        gmmu_new_dual_pde_aperture_big_sys_mem_ncoh_f(),
+                        gmmu_new_dual_pde_aperture_big_video_memory_f());
+                pde_v[1] |= big_addr >> 28;
+        }
+        /* All four words are always written, including the unused half. */
+        pd_write(g, pd, pd_offset + 0, pde_v[0]);
+        pd_write(g, pd, pd_offset + 1, pde_v[1]);
+        pd_write(g, pd, pd_offset + 2, pde_v[2]);
+        pd_write(g, pd, pd_offset + 3, pde_v[3]);
+        pte_dbg(g, attrs,
+                "PDE: i=%-4u size=%-2u offs=%-4u pgsz: %c%c | "
+                "GPU %#-12llx  phys %#-12llx "
+                "[0x%08x, 0x%08x, 0x%08x, 0x%08x]",
+                pd_idx, l->entry_size, pd_offset,
+                small_valid ? 'S' : '-',
+                big_valid ?   'B' : '-',
+                virt_addr, phys_addr,
+                pde_v[3], pde_v[2], pde_v[1], pde_v[0]);
+}
+/*
+ * Encode a two-word PTE for @phys_addr into @pte_w.
+ *
+ * @pte_w: output, pte_w[0] and pte_w[1] are overwritten.
+ * @attrs: mapping attributes; attrs->ctag is advanced by the page size
+ *         when it is nonzero, so the next PTE picks up the following
+ *         comptag offset.
+ */
+static void __update_pte(struct vm_gk20a *vm,
+                         u32 *pte_w,
+                         u64 phys_addr,
+                         struct nvgpu_gmmu_attrs *attrs)
+{
+        struct gk20a *g = gk20a_from_vm(vm);
+        u64 ctag_granularity = g->ops.fb.compression_page_size(g);
+        u32 page_size = vm->gmmu_page_sizes[attrs->pgsz];
+        u32 pte_valid = attrs->valid ?
+                gmmu_new_pte_valid_true_f() :
+                gmmu_new_pte_valid_false_f();
+        u32 phys_shifted = phys_addr >> gmmu_new_pte_address_shift_v();
+        u32 pte_addr = attrs->aperture == APERTURE_SYSMEM ?
+                gmmu_new_pte_address_sys_f(phys_shifted) :
+                gmmu_new_pte_address_vid_f(phys_shifted);
+        u32 pte_tgt = __nvgpu_aperture_mask(g,
+                        attrs->aperture,
+                        attrs->coherent ?
+                                gmmu_new_pte_aperture_sys_mem_coh_f() :
+                                gmmu_new_pte_aperture_sys_mem_ncoh_f(),
+                        gmmu_new_pte_aperture_video_memory_f());
+        pte_w[0] = pte_valid | pte_addr | pte_tgt;
+        if (attrs->priv)
+                pte_w[0] |= gmmu_new_pte_privilege_true_f();
+        /* Word 1: upper address bits, kind and comptag line. */
+        pte_w[1] = phys_addr >> (24 + gmmu_new_pte_address_shift_v()) |
+                gmmu_new_pte_kind_f(attrs->kind_v) |
+                gmmu_new_pte_comptagline_f((u32)(attrs->ctag /
+                                                 ctag_granularity));
+        if (attrs->rw_flag == gk20a_mem_flag_read_only)
+                pte_w[0] |= gmmu_new_pte_read_only_true_f();
+        /*
+         * Non-cacheable mappings: an invalid PTE gets the read-only bit,
+         * a valid one gets the volatile bit.
+         */
+        if (!attrs->valid && !attrs->cacheable)
+                pte_w[0] |= gmmu_new_pte_read_only_true_f();
+        else if (!attrs->cacheable)
+                pte_w[0] |= gmmu_new_pte_vol_true_f();
+        if (attrs->ctag)
+                attrs->ctag += page_size;
+}
+/*
+ * Encode a sparse PTE: word 0 is set to "not valid" combined with the
+ * volatile bit. Word 1 is left untouched.
+ */
+static void __update_pte_sparse(u32 *pte_w)
+{
+        pte_w[0] = gmmu_new_pte_valid_false_f() | gmmu_new_pte_vol_true_f();
+}
+/*
+ * Write one two-word PTE at index @pd_idx of @pd.
+ *
+ * A nonzero @phys_addr produces a regular PTE via __update_pte(); a zero
+ * @phys_addr with attrs->sparse set produces a sparse PTE; otherwise both
+ * words are written as zero.
+ */
+static void update_gmmu_pte_locked(struct vm_gk20a *vm,
+                                   const struct gk20a_mmu_level *l,
+                                   struct nvgpu_gmmu_pd *pd,
+                                   u32 pd_idx,
+                                   u64 virt_addr,
+                                   u64 phys_addr,
+                                   struct nvgpu_gmmu_attrs *attrs)
+{
+        struct gk20a *g = vm->mm->g;
+        u32 page_size  = vm->gmmu_page_sizes[attrs->pgsz];
+        u32 pd_offset = pd_offset_from_index(l, pd_idx);
+        u32 pte_w[2] = {0, 0};
+        if (phys_addr)
+                __update_pte(vm, pte_w, phys_addr, attrs);
+        else if (attrs->sparse)
+                __update_pte_sparse(pte_w);
+        /*
+         * Logged after __update_pte(), so the ctag shown here may already
+         * have been advanced by one page.
+         */
+        pte_dbg(g, attrs,
+                "vm=%s "
+                "PTE: i=%-4u size=%-2u | "
+                "GPU %#-12llx  phys %#-12llx "
+                "pgsz: %3dkb perm=%-2s kind=%#02x APT=%-6s %c%c%c%c%c "
+                "ctag=0x%08x "
+                "[0x%08x, 0x%08x]",
+                vm->name,
+                pd_idx, l->entry_size,
+                virt_addr, phys_addr,
+                page_size >> 10,
+                nvgpu_gmmu_perm_str(attrs->rw_flag),
+                attrs->kind_v,
+                nvgpu_aperture_str(attrs->aperture),
+                attrs->cacheable ? 'C' : 'v',
+                attrs->sparse    ? 'S' : '-',
+                attrs->priv      ? 'P' : '-',
+                attrs->coherent  ? 'c' : '-',
+                attrs->valid     ? 'V' : '-',
+                (u32)attrs->ctag / g->ops.fb.compression_page_size(g),
+                pte_w[1], pte_w[0]);
+        pd_write(g, pd, pd_offset + 0, pte_w[0]);
+        pd_write(g, pd, pd_offset + 1, pte_w[1]);
+}
+#define GP10B_PDE0_ENTRY_SIZE 16
+/*
+ * Calculate the pgsz of a PDE0 entry. Pascal+ uses a 5 level page table
+ * where only the last level differs between big and small pages. Returns
+ * small or big for the half whose aperture AND address are both set, or
+ * gmmu_nr_page_sizes if pd->mem is NULL, no half is set, or both are.
+ */
+static enum gmmu_pgsz_gk20a gp10b_get_pde0_pgsz(struct gk20a *g,
+                                        struct nvgpu_gmmu_pd *pd, u32 pd_idx)
+{
+        u32 pde_base = pd->mem_offs / sizeof(u32); /* NOTE(review): pd_idx is unused - confirm */
+        u32 pde_v[GP10B_PDE0_ENTRY_SIZE >> 2];
+        u32 i;
+        enum gmmu_pgsz_gk20a pgsz = gmmu_nr_page_sizes;
+        if (!pd->mem)
+                return pgsz;
+        nvgpu_mem_begin(g, pd->mem);
+        for (i = 0; i < GP10B_PDE0_ENTRY_SIZE >> 2; i++)
+                pde_v[i] = nvgpu_mem_rd32(g, pd->mem, pde_base + i);
+        nvgpu_mem_end(g, pd->mem);
+        /*
+         * Small half (words 2-3): aperture bits are combined bitwise
+         */
+        if (pde_v[2] & (gmmu_new_dual_pde_aperture_small_sys_mem_ncoh_f() |
+                        gmmu_new_dual_pde_aperture_small_video_memory_f())) {
+                u64 addr = ((u64) (pde_v[2] &
+                        gmmu_new_dual_pde_address_small_sys_f(~0)) <<
+                        gmmu_new_dual_pde_address_shift_v()) |
+                        ((u64) pde_v[3] << 32);
+                if (addr)
+                        pgsz = gmmu_page_size_small;
+        }
+        if (pde_v[0] & (gmmu_new_dual_pde_aperture_big_sys_mem_ncoh_f() |
+                        gmmu_new_dual_pde_aperture_big_video_memory_f())) {
+                u64 addr = ((u64) (pde_v[0] &
+                        gmmu_new_dual_pde_address_big_sys_f(~0)) <<
+                        gmmu_new_dual_pde_address_big_shift_v()) |
+                        ((u64) pde_v[1] << 32);
+                if (addr) {
+                        /*
+                         * If small is set that means that somehow MM allowed
+                         * both small and big to be set, the PDE is not valid
+                         * and may be corrupted
+                         */
+                        if (pgsz == gmmu_page_size_small) {
+                                nvgpu_err(g,
+                                        "both small and big apertures enabled");
+                                return gmmu_nr_page_sizes;
+                        }
+                        pgsz = gmmu_page_size_big;
+                }
+        }
+        return pgsz;
+}
+static const struct gk20a_mmu_level gp10b_mm_levels[] = { /* five levels, then a NULL entry */
+        {.hi_bit = {48, 48}, /* NOTE(review): pairs presumably {small, big} page size - confirm */
+         .lo_bit = {47, 47},
+         .update_entry = update_gmmu_pde3_locked,
+         .entry_size = 8,
+         .get_pgsz = gk20a_get_pde_pgsz},
+        {.hi_bit = {46, 46},
+         .lo_bit = {38, 38},
+         .update_entry = update_gmmu_pde3_locked,
+         .entry_size = 8,
+         .get_pgsz = gk20a_get_pde_pgsz},
+        {.hi_bit = {37, 37},
+         .lo_bit = {29, 29},
+         .update_entry = update_gmmu_pde3_locked,
+         .entry_size = 8,
+         .get_pgsz = gk20a_get_pde_pgsz},
+        {.hi_bit = {28, 28},
+         .lo_bit = {21, 21},
+         .update_entry = update_gmmu_pde0_locked,
+         .entry_size = GP10B_PDE0_ENTRY_SIZE, /* the only level not using 8-byte entries */
+         .get_pgsz = gp10b_get_pde0_pgsz},
+        {.hi_bit = {20, 20},
+         .lo_bit = {12, 16}, /* the only level whose two lo_bit values differ */
+         .update_entry = update_gmmu_pte_locked,
+         .entry_size = 8,
+         .get_pgsz = gk20a_get_pte_pgsz},
+        {.update_entry = NULL} /* presumably the end-of-table marker - confirm with the walker */
+};
+const struct gk20a_mmu_level *gp10b_mm_get_mmu_levels(struct gk20a *g,
+        u32 big_page_size)
+{ /* g and big_page_size are not consulted: the same static table is always returned */
+        return gp10b_mm_levels;
+}
+void gp10b_mm_init_pdb(struct gk20a *g, struct nvgpu_mem *inst_block,
+                struct vm_gk20a *vm)
+{ /* Write the address of vm->pdb.mem plus target/vol bits into inst_block. */
+        u64 pdb_addr = nvgpu_mem_get_addr(g, vm->pdb.mem);
+        u32 pdb_addr_lo = u64_lo32(pdb_addr >> ram_in_base_shift_v());
+        u32 pdb_addr_hi = u64_hi32(pdb_addr); /* upper 32 bits of the unshifted address */
+        gk20a_dbg_info("pde pa=0x%llx", pdb_addr);
+        nvgpu_mem_wr32(g, inst_block, ram_in_page_dir_base_lo_w(),
+                nvgpu_aperture_mask(g, vm->pdb.mem,
+                  ram_in_page_dir_base_target_sys_mem_ncoh_f(),
+                  ram_in_page_dir_base_target_vid_mem_f()) |
+                ram_in_page_dir_base_vol_true_f() |
+                ram_in_page_dir_base_lo_f(pdb_addr_lo) |
+                1 << 10); /* NOTE(review): unnamed bit 10 - confirm which field this sets */
+        nvgpu_mem_wr32(g, inst_block, ram_in_page_dir_base_hi_w(),
+                ram_in_page_dir_base_hi_f(pdb_addr_hi));
+}
+void gp10b_remove_bar2_vm(struct gk20a *g)
+{ /* Tear down BAR2 state in three steps, in this order. */
+        struct mm_gk20a *mm = &g->mm;
+        gp10b_replayable_pagefault_buffer_deinit(g); /* 1: replayable pagefault buffer */
+        nvgpu_free_inst_block(g, &mm->bar2.inst_block); /* 2: BAR2 instance block */
+        nvgpu_vm_put(mm->bar2.vm); /* 3: drop this reference to the BAR2 VM */
+}
diff --git a/drivers/gpu/nvgpu/gp10b/mm_gp10b.h b/drivers/gpu/nvgpu/gp10b/mm_gp10b.h
new file mode 100644
index 00000000..b6bcb04a
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/mm_gp10b.h
@@ -0,0 +1,42 @@
+/*
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef MM_GP10B_H
+#define MM_GP10B_H
+struct gk20a; /* forward declarations: only pointers to these are used below */
+struct gk20a_mmu_level;
+struct nvgpu_mem;
+struct vm_gk20a;
+u32 gp10b_mm_get_default_big_page_size(void);
+u32 gp10b_mm_get_iommu_bit(struct gk20a *g);
+int gp10b_init_mm_setup_hw(struct gk20a *g);
+int gb10b_init_bar2_vm(struct gk20a *g); /* NOTE(review): "gb10b" prefix, unlike "gp10b" elsewhere */
+int gb10b_init_bar2_mm_hw_setup(struct gk20a *g); /* NOTE(review): same "gb10b" spelling */
+const struct gk20a_mmu_level *gp10b_mm_get_mmu_levels(struct gk20a *g,
+        u32 big_page_size); /* returns the gp10b MMU level table */
+void gp10b_mm_init_pdb(struct gk20a *g, struct nvgpu_mem *inst_block,
+                struct vm_gk20a *vm); /* writes vm's page directory base into inst_block */
+void gp10b_remove_bar2_vm(struct gk20a *g); /* releases the BAR2 inst block and VM */
+#endif /* MM_GP10B_H */
diff --git a/drivers/gpu/nvgpu/gp10b/platform_gp10b.h b/drivers/gpu/nvgpu/gp10b/platform_gp10b.h
new file mode 100644
index 00000000..0791c2fe
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/platform_gp10b.h
@@ -0,0 +1,34 @@
+/*
+ * GP10B Platform (SoC) Interface
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef _GP10B_PLATFORM_H_
+#define _GP10B_PLATFORM_H_
+struct device; /* forward declaration: only pointers to it are used below */
+int gp10b_tegra_get_clocks(struct device *dev);
+int gp10b_tegra_reset_assert(struct device *dev);
+int gp10b_tegra_reset_deassert(struct device *dev);
+#endif /* _GP10B_PLATFORM_H_ */
diff --git a/drivers/gpu/nvgpu/gp10b/pmu_gp10b.c b/drivers/gpu/nvgpu/gp10b/pmu_gp10b.c
new file mode 100644
index 00000000..147cd020
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/pmu_gp10b.c
@@ -0,0 +1,399 @@
+/*
+ * GP10B PMU
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <nvgpu/pmu.h>
+#include <nvgpu/log.h>
+#include <nvgpu/fuse.h>
+#include <nvgpu/enabled.h>
+#include "gk20a/gk20a.h"
+#include "gk20a/pmu_gk20a.h"
+#include "gm20b/acr_gm20b.h"
+#include "gm20b/pmu_gm20b.h"
+#include "pmu_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_pwr_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fuse_gp10b.h>
+#define gp10b_dbg_pmu(fmt, arg...) \
+        gk20a_dbg(gpu_dbg_pmu, fmt, ##arg) /* gk20a_dbg() fixed to the gpu_dbg_pmu mask */
+/*!
+ * One step of the PG init sequence: a single register write that sets a
+ * PROD value (writeval is written to regaddr).
+ */
+struct pg_init_sequence_list {
+        u32 regaddr; /* register address to write */
+        u32 writeval; /* value written to regaddr */
+};
+/* PROD settings for the ELPG sequencing registers, written in table order */
+static struct pg_init_sequence_list _pginitseq_gp10b[] = {
+                {0x0010ab10, 0x0000868B} ,
+                {0x0010e118, 0x8590848F} ,
+                {0x0010e000, 0} ,
+                {0x0010e06c, 0x000000A3} ,
+                {0x0010e06c, 0x000000A0} ,
+                {0x0010e06c, 0x00000095} ,
+                {0x0010e06c, 0x000000A6} ,
+                {0x0010e06c, 0x0000008C} ,
+                {0x0010e06c, 0x00000080} ,
+                {0x0010e06c, 0x00000081} ,
+                {0x0010e06c, 0x00000087} ,
+                {0x0010e06c, 0x00000088} ,
+                {0x0010e06c, 0x0000008D} ,
+                {0x0010e06c, 0x00000082} ,
+                {0x0010e06c, 0x00000083} ,
+                {0x0010e06c, 0x00000089} ,
+                {0x0010e06c, 0x0000008A} ,
+                {0x0010e06c, 0x000000A2} ,
+                {0x0010e06c, 0x00000097} ,
+                {0x0010e06c, 0x00000092} ,
+                {0x0010e06c, 0x00000099} ,
+                {0x0010e06c, 0x0000009B} ,
+                {0x0010e06c, 0x0000009D} ,
+                {0x0010e06c, 0x0000009F} ,
+                {0x0010e06c, 0x000000A1} ,
+                {0x0010e06c, 0x00000096} ,
+                {0x0010e06c, 0x00000091} ,
+                {0x0010e06c, 0x00000098} ,
+                {0x0010e06c, 0x0000009A} ,
+                {0x0010e06c, 0x0000009C} ,
+                {0x0010e06c, 0x0000009E} ,
+                {0x0010ab14, 0x00000000} ,
+                {0x0010e024, 0x00000000} ,
+                {0x0010e028, 0x00000000} ,
+                {0x0010e11c, 0x00000000} ,
+                {0x0010ab1c, 0x140B0BFF} ,
+                {0x0010e020, 0x0E2626FF} ,
+                {0x0010e124, 0x251010FF} ,
+                {0x0010ab20, 0x89abcdef} ,
+                {0x0010ab24, 0x00000000} ,
+                {0x0010e02c, 0x89abcdef} ,
+                {0x0010e030, 0x00000000} ,
+                {0x0010e128, 0x89abcdef} ,
+                {0x0010e12c, 0x00000000} ,
+                {0x0010ab28, 0x7FFFFFFF} ,
+                {0x0010ab2c, 0x70000000} ,
+                {0x0010e034, 0x7FFFFFFF} ,
+                {0x0010e038, 0x70000000} ,
+                {0x0010e130, 0x7FFFFFFF} ,
+                {0x0010e134, 0x70000000} ,
+                {0x0010ab30, 0x00000000} ,
+                {0x0010ab34, 0x00000001} ,
+                {0x00020004, 0x00000000} ,
+                {0x0010e138, 0x00000000} ,
+                {0x0010e040, 0x00000000} ,
+                {0x0010e168, 0x00000000} ,
+                {0x0010e114, 0x0000A5A4} ,
+                {0x0010e110, 0x00000000} ,
+                {0x0010e10c, 0x8590848F} ,
+                {0x0010e05c, 0x00000000} ,
+                {0x0010e044, 0x00000000} ,
+                {0x0010a644, 0x0000868B} ,
+                {0x0010a648, 0x00000000} ,
+                {0x0010a64c, 0x00829493} ,
+                {0x0010a650, 0x00000000} ,
+                {0x0010e000, 0} ,
+                {0x0010e068, 0x000000A3} ,
+                {0x0010e068, 0x000000A0} ,
+                {0x0010e068, 0x00000095} ,
+                {0x0010e068, 0x000000A6} ,
+                {0x0010e068, 0x0000008C} ,
+                {0x0010e068, 0x00000080} ,
+                {0x0010e068, 0x00000081} ,
+                {0x0010e068, 0x00000087} ,
+                {0x0010e068, 0x00000088} ,
+                {0x0010e068, 0x0000008D} ,
+                {0x0010e068, 0x00000082} ,
+                {0x0010e068, 0x00000083} ,
+                {0x0010e068, 0x00000089} ,
+                {0x0010e068, 0x0000008A} ,
+                {0x0010e068, 0x000000A2} ,
+                {0x0010e068, 0x00000097} ,
+                {0x0010e068, 0x00000092} ,
+                {0x0010e068, 0x00000099} ,
+                {0x0010e068, 0x0000009B} ,
+                {0x0010e068, 0x0000009D} ,
+                {0x0010e068, 0x0000009F} ,
+                {0x0010e068, 0x000000A1} ,
+                {0x0010e068, 0x00000096} ,
+                {0x0010e068, 0x00000091} ,
+                {0x0010e068, 0x00000098} ,
+                {0x0010e068, 0x0000009A} ,
+                {0x0010e068, 0x0000009C} ,
+                {0x0010e068, 0x0000009E} ,
+                {0x0010e000, 0} ,
+                {0x0010e004, 0x0000008E},
+};
+static void gp10b_pmu_load_multiple_falcons(struct gk20a *g, u32 falconidmask,
+                                         u32 flags)
+{
+        struct nvgpu_pmu *pmu = &g->pmu;
+        struct pmu_cmd cmd;
+        u32 seq;
+        gk20a_dbg_fn("");
+        gp10b_dbg_pmu("wprinit status = %x\n", g->pmu_lsf_pmu_wpr_init_done);
+        if (g->pmu_lsf_pmu_wpr_init_done) { /* otherwise nothing is posted at all */
+                /* post one ACR command that bootstraps every falcon in falconidmask */
+                memset(&cmd, 0, sizeof(struct pmu_cmd));
+                cmd.hdr.unit_id = PMU_UNIT_ACR;
+                cmd.hdr.size = PMU_CMD_HDR_SIZE +
+                  sizeof(struct pmu_acr_cmd_bootstrap_multiple_falcons);
+                cmd.cmd.acr.boot_falcons.cmd_type =
+                  PMU_ACR_CMD_ID_BOOTSTRAP_MULTIPLE_FALCONS;
+                cmd.cmd.acr.boot_falcons.flags = flags;
+                cmd.cmd.acr.boot_falcons.falconidmask =
+                                falconidmask;
+                cmd.cmd.acr.boot_falcons.usevamask = 0;
+                cmd.cmd.acr.boot_falcons.wprvirtualbase.lo = 0x0;
+                cmd.cmd.acr.boot_falcons.wprvirtualbase.hi = 0x0;
+                gp10b_dbg_pmu("PMU_ACR_CMD_ID_BOOTSTRAP_MULTIPLE_FALCONS:%x\n",
+                                falconidmask);
+                nvgpu_pmu_cmd_post(g, &cmd, NULL, NULL, PMU_COMMAND_QUEUE_HPQ,
+                                pmu_handle_fecs_boot_acr_msg, pmu, &seq, ~0); /* result is not checked */
+        }
+        gk20a_dbg_fn("done");
+        return;
+}
+int gp10b_load_falcon_ucode(struct gk20a *g, u32 falconidmask)
+{
+        u32 flags = PMU_ACR_CMD_BOOTSTRAP_FALCON_FLAGS_RESET_YES;
+        /* Only the FECS and GPCCS bits are accepted; an empty mask is rejected */
+        if (falconidmask == 0)
+                return -EINVAL;
+        if (falconidmask & ~((1 << LSF_FALCON_ID_FECS) |
+                                (1 << LSF_FALCON_ID_GPCCS)))
+                                return -EINVAL;
+        g->pmu_lsf_loaded_falcon_id = 0; /* cleared before waiting for it to equal the mask */
+        /* check whether pmu is ready to bootstrap lsf if not wait for it */
+        if (!g->pmu_lsf_pmu_wpr_init_done) {
+                pmu_wait_message_cond(&g->pmu,
+                                gk20a_get_gr_idle_timeout(g),
+                                &g->pmu_lsf_pmu_wpr_init_done, 1);
+                /* check again if it still not ready indicate an error */
+                if (!g->pmu_lsf_pmu_wpr_init_done) {
+                        nvgpu_err(g, "PMU not ready to load LSF");
+                        return -ETIMEDOUT;
+                }
+        }
+        /* load falcon(s) */
+        gp10b_pmu_load_multiple_falcons(g, falconidmask, flags);
+        pmu_wait_message_cond(&g->pmu,
+                        gk20a_get_gr_idle_timeout(g),
+                        &g->pmu_lsf_loaded_falcon_id, falconidmask);
+        if (g->pmu_lsf_loaded_falcon_id != falconidmask) /* wait ended without a full match */
+                return -ETIMEDOUT;
+        return 0;
+}
+static void pmu_handle_gr_param_msg(struct gk20a *g, struct pmu_msg *msg,
+                        void *param, u32 handle, u32 status)
+{ /* Callback passed to nvgpu_pmu_cmd_post(); it only logs, param and handle are unused. */
+        gk20a_dbg_fn("");
+        if (status != 0) { /* non-zero status is reported as an aborted command */
+                nvgpu_err(g, "GR PARAM cmd aborted");
+                /* TBD: disable ELPG */
+                return;
+        }
+        gp10b_dbg_pmu("GR PARAM is acknowledged from PMU %x \n",
+                        msg->msg.pg.msg_type);
+        return;
+}
+int gp10b_pg_gr_init(struct gk20a *g, u32 pg_engine_id)
+{ /* Post the GR init-param PG command; only the graphics ELPG engine is accepted. */
+        struct nvgpu_pmu *pmu = &g->pmu;
+        struct pmu_cmd cmd;
+        u32 seq;
+        if (pg_engine_id == PMU_PG_ELPG_ENGINE_ID_GRAPHICS) {
+                memset(&cmd, 0, sizeof(struct pmu_cmd));
+                cmd.hdr.unit_id = PMU_UNIT_PG;
+                cmd.hdr.size = PMU_CMD_HDR_SIZE +
+                                sizeof(struct pmu_pg_cmd_gr_init_param);
+                cmd.cmd.pg.gr_init_param.cmd_type =
+                                PMU_PG_CMD_ID_PG_PARAM;
+                cmd.cmd.pg.gr_init_param.sub_cmd_id =
+                                PMU_PG_PARAM_CMD_GR_INIT_PARAM;
+                cmd.cmd.pg.gr_init_param.featuremask =
+                                PMU_PG_FEATURE_GR_POWER_GATING_ENABLED;
+                gp10b_dbg_pmu("cmd post PMU_PG_CMD_ID_PG_PARAM ");
+                nvgpu_pmu_cmd_post(g, &cmd, NULL, NULL, PMU_COMMAND_QUEUE_HPQ,
+                                pmu_handle_gr_param_msg, pmu, &seq, ~0); /* result is not checked */
+        } else
+                return -EINVAL; /* any other engine id */
+        return 0; /* returned as soon as the command has been posted */
+}
+void gp10b_pmu_elpg_statistics(struct gk20a *g, u32 pg_engine_id,
+                struct pmu_pg_stats_data *pg_stat_data)
+{ /* Copy a pmu_pg_stats_v1 record out of PMU DMEM and translate it into pg_stat_data. */
+        struct nvgpu_pmu *pmu = &g->pmu;
+        struct pmu_pg_stats_v1 stats;
+        nvgpu_flcn_copy_from_dmem(pmu->flcn,
+                pmu->stat_dmem_offset[pg_engine_id], /* NOTE(review): index is not range-checked here */
+                (u8 *)&stats, sizeof(struct pmu_pg_stats_v1), 0);
+        pg_stat_data->ingating_time = stats.total_sleep_timeus;
+        pg_stat_data->ungating_time = stats.total_nonsleep_timeus;
+        pg_stat_data->gating_cnt = stats.entry_count;
+        pg_stat_data->avg_entry_latency_us = stats.entrylatency_avgus;
+        pg_stat_data->avg_exit_latency_us = stats.exitlatency_avgus;
+}
+int gp10b_pmu_setup_elpg(struct gk20a *g)
+{ /* When ELPG is enabled, replay the whole _pginitseq_gp10b table in order. */
+        int ret = 0; /* never modified: this function always returns 0 */
+        u32 reg_writes;
+        u32 index;
+        gk20a_dbg_fn("");
+        if (g->elpg_enabled) {
+                reg_writes = ((sizeof(_pginitseq_gp10b) /
+                                sizeof((_pginitseq_gp10b)[0]))); /* number of table entries */
+                /* Initialize registers with production values*/
+                for (index = 0; index < reg_writes; index++) {
+                        gk20a_writel(g, _pginitseq_gp10b[index].regaddr,
+                                _pginitseq_gp10b[index].writeval);
+                }
+        }
+        gk20a_dbg_fn("done");
+        return ret;
+}
+void gp10b_write_dmatrfbase(struct gk20a *g, u32 addr)
+{ /* Program the PMU falcon DMA transfer base: addr in dmatrfbase, zero in dmatrfbase1. */
+        gk20a_writel(g, pwr_falcon_dmatrfbase_r(),
+                                addr);
+        gk20a_writel(g, pwr_falcon_dmatrfbase1_r(),
+                                0x0); /* second base register is always cleared */
+}
+int gp10b_init_pmu_setup_hw1(struct gk20a *g)
+{ /* Reset the PMU falcon, program its five FBIF apertures, then run pmu_nsbootstrap. */
+        struct nvgpu_pmu *pmu = &g->pmu;
+        int err;
+        gk20a_dbg_fn("");
+        nvgpu_mutex_acquire(&pmu->isr_mutex); /* reset and isr_enabled change under isr_mutex */
+        nvgpu_flcn_reset(pmu->flcn);
+        pmu->isr_enabled = true;
+        nvgpu_mutex_release(&pmu->isr_mutex);
+        /* setup apertures - virtual */
+        gk20a_writel(g, pwr_fbif_transcfg_r(GK20A_PMU_DMAIDX_UCODE),
+                pwr_fbif_transcfg_mem_type_virtual_f());
+        gk20a_writel(g, pwr_fbif_transcfg_r(GK20A_PMU_DMAIDX_VIRT),
+                pwr_fbif_transcfg_mem_type_virtual_f());
+        /* setup apertures - physical */
+        gk20a_writel(g, pwr_fbif_transcfg_r(GK20A_PMU_DMAIDX_PHYS_VID),
+                pwr_fbif_transcfg_mem_type_physical_f() |
+                pwr_fbif_transcfg_target_local_fb_f());
+        gk20a_writel(g, pwr_fbif_transcfg_r(GK20A_PMU_DMAIDX_PHYS_SYS_COH),
+                pwr_fbif_transcfg_mem_type_physical_f() |
+                pwr_fbif_transcfg_target_coherent_sysmem_f());
+        gk20a_writel(g, pwr_fbif_transcfg_r(GK20A_PMU_DMAIDX_PHYS_SYS_NCOH),
+                pwr_fbif_transcfg_mem_type_physical_f() |
+                pwr_fbif_transcfg_target_noncoherent_sysmem_f());
+        err = g->ops.pmu.pmu_nsbootstrap(pmu);
+        if (err) /* bootstrap error is returned as-is; the "done" trace is skipped */
+                return err;
+        gk20a_dbg_fn("done");
+        return 0;
+}
+bool gp10b_is_lazy_bootstrap(u32 falcon_id)
+{ /* Returns true only for LSF_FALCON_ID_GPCCS. */
+        bool enable_status = false; /* result for FECS and for every unlisted falcon id */
+        switch (falcon_id) {
+        case LSF_FALCON_ID_FECS:
+                enable_status = false;
+                break;
+        case LSF_FALCON_ID_GPCCS:
+                enable_status = true;
+                break;
+        default: /* keep the initial false */
+                break;
+        }
+        return enable_status;
+}
+bool gp10b_is_priv_load(u32 falcon_id)
+{ /* Returns true only for LSF_FALCON_ID_GPCCS. */
+        bool enable_status = false; /* result for FECS and for every unlisted falcon id */
+        switch (falcon_id) {
+        case LSF_FALCON_ID_FECS:
+                enable_status = false;
+                break;
+        case LSF_FALCON_ID_GPCCS:
+                enable_status = true;
+                break;
+        default: /* keep the initial false */
+                break;
+        }
+        return enable_status;
+}
+/* Dump the security related fuses (two fuse registers + gcplex config) via nvgpu_err */
+void pmu_dump_security_fuses_gp10b(struct gk20a *g)
+{
+        u32 val = 0; /* defined value to print if the fuse helper does not write it */
+        nvgpu_err(g, "FUSE_OPT_SEC_DEBUG_EN_0: 0x%x",
+                        gk20a_readl(g, fuse_opt_sec_debug_en_r()));
+        nvgpu_err(g, "FUSE_OPT_PRIV_SEC_EN_0: 0x%x",
+                        gk20a_readl(g, fuse_opt_priv_sec_en_r()));
+        nvgpu_tegra_fuse_read_gcplex_config_fuse(g, &val); /* result is not checked */
+        nvgpu_err(g, "FUSE_GCPLEX_CONFIG_FUSE_0: 0x%x", val);
+}
+bool gp10b_is_pmu_supported(struct gk20a *g)
+{ /* g is not consulted */
+        return true; /* unconditional */
+}
diff --git a/drivers/gpu/nvgpu/gp10b/pmu_gp10b.h b/drivers/gpu/nvgpu/gp10b/pmu_gp10b.h
new file mode 100644
index 00000000..44e0ec98
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/pmu_gp10b.h
@@ -0,0 +1,43 @@
+/*
+ * GP10B PMU
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef __PMU_GP10B_H_
+#define __PMU_GP10B_H_
+struct gk20a; /* forward declaration: only pointers to it are used below */
+bool gp10b_is_lazy_bootstrap(u32 falcon_id);
+bool gp10b_is_priv_load(u32 falcon_id);
+bool gp10b_is_pmu_supported(struct gk20a *g);
+int gp10b_init_pmu_setup_hw1(struct gk20a *g); /* 0, or the pmu_nsbootstrap error */
+void gp10b_pmu_elpg_statistics(struct gk20a *g, u32 pg_engine_id,
+                struct pmu_pg_stats_data *pg_stat_data); /* fills *pg_stat_data */
+int gp10b_pmu_setup_elpg(struct gk20a *g);
+void pmu_dump_security_fuses_gp10b(struct gk20a *g);
+int gp10b_load_falcon_ucode(struct gk20a *g, u32 falconidmask); /* 0, -EINVAL or -ETIMEDOUT */
+int gp10b_pg_gr_init(struct gk20a *g, u32 pg_engine_id); /* 0 or -EINVAL */
+void gp10b_write_dmatrfbase(struct gk20a *g, u32 addr);
+#endif /*__PMU_GP10B_H_*/
diff --git a/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.c b/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.c
new file mode 100644
index 00000000..b780457f
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.c
@@ -0,0 +1,112 @@
+/*
+ * GP10B priv ring
+ *
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include <nvgpu/log.h>
+#include <nvgpu/timers.h>
+#include <nvgpu/enabled.h>
+#include <nvgpu/hw/gp10b/hw_mc_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_pri_ringmaster_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_pri_ringstation_sys_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_pri_ringstation_gpc_gp10b.h>
+void gp10b_priv_ring_isr(struct gk20a *g)
+{ /* Log every pending priv ring fault, ack the interrupt, then poll until the ack is consumed. */
+        u32 status0, status1;
+        u32 cmd;
+        s32 retry = 100; /* ack poll budget: at most 100 polls, nvgpu_udelay(20) apart */
+        u32 gpc;
+        u32 gpc_stride, offset;
+        if (nvgpu_is_enabled(g, NVGPU_IS_FMODEL)) { /* nothing is read or acked on FMODEL */
+                nvgpu_info(g, "unhandled priv ring intr");
+                return;
+        }
+        status0 = gk20a_readl(g, pri_ringmaster_intr_status0_r());
+        status1 = gk20a_readl(g, pri_ringmaster_intr_status1_r());
+        nvgpu_err(g, "ringmaster intr status0: 0x%08x,"
+                "status1: 0x%08x", status0, status1);
+        if (pri_ringmaster_intr_status0_ring_start_conn_fault_v(status0) != 0)
+                nvgpu_err(g,
+                        "BUG: connectivity problem on the startup sequence");
+        if (pri_ringmaster_intr_status0_disconnect_fault_v(status0) != 0)
+                nvgpu_err(g, "ring disconnected");
+        if (pri_ringmaster_intr_status0_overflow_fault_v(status0) != 0)
+                nvgpu_err(g, "ring overflowed");
+        if (pri_ringmaster_intr_status0_gbl_write_error_sys_v(status0) != 0) {
+                nvgpu_err(g, "SYS write error. ADR %08x WRDAT %08x INFO %08x, CODE %08x",
+                        gk20a_readl(g, pri_ringstation_sys_priv_error_adr_r()),
+                        gk20a_readl(g, pri_ringstation_sys_priv_error_wrdat_r()),
+                        gk20a_readl(g, pri_ringstation_sys_priv_error_info_r()),
+                        gk20a_readl(g, pri_ringstation_sys_priv_error_code_r()));
+        }
+        if (status1) { /* status1 is treated as one error bit per GPC */
+                gpc_stride = nvgpu_get_litter_value(g, GPU_LIT_GPC_STRIDE);
+                for (gpc = 0; gpc < g->gr.gpc_count; gpc++) {
+                        offset = gpc * gpc_stride; /* GPC0 register address + offset = this GPC's copy */
+                        if (status1 & BIT(gpc)) {
+                                nvgpu_err(g, "GPC%u write error. ADR %08x "
+                                        "WRDAT %08x INFO %08x, CODE %08x", gpc,
+                                        gk20a_readl(g,
+                                        pri_ringstation_gpc_gpc0_priv_error_adr_r() + offset),
+                                        gk20a_readl(g,
+                                        pri_ringstation_gpc_gpc0_priv_error_wrdat_r() + offset),
+                                        gk20a_readl(g,
+                                        pri_ringstation_gpc_gpc0_priv_error_info_r() + offset),
+                                        gk20a_readl(g,
+                                        pri_ringstation_gpc_gpc0_priv_error_code_r() + offset));
+                                status1 = status1 & (~(BIT(gpc))); /* local copy only: mark as reported */
+                                if (!status1) /* no more GPC bits pending */
+                                        break;
+                        }
+                }
+        }
+        /* clear interrupt */
+        cmd = gk20a_readl(g, pri_ringmaster_command_r());
+        cmd = set_field(cmd, pri_ringmaster_command_cmd_m(),
+                pri_ringmaster_command_cmd_ack_interrupt_f());
+        gk20a_writel(g, pri_ringmaster_command_r(), cmd);
+        /* poll for clear interrupt done; success is judged on cmd, not on retry */
+        cmd = pri_ringmaster_command_cmd_v(
+                gk20a_readl(g, pri_ringmaster_command_r()));
+        while (cmd != pri_ringmaster_command_cmd_no_cmd_v() && retry) {
+                nvgpu_udelay(20);
+                cmd = pri_ringmaster_command_cmd_v(
+                        gk20a_readl(g, pri_ringmaster_command_r()));
+                retry--;
+        }
+        if (cmd != pri_ringmaster_command_cmd_no_cmd_v()) /* an ack on the last poll is a success */
+                nvgpu_err(g, "priv ringmaster intr ack failed");
+}
diff --git a/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.h b/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.h
new file mode 100644
index 00000000..5b004a58
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/priv_ring_gp10b.h
@@ -0,0 +1,31 @@
+/*
+ * GP10B PRIV ringmaster
+ *
+ * Copyright (c) 2011-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef __PRIV_RING_GP10B_H__
+#define __PRIV_RING_GP10B_H__
+struct gk20a; /* forward declaration: only a pointer to it is used below */
+void gp10b_priv_ring_isr(struct gk20a *g); /* priv ring interrupt handler: logs faults, then acks */
+#endif /*__PRIV_RING_GP10B_H__*/
diff --git a/drivers/gpu/nvgpu/gp10b/regops_gp10b.c b/drivers/gpu/nvgpu/gp10b/regops_gp10b.c
new file mode 100644
index 00000000..bf360d6f
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/regops_gp10b.c
@@ -0,0 +1,479 @@
+/*
+ * Tegra GK20A GPU Debugger Driver Register Ops
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <uapi/linux/nvgpu.h>
+#include "gk20a/gk20a.h"
+#include "gk20a/dbg_gpu_gk20a.h"
+#include "gk20a/regops_gk20a.h"
+#include "regops_gp10b.h"
+#include <nvgpu/bsearch.h>
+static const struct regop_offset_range gp10b_global_whitelist_ranges[] = { /* NOTE(review): entries look like {register offset, count} in ascending offset order - confirm against struct regop_offset_range */
+        { 0x000004f0,   1},
+        { 0x00001a00,   3},
+        { 0x00002800, 128},
+        { 0x00009400,   1},
+        { 0x00009410,   1},
+        { 0x00009480,   1},
+        { 0x00020200,  24},
+        { 0x00021c00,   4},
+        { 0x00021c14,   3},
+        { 0x00021c24,   1},
+        { 0x00021c2c,  69},
+        { 0x00021d44,   1},
+        { 0x00021d4c,   1},
+        { 0x00021d54,   1},
+        { 0x00021d5c,   1},
+        { 0x00021d64,   2},
+        { 0x00021d70,  16},
+        { 0x00022430,   7},
+        { 0x00022450,   1},
+        { 0x0002245c,   1},
+        { 0x00070000,   5},
+        { 0x000884e0,   1},
+        { 0x0008e00c,   1},
+        { 0x00100c18,   3},
+        { 0x00100c84,   1},
+        { 0x00104038,   1},
+        { 0x0010a0a8,   1},
+        { 0x0010a4f0,   1},
+        { 0x0010e490,   1},
+        { 0x0013cc14,   1},
+        { 0x00140028,   1},
+        { 0x00140280,   1},
+        { 0x001402a0,   1},
+        { 0x00140350,   1},
+        { 0x00140480,   1},
+        { 0x001404a0,   1},
+        { 0x00140550,   1},
+        { 0x00142028,   1},
+        { 0x00142280,   1},
+        { 0x001422a0,   1},
+        { 0x00142350,   1},
+        { 0x00142480,   1},
+        { 0x001424a0,   1},
+        { 0x00142550,   1},
+        { 0x0017e028,   1},
+        { 0x0017e280,   1},
+        { 0x0017e294,   1},
+        { 0x0017e29c,   2},
+        { 0x0017e2ac,   1},
+        { 0x0017e350,   1},
+        { 0x0017e39c,   1},
+        { 0x0017e480,   1},
+        { 0x0017e4a0,   1},
+        { 0x0017e550,   1},
+        { 0x00180040,  41},
+        { 0x001800ec,  10},
+        { 0x00180240,  41},
+        { 0x001802ec,  10},
+        { 0x00180440,  41},
+        { 0x001804ec,  10},
+        { 0x00180640,  41},
+        { 0x001806ec,  10},
+        { 0x00180840,  41},
+        { 0x001808ec,  10},
+        { 0x00180a40,  41},
+        { 0x00180aec,  10},
+        { 0x00180c40,  41},
+        { 0x00180cec,  10},
+        { 0x00180e40,  41},
+        { 0x00180eec,  10},
+        { 0x001a0040,  41},
+        { 0x001a00ec,  10},
+        { 0x001a0240,  41},
+        { 0x001a02ec,  10},
+        { 0x001a0440,  41},
+        { 0x001a04ec,  10},
+        { 0x001a0640,  41},
+        { 0x001a06ec,  10},
+        { 0x001a0840,  41},
+        { 0x001a08ec,  10},
+        { 0x001a0a40,  41},
+        { 0x001a0aec,  10},
+        { 0x001a0c40,  41},
+        { 0x001a0cec,  10},
+        { 0x001a0e40,  41},
+        { 0x001a0eec,  10},
+        { 0x001b0040,  41},
+        { 0x001b00ec,  10},
+        { 0x001b0240,  41},
+        { 0x001b02ec,  10},
+        { 0x001b0440,  41},
+        { 0x001b04ec,  10},
+        { 0x001b0640,  41},
+        { 0x001b06ec,  10},
+        { 0x001b0840,  41},
+        { 0x001b08ec,  10},
+        { 0x001b0a40,  41},
+        { 0x001b0aec,  10},
+        { 0x001b0c40,  41},
+        { 0x001b0cec,  10},
+        { 0x001b0e40,  41},
+        { 0x001b0eec,  10},
+        { 0x001b4000,   1},
+        { 0x001b4008,   1},
+        { 0x001b4010,   3},
+        { 0x001b4020,   3},
+        { 0x001b4030,   3},
+        { 0x001b4040,   3},
+        { 0x001b4050,   3},
+        { 0x001b4060,   4},
+        { 0x001b4074,   7},
+        { 0x001b4094,   3},
+        { 0x001b40a4,   1},
+        { 0x001b4100,   6},
+        { 0x001b4124,   2},
+        { 0x001b8000,   1},
+        { 0x001b8008,   1},
+        { 0x001b8010,   3},
+        { 0x001bc000,   1},
+        { 0x001bc008,   1},
+        { 0x001bc010,   3},
+        { 0x001be000,   1},
+        { 0x001be008,   1},
+        { 0x001be010,   3},
+        { 0x00400500,   1},
+        { 0x0040415c,   1},
+        { 0x00404468,   1},
+        { 0x00404498,   1},
+        { 0x00405800,   1},
+        { 0x00405840,   2},
+        { 0x00405850,   1},
+        { 0x00405908,   1},
+        { 0x00405b40,   1},
+        { 0x00405b50,   1},
+        { 0x00406024,   5},
+        { 0x00407010,   1},
+        { 0x00407808,   1},
+        { 0x0040803c,   1},
+        { 0x00408804,   1},
+        { 0x0040880c,   1},
+        { 0x00408900,   2},
+        { 0x00408910,   1},
+        { 0x00408944,   1},
+        { 0x00408984,   1},
+        { 0x004090a8,   1},
+        { 0x004098a0,   1},
+        { 0x00409b00,   1},
+        { 0x0041000c,   1},
+        { 0x00410110,   1},
+        { 0x00410184,   1},
+        { 0x0041040c,   1},
+        { 0x00410510,   1},
+        { 0x00410584,   1},
+        { 0x00418000,   1},
+        { 0x00418008,   1},
+        { 0x00418380,   2},
+        { 0x00418400,   2},
+        { 0x004184a0,   1},
+        { 0x00418604,   1},
+        { 0x00418680,   1},
+        { 0x00418704,   1},
+        { 0x00418714,   1},
+        { 0x00418800,   1},
+        { 0x0041881c,   1},
+        { 0x00418830,   1},
+        { 0x00418884,   1},
+        { 0x004188b0,   1},
+        { 0x004188c8,   3},
+        { 0x004188fc,   1},
+        { 0x00418b04,   1},
+        { 0x00418c04,   1},
+        { 0x00418c10,   8},
+        { 0x00418c88,   1},
+        { 0x00418d00,   1},
+        { 0x00418e00,   1},
+        { 0x00418e08,   1},
+        { 0x00418e34,   1},
+        { 0x00418e40,   4},
+        { 0x00418e58,  16},
+        { 0x00418f08,   1},
+        { 0x00419000,   1},
+        { 0x0041900c,   1},
+        { 0x00419018,   1},
+        { 0x00419854,   1},
+        { 0x00419864,   1},
+        { 0x00419a04,   2},
+        { 0x00419a14,   1},
+        { 0x00419ab0,   1},
+        { 0x00419ab8,   3},
+        { 0x00419c0c,   1},
+        { 0x00419c8c,   2},
+        { 0x00419d00,   1},
+        { 0x00419d08,   2},
+        { 0x00419e00,  11},
+        { 0x00419e34,   2},
+        { 0x00419e44,  11},
+        { 0x00419e74,  10},
+        { 0x00419ea4,   1},
+        { 0x00419eac,   2},
+        { 0x00419ee8,   1},
+        { 0x00419ef0,  28},
+        { 0x00419f70,   1},
+        { 0x00419f78,   2},
+        { 0x00419f98,   2},
+        { 0x00419fdc,   1},
+        { 0x0041a02c,   2},
+        { 0x0041a0a0,   1},
+        { 0x0041a0a8,   1},
+        { 0x0041a890,   2},
+        { 0x0041a8a0,   3},
+        { 0x0041a8b0,   2},
+        { 0x0041b014,   1},
+        { 0x0041b0a0,   1},
+        { 0x0041b0cc,   1},
+        { 0x0041b1dc,   1},
+        { 0x0041be0c,   3},
+        { 0x0041bea0,   1},
+        { 0x0041becc,   1},
+        { 0x0041bfdc,   1},
+        { 0x0041c054,   1},
+        { 0x0041c2b0,   1},
+        { 0x0041c2b8,   3},
+        { 0x0041c40c,   1},
+        { 0x0041c48c,   2},
+        { 0x0041c500,   1},
+        { 0x0041c508,   2},
+        { 0x0041c600,  11},
+        { 0x0041c634,   2},
+        { 0x0041c644,  11},
+        { 0x0041c674,  10},
+        { 0x0041c6a4,   1},
+        { 0x0041c6ac,   2},
+        { 0x0041c6e8,   1},
+        { 0x0041c6f0,  28},
+        { 0x0041c770,   1},
+        { 0x0041c778,   2},
+        { 0x0041c798,   2},
+        { 0x0041c7dc,   1},
+        { 0x0041c854,   1},
+        { 0x0041cab0,   1},
+        { 0x0041cab8,   3},
+        { 0x0041cc0c,   1},
+        { 0x0041cc8c,   2},
+        { 0x0041cd00,   1},
+        { 0x0041cd08,   2},
+        { 0x0041ce00,  11},
+        { 0x0041ce34,   2},
+        { 0x0041ce44,  11},
+        { 0x0041ce74,  10},
+        { 0x0041cea4,   1},
+        { 0x0041ceac,   2},
+        { 0x0041cee8,   1},
+        { 0x0041cef0,  28},
+        { 0x0041cf70,   1},
+        { 0x0041cf78,   2},
+        { 0x0041cf98,   2},
+        { 0x0041cfdc,   1},
+        { 0x00500384,   1},
+        { 0x005004a0,   1},
+        { 0x00500604,   1},
+        { 0x00500680,   1},
+        { 0x00500714,   1},
+        { 0x0050081c,   1},
+        { 0x00500884,   1},
+        { 0x005008b0,   1},
+        { 0x005008c8,   3},
+        { 0x005008fc,   1},
+        { 0x00500b04,   1},
+        { 0x00500c04,   1},
+        { 0x00500c10,   8},
+        { 0x00500c88,   1},
+        { 0x00500d00,   1},
+        { 0x00500e08,   1},
+        { 0x00500f08,   1},
+        { 0x00501000,   1},
+        { 0x0050100c,   1},
+        { 0x00501018,   1},
+        { 0x00501854,   1},
+        { 0x00501ab0,   1},
+        { 0x00501ab8,   3},
+        { 0x00501c0c,   1},
+        { 0x00501c8c,   2},
+        { 0x00501d00,   1},
+        { 0x00501d08,   2},
+        { 0x00501e00,  11},
+        { 0x00501e34,   2},
+        { 0x00501e44,  11},
+        { 0x00501e74,  10},
+        { 0x00501ea4,   1},
+        { 0x00501eac,   2},
+        { 0x00501ee8,   1},
+        { 0x00501ef0,  28},
+        { 0x00501f70,   1},
+        { 0x00501f78,   2},
+        { 0x00501f98,   2},
+        { 0x00501fdc,   1},
+        { 0x0050202c,   2},
+        { 0x005020a0,   1},
+        { 0x005020a8,   1},
+        { 0x00502890,   2},
+        { 0x005028a0,   3},
+        { 0x005028b0,   2},
+        { 0x00503014,   1},
+        { 0x005030a0,   1},
+        { 0x005030cc,   1},
+        { 0x005031dc,   1},
+        { 0x00503e14,   1},
+        { 0x00503ea0,   1},
+        { 0x00503ecc,   1},
+        { 0x00503fdc,   1},
+        { 0x00504054,   1},
+        { 0x005042b0,   1},
+        { 0x005042b8,   3},
+        { 0x0050440c,   1},
+        { 0x0050448c,   2},
+        { 0x00504500,   1},
+        { 0x00504508,   2},
+        { 0x00504600,  11},
+        { 0x00504634,   2},
+        { 0x00504644,  11},
+        { 0x00504674,  10},
+        { 0x005046a4,   1},
+        { 0x005046ac,   2},
+        { 0x005046e8,   1},
+        { 0x005046f0,  28},
+        { 0x00504770,   1},
+        { 0x00504778,   2},
+        { 0x00504798,   2},
+        { 0x005047dc,   1},
+        { 0x00504854,   1},
+        { 0x00504ab0,   1},
+        { 0x00504ab8,   3},
+        { 0x00504c0c,   1},
+        { 0x00504c8c,   2},
+        { 0x00504d00,   1},
+        { 0x00504d08,   2},
+        { 0x00504e00,  11},
+        { 0x00504e34,   2},
+        { 0x00504e44,  11},
+        { 0x00504e74,  10},
+        { 0x00504ea4,   1},
+        { 0x00504eac,   2},
+        { 0x00504ee8,   1},
+        { 0x00504ef0,  28},
+        { 0x00504f70,   1},
+        { 0x00504f78,   2},
+        { 0x00504f98,   2},
+        { 0x00504fdc,   1},
+        { 0x00900100,   1},
+        { 0x009a0100,   1},
+};
+static const u32 gp10b_global_whitelist_ranges_count =
+        ARRAY_SIZE(gp10b_global_whitelist_ranges);
+/* context: no table is defined here; the context getters below return the global ranges */
+/* runcontrol: both the offset list and the range list have no entries in this file */
+static const u32 gp10b_runcontrol_whitelist[] = {
+};
+static const u32 gp10b_runcontrol_whitelist_count =
+        ARRAY_SIZE(gp10b_runcontrol_whitelist);
+static const struct regop_offset_range gp10b_runcontrol_whitelist_ranges[] = {
+};
+static const u32 gp10b_runcontrol_whitelist_ranges_count =
+        ARRAY_SIZE(gp10b_runcontrol_whitelist_ranges);
+/* quad ctl: both the offset list and the range list have no entries in this file */
+static const u32 gp10b_qctl_whitelist[] = {
+};
+static const u32 gp10b_qctl_whitelist_count =
+        ARRAY_SIZE(gp10b_qctl_whitelist);
+static const struct regop_offset_range gp10b_qctl_whitelist_ranges[] = {
+};
+static const u32 gp10b_qctl_whitelist_ranges_count =
+        ARRAY_SIZE(gp10b_qctl_whitelist_ranges);
+const struct regop_offset_range *gp10b_get_global_whitelist_ranges(void)
+{       /* Returns the file-local gp10b global whitelist range table. */
+        return gp10b_global_whitelist_ranges;
+}
+int gp10b_get_global_whitelist_ranges_count(void)
+{       /* Returns the ARRAY_SIZE of the global range table (stored as u32, returned as int). */
+        return gp10b_global_whitelist_ranges_count;
+}
+const struct regop_offset_range *gp10b_get_context_whitelist_ranges(void)
+{       /* Returns the global range table: this file defines no separate context table. */
+        return gp10b_global_whitelist_ranges;
+}
+int gp10b_get_context_whitelist_ranges_count(void)
+{       /* Returns the global table's entry count, matching the table the context getter hands out. */
+        return gp10b_global_whitelist_ranges_count;
+}
+const u32 *gp10b_get_runcontrol_whitelist(void)
+{       /* Returns the runcontrol offset list, which has no entries in this file. */
+        return gp10b_runcontrol_whitelist;
+}
+int gp10b_get_runcontrol_whitelist_count(void)
+{       /* Returns the ARRAY_SIZE of the runcontrol offset list (stored as u32, returned as int). */
+        return gp10b_runcontrol_whitelist_count;
+}
+const struct regop_offset_range *gp10b_get_runcontrol_whitelist_ranges(void)
+{       /* Returns the runcontrol range table, which has no entries in this file. */
+        return gp10b_runcontrol_whitelist_ranges;
+}
+int gp10b_get_runcontrol_whitelist_ranges_count(void)
+{       /* Returns the ARRAY_SIZE of the runcontrol range table (stored as u32, returned as int). */
+        return gp10b_runcontrol_whitelist_ranges_count;
+}
+const u32 *gp10b_get_qctl_whitelist(void)
+{       /* Returns the quad ctl offset list, which has no entries in this file. */
+        return gp10b_qctl_whitelist;
+}
+int gp10b_get_qctl_whitelist_count(void)
+{       /* Returns the ARRAY_SIZE of the quad ctl offset list (stored as u32, returned as int). */
+        return gp10b_qctl_whitelist_count;
+}
+const struct regop_offset_range *gp10b_get_qctl_whitelist_ranges(void)
+{       /* Returns the quad ctl range table, which has no entries in this file. */
+        return gp10b_qctl_whitelist_ranges;
+}
+int gp10b_get_qctl_whitelist_ranges_count(void)
+{       /* Returns the ARRAY_SIZE of the quad ctl range table (stored as u32, returned as int). */
+        return gp10b_qctl_whitelist_ranges_count;
+}
+int gp10b_apply_smpc_war(struct dbg_session_gk20a *dbg_s)
+{
+        /* SMPC workaround hook: not needed on gp10b, so dbg_s is unused and 0 is returned */
+        return 0;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/regops_gp10b.h b/drivers/gpu/nvgpu/gp10b/regops_gp10b.h
new file mode 100644
index 00000000..7bc08189
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/regops_gp10b.h
@@ -0,0 +1,44 @@
+/*
+ *
+ * Tegra GP10B GPU Debugger Driver Register Ops
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION. All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef __REGOPS_GP10B_H_
+#define __REGOPS_GP10B_H_
+struct dbg_session_gk20a; /* forward declaration: only used through a pointer below */
+const struct regop_offset_range *gp10b_get_global_whitelist_ranges(void);
+int gp10b_get_global_whitelist_ranges_count(void);
+const struct regop_offset_range *gp10b_get_context_whitelist_ranges(void); /* regops_gp10b.c returns the global table here */
+int gp10b_get_context_whitelist_ranges_count(void); /* and the global table's count here */
+const u32 *gp10b_get_runcontrol_whitelist(void);
+int gp10b_get_runcontrol_whitelist_count(void);
+const struct regop_offset_range *gp10b_get_runcontrol_whitelist_ranges(void);
+int gp10b_get_runcontrol_whitelist_ranges_count(void);
+const u32 *gp10b_get_qctl_whitelist(void);
+int gp10b_get_qctl_whitelist_count(void);
+const struct regop_offset_range *gp10b_get_qctl_whitelist_ranges(void);
+int gp10b_get_qctl_whitelist_ranges_count(void);
+int gp10b_apply_smpc_war(struct dbg_session_gk20a *dbg_s); /* regops_gp10b.c: does nothing and returns 0 */
+#endif /* __REGOPS_GP10B_H_ */
diff --git a/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.c b/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.c
new file mode 100644
index 00000000..3bbfde0a
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.c
@@ -0,0 +1,160 @@
+/*
+ * GP10B RPFB
+ *
+ * Copyright (c) 2015, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include <nvgpu/dma.h>
+#include "gk20a/gk20a.h"
+#include "rpfb_gp10b.h"
+#include <nvgpu/hw/gp10b/hw_fifo_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_fb_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_bus_gp10b.h>
+#include <nvgpu/hw/gp10b/hw_gmmu_gp10b.h>
+/* Allocate+map the fault buffer in the bar2 VM if bar2_desc has no GPU VA yet, then program its address and the enable value. */
+int gp10b_replayable_pagefault_buffer_init(struct gk20a *g)
+{
+        struct vm_gk20a *bar2_vm = g->mm.bar2.vm;
+        size_t buf_bytes = NV_UVM_FAULT_BUF_SIZE *
+                fifo_replay_fault_buffer_size_hw_entries_v();
+        u32 base_lo, base_hi;
+        int ret;
+        gk20a_dbg_fn("");
+        if (g->mm.bar2_desc.gpu_va == 0) {
+                ret = nvgpu_dma_alloc_map_sys(bar2_vm, buf_bytes,
+                                                &g->mm.bar2_desc);
+                if (ret != 0) {
+                        nvgpu_err(g, "Error in replayable fault buffer");
+                        return ret;
+                }
+        }
+        base_lo = u64_lo32(g->mm.bar2_desc.gpu_va >> 12);
+        base_hi = u64_hi32(g->mm.bar2_desc.gpu_va);
+        gk20a_writel(g, fifo_replay_fault_buffer_hi_r(),
+                        fifo_replay_fault_buffer_hi_base_f(base_hi));
+        gk20a_writel(g, fifo_replay_fault_buffer_lo_r(),
+                        fifo_replay_fault_buffer_lo_base_f(base_lo) |
+                        fifo_replay_fault_buffer_lo_enable_true_v());
+        gk20a_dbg_fn("done");
+        return 0;
+}
+void gp10b_replayable_pagefault_buffer_deinit(struct gk20a *g)
+{
+        /* Hand bar2_desc back through nvgpu_dma_unmap_free() using the bar2 VM. */
+        nvgpu_dma_unmap_free(g->mm.bar2.vm, &g->mm.bar2_desc);
+}
+u32 gp10b_replayable_pagefault_buffer_get_index(struct gk20a *g)
+{       /* Reads the GET index register; logs an error, but still returns the value, when it is not below the HW entry count. */
+        u32 idx;
+        gk20a_dbg_fn("");
+        idx = gk20a_readl(g, fifo_replay_fault_buffer_get_r());
+        if (!(idx < fifo_replay_fault_buffer_size_hw_entries_v()))
+                nvgpu_err(g, "Error in replayable fault buffer");
+        gk20a_dbg_fn("done");
+        return idx;
+}
+u32 gp10b_replayable_pagefault_buffer_put_index(struct gk20a *g)
+{       /* Reads the PUT index register; logs an error, but still returns the value, when it is not below the HW entry count. */
+        u32 idx;
+        gk20a_dbg_fn("");
+        idx = gk20a_readl(g, fifo_replay_fault_buffer_put_r());
+        if (!(idx < fifo_replay_fault_buffer_size_hw_entries_v()))
+                nvgpu_err(g, "Error in UVM");
+        gk20a_dbg_fn("done");
+        return idx;
+}
+bool gp10b_replayable_pagefault_buffer_is_empty(struct gk20a *g)
+{       /* Empty when the GET and PUT index registers read the same value. */
+        const u32 rd = gk20a_readl(g, fifo_replay_fault_buffer_get_r());
+        const u32 wr = gk20a_readl(g, fifo_replay_fault_buffer_put_r());
+        return rd == wr;
+}
+bool gp10b_replayable_pagefault_buffer_is_full(struct gk20a *g)
+{       /* Full: GET == (PUT + 1) modulo the size register; a size register reading 0 reports "not full" instead of dividing by zero. */
+        u32 get_idx = gk20a_readl(g, fifo_replay_fault_buffer_get_r());
+        u32 put_idx = gk20a_readl(g, fifo_replay_fault_buffer_put_r());
+        u32 hw_entries = gk20a_readl(g, fifo_replay_fault_buffer_size_r());
+        return hw_entries != 0 && get_idx == ((put_idx + 1) % hw_entries);
+}
+bool gp10b_replayable_pagefault_buffer_is_overflow(struct gk20a *g)
+{       /* True when the overflow field helper yields non-zero for the info register value. */
+        u32 reg = gk20a_readl(g, fifo_replay_fault_buffer_info_r());
+        return fifo_replay_fault_buffer_info_overflow_f(reg) != 0;
+}
+void gp10b_replayable_pagefault_buffer_clear_overflow(struct gk20a *g)
+{       /* Read-modify-write: ORs the overflow_clear value into the info register. */
+        u32 reg = gk20a_readl(g, fifo_replay_fault_buffer_info_r());
+        reg = reg | fifo_replay_fault_buffer_info_overflow_clear_v();
+        gk20a_writel(g, fifo_replay_fault_buffer_info_r(), reg);
+}
+void gp10b_replayable_pagefault_buffer_info(struct gk20a *g)
+{       /* Debug dump of the fault buffer registers and state via pr_info(); u32 values use %u, bool results are promoted to int and keep %d. */
+        gk20a_dbg_fn("");
+        pr_info("rpfb low: 0x%x\n",
+                (gk20a_readl(g, fifo_replay_fault_buffer_lo_r()) >> 12));
+        pr_info("rpfb hi: 0x%x\n",
+                gk20a_readl(g, fifo_replay_fault_buffer_hi_r()));
+        pr_info("rpfb enabled: 0x%x\n",
+                (gk20a_readl(g, fifo_replay_fault_buffer_lo_r()) & 0x1));
+        pr_info("rpfb size: %u\n",
+                gk20a_readl(g, fifo_replay_fault_buffer_size_r()));
+        pr_info("rpfb get index: %u\n",
+                gp10b_replayable_pagefault_buffer_get_index(g));
+        pr_info("rpfb put index: %u\n",
+                gp10b_replayable_pagefault_buffer_put_index(g));
+        pr_info("rpfb empty: %d\n",
+                gp10b_replayable_pagefault_buffer_is_empty(g));
+        pr_info("rpfb full  %d\n",
+                gp10b_replayable_pagefault_buffer_is_full(g));
+        pr_info("rpfb overflow  %d\n",
+                gp10b_replayable_pagefault_buffer_is_overflow(g));
+        gk20a_dbg_fn("done");
+}
diff --git a/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.h b/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.h
new file mode 100644
index 00000000..ee210a5f
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/rpfb_gp10b.h
@@ -0,0 +1,39 @@
+/*
+ * Copyright (c) 2015, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef RPFB_GP10B_H
+#define RPFB_GP10B_H
+struct gk20a; /* forward declaration: only used through a pointer below */
+#define NV_UVM_FAULT_BUF_SIZE 32 /* multiplied by the HW entry count to size the buffer in rpfb_gp10b.c */
+int gp10b_replayable_pagefault_buffer_init(struct gk20a *g);
+u32 gp10b_replayable_pagefault_buffer_get_index(struct gk20a *g);
+u32 gp10b_replayable_pagefault_buffer_put_index(struct gk20a *g);
+bool gp10b_replayable_pagefault_buffer_is_empty(struct gk20a *g);
+bool gp10b_replayable_pagefault_buffer_is_full(struct gk20a *g);
+bool gp10b_replayable_pagefault_buffer_is_overflow(struct gk20a *g);
+void gp10b_replayable_pagefault_buffer_clear_overflow(struct gk20a *g);
+void gp10b_replayable_pagefault_buffer_info(struct gk20a *g);
+void gp10b_replayable_pagefault_buffer_deinit(struct gk20a *g);
+#endif /* RPFB_GP10B_H */
diff --git a/drivers/gpu/nvgpu/gp10b/therm_gp10b.c b/drivers/gpu/nvgpu/gp10b/therm_gp10b.c
new file mode 100644
index 00000000..e02259d8
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/therm_gp10b.c
@@ -0,0 +1,141 @@
+/*
+ * GP10B Therm
+ *
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#include "gk20a/gk20a.h"
+#include "therm_gp10b.h"
+#include <nvgpu/soc.h>
+#include <nvgpu/hw/gp10b/hw_therm_gp10b.h>
+int gp10b_init_therm_setup_hw(struct gk20a *g)
+{       /* Programs the NV_THERM slowdown and gradual-stepping registers below; always returns 0. */
+        u32 v; /* scratch value for the read-modify-write sequences */
+        gk20a_dbg_fn("");
+        /* program NV_THERM registers, starting with the enables for external therm events 0-2 */
+        gk20a_writel(g, therm_use_a_r(), therm_use_a_ext_therm_0_enable_f() |
+                                        therm_use_a_ext_therm_1_enable_f()  |
+                                        therm_use_a_ext_therm_2_enable_f());
+        gk20a_writel(g, therm_evt_ext_therm_0_r(),
+                therm_evt_ext_therm_0_slow_factor_f(0x2));
+        gk20a_writel(g, therm_evt_ext_therm_1_r(),
+                therm_evt_ext_therm_1_slow_factor_f(0x6));
+        gk20a_writel(g, therm_evt_ext_therm_2_r(),
+                therm_evt_ext_therm_2_slow_factor_f(0xe));
+        gk20a_writel(g, therm_grad_stepping_table_r(0), /* table entry 0: by1p5, by2, by4, by8, by8 (all via the factor0_fpdiv_* constants) */
+                therm_grad_stepping_table_slowdown_factor0_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by1p5_f()) |
+                therm_grad_stepping_table_slowdown_factor1_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by2_f()) |
+                therm_grad_stepping_table_slowdown_factor2_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by4_f()) |
+                therm_grad_stepping_table_slowdown_factor3_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()) |
+                therm_grad_stepping_table_slowdown_factor4_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()));
+        gk20a_writel(g, therm_grad_stepping_table_r(1), /* table entry 1: every factor is by8 */
+                therm_grad_stepping_table_slowdown_factor0_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()) |
+                therm_grad_stepping_table_slowdown_factor1_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()) |
+                therm_grad_stepping_table_slowdown_factor2_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()) |
+                therm_grad_stepping_table_slowdown_factor3_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()) |
+                therm_grad_stepping_table_slowdown_factor4_f(
+                therm_grad_stepping_table_slowdown_factor0_fpdiv_by8_f()));
+        v = gk20a_readl(g, therm_clk_timing_r(0)); /* read-modify-write: OR in grad_slowdown enabled */
+        v |= therm_clk_timing_grad_slowdown_enabled_f();
+        gk20a_writel(g, therm_clk_timing_r(0), v);
+        v = gk20a_readl(g, therm_config2_r()); /* read-modify-write: OR in grad_enable and slowdown_factor_extended */
+        v |= therm_config2_grad_enable_f(1);
+        v |= therm_config2_slowdown_factor_extended_f(1);
+        gk20a_writel(g, therm_config2_r(), v);
+        gk20a_writel(g, therm_grad_stepping1_r(),
+                        therm_grad_stepping1_pdiv_duration_f(32));
+        v = gk20a_readl(g, therm_grad_stepping0_r()); /* read-modify-write: OR in feature_enable */
+        v |= therm_grad_stepping0_feature_enable_f();
+        gk20a_writel(g, therm_grad_stepping0_r(), v);
+        return 0;
+}
+/* Set the idle filter and delay fields in every active engine's gate control
+ * register, then clear the FECS and HUBMMU idle filter value fields. Returns 0. */
+int gp10b_elcg_init_idle_filters(struct gk20a *g)
+{
+        struct fifo_gk20a *fifo = &g->fifo;
+        u32 slot, eng, ctrl, filt;
+        gk20a_dbg_fn("");
+        for (slot = 0; slot < fifo->num_engines; slot++) {
+                eng = fifo->active_engines_list[slot];
+                ctrl = gk20a_readl(g, therm_gate_ctrl_r(eng));
+                if (nvgpu_platform_is_simulation(g)) {
+                        ctrl = set_field(ctrl,
+                                therm_gate_ctrl_eng_delay_after_m(),
+                                therm_gate_ctrl_eng_delay_after_f(4));
+                }
+                /* mantissa 2 * (1 << exponent 9) = 1024 clks */
+                ctrl = set_field(ctrl,
+                        therm_gate_ctrl_eng_idle_filt_exp_m(),
+                        therm_gate_ctrl_eng_idle_filt_exp_f(9));
+                ctrl = set_field(ctrl,
+                        therm_gate_ctrl_eng_idle_filt_mant_m(),
+                        therm_gate_ctrl_eng_idle_filt_mant_f(2));
+                ctrl = set_field(ctrl,
+                        therm_gate_ctrl_eng_delay_before_m(),
+                        therm_gate_ctrl_eng_delay_before_f(4));
+                gk20a_writel(g, therm_gate_ctrl_r(eng), ctrl);
+        }
+        /* clear the fecs_idle_filter value field (default of 0) */
+        filt = gk20a_readl(g, therm_fecs_idle_filter_r());
+        filt &= ~therm_fecs_idle_filter_value_m();
+        gk20a_writel(g, therm_fecs_idle_filter_r(), filt);
+        /* clear the hubmmu_idle_filter value field (default of 0) */
+        filt = gk20a_readl(g, therm_hubmmu_idle_filter_r());
+        filt &= ~therm_hubmmu_idle_filter_value_m();
+        gk20a_writel(g, therm_hubmmu_idle_filter_r(), filt);
+        gk20a_dbg_fn("done");
+        return 0;
+}
+void gp10b_init_therm_ops(struct gpu_ops *gops)
+{       /* Installs the two gp10b therm callbacks. NOTE(review): non-static, yet therm_gp10b.h in this patch has no prototype for it - confirm it is still needed. */
+        gops->therm.init_therm_setup_hw = gp10b_init_therm_setup_hw;
+        gops->therm.elcg_init_idle_filters = gp10b_elcg_init_idle_filters;
+}
diff --git a/drivers/gpu/nvgpu/gp10b/therm_gp10b.h b/drivers/gpu/nvgpu/gp10b/therm_gp10b.h
new file mode 100644
index 00000000..2a40b73c
--- /dev/null
+++ b/drivers/gpu/nvgpu/gp10b/therm_gp10b.h
@@ -0,0 +1,29 @@
+/*
+ * Copyright (c) 2015-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+#ifndef THERM_GP10B_H
+#define THERM_GP10B_H
+struct gk20a; /* forward declaration: only used through a pointer below */
+int gp10b_init_therm_setup_hw(struct gk20a *g); /* therm_gp10b.c: programs the therm registers, always returns 0 */
+int gp10b_elcg_init_idle_filters(struct gk20a *g); /* therm_gp10b.c: programs gate control idle filters, always returns 0 */
+#endif /* THERM_GP10B_H */