From de8e057f7eebcfe676278826ab457bf86b1b36fd Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Thu, 3 Aug 2017 21:43:50 -0700
Subject: gpu: nvgpu: GV100 support

Adds support of GV100 up to devinit.

JIRA: EVLR-1693

Change-Id: Ic7aa5f1c20714e05954139f143abb6a3459858fc
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1532747
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 441 ++++++++++++++++++++++++++++++++++++
 1 file changed, 441 insertions(+)
 create mode 100644 drivers/gpu/nvgpu/gv100/hal_gv100.c

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
new file mode 100644
index 00000000..337c607f
--- /dev/null
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -0,0 +1,441 @@
+/*
+ * GV100 Tegra HAL interface
+ *
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ */
+
+#include <linux/types.h>
+#include <linux/printk.h>
+
+#include <linux/types.h>
+#include <linux/tegra_gpu_t19x.h>
+
+#include "gk20a/gk20a.h"
+#include "gk20a/fifo_gk20a.h"
+#include "gk20a/ctxsw_trace_gk20a.h"
+#include "gk20a/fecs_trace_gk20a.h"
+#include "gk20a/css_gr_gk20a.h"
+#include "gk20a/mc_gk20a.h"
+#include "gk20a/dbg_gpu_gk20a.h"
+#include "gk20a/bus_gk20a.h"
+#include "gk20a/pramin_gk20a.h"
+#include "gk20a/flcn_gk20a.h"
+#include "gk20a/regops_gk20a.h"
+
+#include "gm20b/ltc_gm20b.h"
+#include "gm20b/gr_gm20b.h"
+#include "gm20b/fifo_gm20b.h"
+
+#include "gp106/clk_gp106.h"
+#include "gp106/clk_arb_gp106.h"
+#include "gp106/pmu_gp106.h"
+
+#include "gm206/bios_gm206.h"
+#include "gp106/therm_gp106.h"
+#include "gp106/xve_gp106.h"
+#include "gp106/clk_gp106.h"
+#include "gp106/flcn_gp106.h"
+#include "gp10b/ltc_gp10b.h"
+#include "gp10b/therm_gp10b.h"
+#include "gp10b/mc_gp10b.h"
+#include "gp10b/ce_gp10b.h"
+#include "gp10b/priv_ring_gp10b.h"
+#include "gp10b/fifo_gp10b.h"
+#include "gp10b/fecs_trace_gp10b.h"
+
+#include "gv11b/hal_gv11b.h"
+#include "gv11b/gr_gv11b.h"
+#include "gv11b/mc_gv11b.h"
+#include "gv11b/ltc_gv11b.h"
+#include "gv11b/gv11b.h"
+#include "gv11b/ce_gv11b.h"
+#include "gv100/gr_ctx_gv100.h"
+#include "gv100/mm_gv100.h"
+#include "gv11b/pmu_gv11b.h"
+#include "gv100/fb_gv100.h"
+#include "gv11b/fifo_gv11b.h"
+#include "gv11b/gv11b_gating_reglist.h"
+#include "gv11b/regops_gv11b.h"
+#include "gv11b/subctx_gv11b.h"
+
+#include "gv100.h"
+#include "hal_gv100.h"
+
+#include <nvgpu/debug.h>
+#include <nvgpu/enabled.h>
+
+#include <nvgpu/hw/gv100/hw_proj_gv100.h>
+#include <nvgpu/hw/gv100/hw_fifo_gv100.h>
+#include <nvgpu/hw/gv100/hw_ram_gv100.h>
+#include <nvgpu/hw/gv100/hw_top_gv100.h>
+#include <nvgpu/hw/gv100/hw_pram_gv100.h>
+
+static int gv100_get_litter_value(struct gk20a *g, int value)
+{
+	int ret = EINVAL; /* NOTE(review): unknown ids yield positive EINVAL */
+	switch (value) { /* map a GPU_LIT_* id to its proj_*_v() value */
+	case GPU_LIT_NUM_GPCS:
+		ret = proj_scal_litter_num_gpcs_v();
+		break;
+	case GPU_LIT_NUM_PES_PER_GPC:
+		ret = proj_scal_litter_num_pes_per_gpc_v();
+		break;
+	case GPU_LIT_NUM_ZCULL_BANKS:
+		ret = proj_scal_litter_num_zcull_banks_v();
+		break;
+	case GPU_LIT_NUM_TPC_PER_GPC:
+		ret = proj_scal_litter_num_tpc_per_gpc_v();
+		break;
+	case GPU_LIT_NUM_SM_PER_TPC:
+		ret = proj_scal_litter_num_sm_per_tpc_v();
+		break;
+	case GPU_LIT_NUM_FBPS:
+		ret = proj_scal_litter_num_fbps_v();
+		break;
+	case GPU_LIT_GPC_BASE:
+		ret = proj_gpc_base_v();
+		break;
+	case GPU_LIT_GPC_STRIDE:
+		ret = proj_gpc_stride_v();
+		break;
+	case GPU_LIT_GPC_SHARED_BASE:
+		ret = proj_gpc_shared_base_v();
+		break;
+	case GPU_LIT_TPC_IN_GPC_BASE:
+		ret = proj_tpc_in_gpc_base_v();
+		break;
+	case GPU_LIT_TPC_IN_GPC_STRIDE:
+		ret = proj_tpc_in_gpc_stride_v();
+		break;
+	case GPU_LIT_TPC_IN_GPC_SHARED_BASE:
+		ret = proj_tpc_in_gpc_shared_base_v();
+		break;
+	case GPU_LIT_PPC_IN_GPC_BASE:
+		ret = proj_ppc_in_gpc_base_v();
+		break; /* without this, BASE falls through and reports the STRIDE */
+	case GPU_LIT_PPC_IN_GPC_STRIDE:
+		ret = proj_ppc_in_gpc_stride_v();
+		break;
+	case GPU_LIT_ROP_BASE:
+		ret = proj_rop_base_v();
+		break;
+	case GPU_LIT_ROP_STRIDE:
+		ret = proj_rop_stride_v();
+		break;
+	case GPU_LIT_ROP_SHARED_BASE:
+		ret = proj_rop_shared_base_v();
+		break;
+	case GPU_LIT_HOST_NUM_ENGINES:
+		ret = proj_host_num_engines_v();
+		break;
+	case GPU_LIT_HOST_NUM_PBDMA:
+		ret = proj_host_num_pbdma_v();
+		break;
+	case GPU_LIT_LTC_STRIDE:
+		ret = proj_ltc_stride_v();
+		break;
+	case GPU_LIT_LTS_STRIDE:
+		ret = proj_lts_stride_v();
+		break;
+	case GPU_LIT_NUM_FBPAS:
+		ret = proj_scal_litter_num_fbpas_v();
+		break;
+	case GPU_LIT_FBPA_STRIDE:
+		ret = proj_fbpa_stride_v();
+		break;
+	case GPU_LIT_SM_PRI_STRIDE:
+		ret = proj_sm_stride_v();
+		break;
+	default:
+		break;
+	}
+
+	return ret;
+}
+
+/*
+ * Populate the common gk20a GPU characteristics for @g, then set the
+ * TSG-subcontext support flag. Returns 0, or the gk20a helper's error.
+ */
+int gv100_init_gpu_characteristics(struct gk20a *g)
+{
+	int status = gk20a_init_gpu_characteristics(g);
+
+	if (status)
+		return status;
+
+	g->gpu_characteristics.flags |=
+		NVGPU_GPU_FLAGS_SUPPORT_TSG_SUBCONTEXTS;
+	return 0;
+}
+
+
+/* gv100 HAL table; gv100_init_hal() copies entries from it into g->ops. */
+static const struct gpu_ops gv100_ops = {
+	.ltc = {
+		.determine_L2_size_bytes = gp10b_determine_L2_size_bytes,
+		.set_zbc_s_entry = gv11b_ltc_set_zbc_stencil_entry,
+		.set_zbc_color_entry = gm20b_ltc_set_zbc_color_entry,
+		.set_zbc_depth_entry = gm20b_ltc_set_zbc_depth_entry,
+		.init_cbc = NULL, /* explicitly left unset */
+		.init_fs_state = gv11b_ltc_init_fs_state,
+		.init_comptags = gp10b_ltc_init_comptags,
+		.cbc_ctrl = gm20b_ltc_cbc_ctrl,
+		.isr = gv11b_ltc_isr,
+		.cbc_fix_config = gv11b_ltc_cbc_fix_config,
+		.flush = gm20b_flush_ltc,
+		.set_enabled = gp10b_ltc_set_enabled,
+	},
+	.ce2 = {
+		.isr_stall = gv11b_ce_isr,
+		.isr_nonstall = gp10b_ce_nonstall_isr,
+		.get_num_pce = gv11b_ce_get_num_pce,
+	},
+	.fifo = {
+		.init_fifo_setup_hw = gv11b_init_fifo_setup_hw,
+		.bind_channel = channel_gm20b_bind,
+		.unbind_channel = channel_gv11b_unbind,
+		.disable_channel = gk20a_fifo_disable_channel,
+		.enable_channel = gk20a_fifo_enable_channel,
+		.alloc_inst = gk20a_fifo_alloc_inst,
+		.free_inst = gk20a_fifo_free_inst,
+		.setup_ramfc = channel_gv11b_setup_ramfc,
+		.channel_set_priority = gk20a_fifo_set_priority,
+		.channel_set_timeslice = gk20a_fifo_set_timeslice,
+		.default_timeslice_us = gk20a_fifo_default_timeslice_us,
+		.setup_userd = gk20a_fifo_setup_userd,
+		.userd_gp_get = gv11b_userd_gp_get,
+		.userd_gp_put = gv11b_userd_gp_put,
+		.userd_pb_get = gv11b_userd_pb_get,
+		.pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val,
+		.preempt_channel = gv11b_fifo_preempt_channel,
+		.preempt_tsg = gv11b_fifo_preempt_tsg,
+		.update_runlist = gk20a_fifo_update_runlist,
+		.trigger_mmu_fault = NULL, /* explicitly left unset */
+		.get_mmu_fault_info = NULL, /* explicitly left unset */
+		.wait_engine_idle = gk20a_fifo_wait_engine_idle,
+		.get_num_fifos = gv11b_fifo_get_num_fifos,
+		.get_pbdma_signature = gp10b_fifo_get_pbdma_signature,
+		.set_runlist_interleave = gk20a_fifo_set_runlist_interleave,
+		.tsg_set_timeslice = gk20a_fifo_tsg_set_timeslice,
+		.force_reset_ch = gk20a_fifo_force_reset_ch,
+		.engine_enum_from_type = gp10b_fifo_engine_enum_from_type,
+		.device_info_data_parse = gp10b_device_info_data_parse,
+		.eng_runlist_base_size = fifo_eng_runlist_base__size_1_v,
+		.init_engine_info = gk20a_fifo_init_engine_info,
+		.runlist_entry_size = ram_rl_entry_size_v,
+		.get_tsg_runlist_entry = gv11b_get_tsg_runlist_entry,
+		.get_ch_runlist_entry = gv11b_get_ch_runlist_entry,
+		.is_fault_engine_subid_gpc = gv11b_is_fault_engine_subid_gpc,
+		.dump_pbdma_status = gk20a_dump_pbdma_status,
+		.dump_eng_status = gv11b_dump_eng_status,
+		.dump_channel_status_ramfc = gv11b_dump_channel_status_ramfc,
+		.intr_0_error_mask = gv11b_fifo_intr_0_error_mask,
+		.is_preempt_pending = gv11b_fifo_is_preempt_pending,
+		.init_pbdma_intr_descs = gv11b_fifo_init_pbdma_intr_descs,
+		.reset_enable_hw = gv11b_init_fifo_reset_enable_hw,
+		.teardown_ch_tsg = gv11b_fifo_teardown_ch_tsg,
+		.handle_sched_error = gv11b_fifo_handle_sched_error,
+		.handle_pbdma_intr_0 = gv11b_fifo_handle_pbdma_intr_0,
+		.handle_pbdma_intr_1 = gv11b_fifo_handle_pbdma_intr_1,
+		.init_eng_method_buffers = gv11b_fifo_init_eng_method_buffers,
+		.deinit_eng_method_buffers =
+			gv11b_fifo_deinit_eng_method_buffers,
+		.tsg_bind_channel = gk20a_tsg_bind_channel,
+		.tsg_unbind_channel = gk20a_tsg_unbind_channel,
+#ifdef CONFIG_TEGRA_GK20A_NVHOST
+		.alloc_syncpt_buf = gv11b_fifo_alloc_syncpt_buf,
+		.free_syncpt_buf = gv11b_fifo_free_syncpt_buf,
+		.add_syncpt_wait_cmd = gv11b_fifo_add_syncpt_wait_cmd,
+		.get_syncpt_wait_cmd_size = gv11b_fifo_get_syncpt_wait_cmd_size,
+		.add_syncpt_incr_cmd = gv11b_fifo_add_syncpt_incr_cmd,
+		.get_syncpt_incr_cmd_size = gv11b_fifo_get_syncpt_incr_cmd_size,
+#endif /* CONFIG_TEGRA_GK20A_NVHOST */
+		.resetup_ramfc = NULL, /* explicitly left unset */
+		.device_info_fault_id = top_device_info_data_fault_id_enum_v,
+		.free_channel_ctx_header = gv11b_free_subctx_header,
+		.preempt_ch_tsg = gv11b_fifo_preempt_ch_tsg,
+		.handle_ctxsw_timeout = gv11b_fifo_handle_ctxsw_timeout,
+	},
+	.gr_ctx = {
+		.get_netlist_name = gr_gv100_get_netlist_name,
+		.is_fw_defined = gr_gv100_is_firmware_defined,
+	},
+#ifdef CONFIG_GK20A_CTXSW_TRACE
+	.fecs_trace = {
+		.alloc_user_buffer = gk20a_ctxsw_dev_ring_alloc,
+		.free_user_buffer = gk20a_ctxsw_dev_ring_free,
+		.mmap_user_buffer = gk20a_ctxsw_dev_mmap_buffer,
+		.init = gk20a_fecs_trace_init,
+		.deinit = gk20a_fecs_trace_deinit,
+		.enable = gk20a_fecs_trace_enable,
+		.disable = gk20a_fecs_trace_disable,
+		.is_enabled = gk20a_fecs_trace_is_enabled,
+		.reset = gk20a_fecs_trace_reset,
+		.flush = gp10b_fecs_trace_flush,
+		.poll = gk20a_fecs_trace_poll,
+		.bind_channel = gk20a_fecs_trace_bind_channel,
+		.unbind_channel = gk20a_fecs_trace_unbind_channel,
+		.max_entries = gk20a_gr_max_entries,
+	},
+#endif /* CONFIG_GK20A_CTXSW_TRACE */
+	.pramin = {
+		.enter = gk20a_pramin_enter,
+		.exit = gk20a_pramin_exit,
+		.data032_r = pram_data032_r,
+	},
+	.clk = {
+		.init_clk_support = gp106_init_clk_support,
+		.get_crystal_clk_hz = gp106_crystal_clk_hz,
+		.measure_freq = gp106_clk_measure_freq,
+		.suspend_clk_support = gp106_suspend_clk_support,
+	},
+	.clk_arb = { /* NOTE(review): gv100_init_hal() does not copy .clk_arb */
+		.get_arbiter_clk_domains = gp106_get_arbiter_clk_domains,
+		.get_arbiter_clk_range = gp106_get_arbiter_clk_range,
+		.get_arbiter_clk_default = gp106_get_arbiter_clk_default,
+		.get_current_pstate = nvgpu_clk_arb_get_current_pstate,
+	},
+	.mc = {
+		.intr_enable = mc_gv11b_intr_enable,
+		.intr_unit_config = mc_gp10b_intr_unit_config,
+		.isr_stall = mc_gp10b_isr_stall,
+		.intr_stall = mc_gp10b_intr_stall,
+		.intr_stall_pause = mc_gp10b_intr_stall_pause,
+		.intr_stall_resume = mc_gp10b_intr_stall_resume,
+		.intr_nonstall = mc_gp10b_intr_nonstall,
+		.intr_nonstall_pause = mc_gp10b_intr_nonstall_pause,
+		.intr_nonstall_resume = mc_gp10b_intr_nonstall_resume,
+		.enable = gk20a_mc_enable,
+		.disable = gk20a_mc_disable,
+		.reset = gk20a_mc_reset,
+		.boot_0 = gk20a_mc_boot_0,
+		.is_intr1_pending = mc_gp10b_is_intr1_pending,
+		.is_intr_hub_pending = gv11b_mc_is_intr_hub_pending,
+	},
+	.debug = {
+		.show_dump = gk20a_debug_show_dump,
+	},
+	.dbg_session_ops = {
+		.exec_reg_ops = exec_regops_gk20a,
+		.dbg_set_powergate = dbg_set_powergate,
+		.check_and_set_global_reservation =
+			nvgpu_check_and_set_global_reservation,
+		.check_and_set_context_reservation =
+			nvgpu_check_and_set_context_reservation,
+		.release_profiler_reservation =
+			nvgpu_release_profiler_reservation,
+		.perfbuffer_enable = gk20a_perfbuf_enable_locked,
+		.perfbuffer_disable = gk20a_perfbuf_disable_locked,
+	},
+	.bus = {
+		.init_hw = gk20a_bus_init_hw,
+		.isr = gk20a_bus_isr,
+		.read_ptimer = gk20a_read_ptimer,
+		.bar1_bind = NULL, /* explicitly left unset */
+	},
+#if defined(CONFIG_GK20A_CYCLE_STATS)
+	.css = {
+		.enable_snapshot = css_hw_enable_snapshot,
+		.disable_snapshot = css_hw_disable_snapshot,
+		.check_data_available = css_hw_check_data_available,
+		.set_handled_snapshots = css_hw_set_handled_snapshots,
+		.allocate_perfmon_ids = css_gr_allocate_perfmon_ids,
+		.release_perfmon_ids = css_gr_release_perfmon_ids,
+	},
+#endif /* CONFIG_GK20A_CYCLE_STATS */
+	.xve = {
+		.sw_init          = xve_sw_init_gp106,
+		.get_speed        = xve_get_speed_gp106,
+		.set_speed        = xve_set_speed_gp106,
+		.available_speeds = xve_available_speeds_gp106,
+		.xve_readl        = xve_xve_readl_gp106,
+		.xve_writel       = xve_xve_writel_gp106,
+		.disable_aspm     = xve_disable_aspm_gp106,
+		.reset_gpu        = xve_reset_gpu_gp106,
+#if defined(CONFIG_PCI_MSI)
+		.rearm_msi        = xve_rearm_msi_gp106,
+#endif /* CONFIG_PCI_MSI */
+		.enable_shadow_rom = xve_enable_shadow_rom_gp106,
+		.disable_shadow_rom = xve_disable_shadow_rom_gp106,
+	},
+	.falcon = {
+		.falcon_hal_sw_init = gp106_falcon_hal_sw_init,
+	},
+	.priv_ring = {
+		.isr = gp10b_priv_ring_isr,
+	},
+	.chip_init_gpu_characteristics = gv100_init_gpu_characteristics,
+	.get_litter_value = gv100_get_litter_value,
+	.bios_init = gm206_bios_init,
+}; /* NOTE(review): no .clock_gating/.therm set, yet gv100_init_hal() copies both */
+/* Install the gv100 HAL into @g: ops tables, enable flags and class ids. */
+int gv100_init_hal(struct gk20a *g)
+{
+	struct gpu_ops *gops = &g->ops; /* table being filled */
+	struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics;
+
+	gops->ltc = gv100_ops.ltc;
+	gops->ce2 = gv100_ops.ce2;
+	gops->clock_gating = gv100_ops.clock_gating;
+	gops->fifo = gv100_ops.fifo;
+	gops->gr_ctx = gv100_ops.gr_ctx;
+	gops->fecs_trace = gv100_ops.fecs_trace;
+	gops->pramin = gv100_ops.pramin;
+	gops->therm = gv100_ops.therm;
+	gops->mc = gv100_ops.mc;
+	gops->debug = gv100_ops.debug;
+	gops->dbg_session_ops = gv100_ops.dbg_session_ops;
+	gops->bus = gv100_ops.bus;
+#if defined(CONFIG_GK20A_CYCLE_STATS)
+	gops->css = gv100_ops.css;
+#endif
+	gops->xve = gv100_ops.xve;
+	gops->falcon = gv100_ops.falcon;
+	gops->priv_ring = gv100_ops.priv_ring;
+
+	/* clocks: hooks are copied one by one; .clk_arb is not copied here */
+	gops->clk.init_clk_support = gv100_ops.clk.init_clk_support;
+	gops->clk.get_crystal_clk_hz = gv100_ops.clk.get_crystal_clk_hz;
+	gops->clk.measure_freq = gv100_ops.clk.measure_freq;
+	gops->clk.suspend_clk_support = gv100_ops.clk.suspend_clk_support;
+
+	/* Lone functions: ops stored directly in gpu_ops, not in a sub-struct */
+	gops->chip_init_gpu_characteristics =
+		gv100_ops.chip_init_gpu_characteristics;
+	gops->get_litter_value = gv100_ops.get_litter_value;
+	gops->bios_init = gv100_ops.bios_init;
+
+	__nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true);
+	__nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
+	__nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
+	/* for now */
+	__nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false);
+
+	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
+
+	gv11b_init_gr(g);
+	gv100_init_fb(gops);
+	gv100_init_mm(gops);
+	gp106_init_pmu_ops(g);
+
+	g->name = "gv10x";
+
+	c->twod_class = FERMI_TWOD_A;
+	c->threed_class = VOLTA_A;
+	c->compute_class = VOLTA_COMPUTE_A;
+	c->gpfifo_class = VOLTA_CHANNEL_GPFIFO_A;
+	c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B;
+	c->dma_copy_class = VOLTA_DMA_COPY_A;
+
+	return 0; /* this function has no failure path */
+}
-- 
cgit v1.2.2


From 4bb0896912440d126ae47da350b448f37dabc63d Mon Sep 17 00:00:00 2001
From: Sunny He <suhe@nvidia.com>
Date: Mon, 31 Jul 2017 14:40:46 -0700
Subject: gpu: nvgpu: Reorg fb HAL initialization

Reorganize HAL initialization to remove inheritance and construct
the gpu_ops struct at compile time. This patch only covers the
fb sub-module of the gpu_ops struct.

Perform HAL function assignments in hal_gxxxx.c through the
population of a chip-specific copy of gpu_ops.

Jira NVGPU-74

Change-Id: I3fdbf6059ef664caf8d33797a8a5f3f8eb6485bf
Signed-off-by: Sunny He <suhe@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1537748
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 28 ++++++++++++++++++++++++++--
 1 file changed, 26 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 337c607f..a2a131da 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -30,10 +30,14 @@
 #include "gk20a/pramin_gk20a.h"
 #include "gk20a/flcn_gk20a.h"
 #include "gk20a/regops_gk20a.h"
+#include "gk20a/fb_gk20a.h"
 
 #include "gm20b/ltc_gm20b.h"
 #include "gm20b/gr_gm20b.h"
 #include "gm20b/fifo_gm20b.h"
+#include "gm20b/fb_gm20b.h"
+
+#include "gp10b/fb_gp10b.h"
 
 #include "gp106/clk_gp106.h"
 #include "gp106/clk_arb_gp106.h"
@@ -61,7 +65,7 @@
 #include "gv100/gr_ctx_gv100.h"
 #include "gv100/mm_gv100.h"
 #include "gv11b/pmu_gv11b.h"
-#include "gv100/fb_gv100.h"
+#include "gv11b/fb_gv11b.h"
 #include "gv11b/fifo_gv11b.h"
 #include "gv11b/gv11b_gating_reglist.h"
 #include "gv11b/regops_gv11b.h"
@@ -69,6 +73,7 @@
 
 #include "gv100.h"
 #include "hal_gv100.h"
+#include "gv100/fb_gv100.h"
 
 #include <nvgpu/debug.h>
 #include <nvgpu/enabled.h>
@@ -200,6 +205,23 @@ static const struct gpu_ops gv100_ops = {
 		.isr_nonstall = gp10b_ce_nonstall_isr,
 		.get_num_pce = gv11b_ce_get_num_pce,
 	},
+	.fb = {
+		.reset = gv100_fb_reset,
+		.init_hw = gk20a_fb_init_hw,
+		.init_fs_state = gv11b_fb_init_fs_state,
+		.init_cbc = gv11b_fb_init_cbc,
+		.set_mmu_page_size = gm20b_fb_set_mmu_page_size,
+		.set_use_full_comp_tag_line =
+			gm20b_fb_set_use_full_comp_tag_line,
+		.compression_page_size = gp10b_fb_compression_page_size,
+		.compressible_page_size = gp10b_fb_compressible_page_size,
+		.vpr_info_fetch = gm20b_fb_vpr_info_fetch,
+		.dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info,
+		.is_debug_mode_enabled = gm20b_fb_debug_mode_enabled,
+		.set_debug_mode = gm20b_fb_set_debug_mode,
+		.tlb_invalidate = gk20a_fb_tlb_invalidate,
+		.hub_isr = gv11b_fb_hub_isr,
+	},
 	.fifo = {
 		.init_fifo_setup_hw = gv11b_init_fifo_setup_hw,
 		.bind_channel = channel_gm20b_bind,
@@ -424,10 +446,12 @@ int gv100_init_hal(struct gk20a *g)
 	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
 
 	gv11b_init_gr(g);
-	gv100_init_fb(gops);
 	gv100_init_mm(gops);
 	gp106_init_pmu_ops(g);
 
+	gv11b_init_uncompressed_kind_map();
+	gv11b_init_kind_attr();
+
 	g->name = "gv10x";
 
 	c->twod_class = FERMI_TWOD_A;
-- 
cgit v1.2.2


From 8ab6445df5b24c200ac4e346684119a85008e0e3 Mon Sep 17 00:00:00 2001
From: Sunny He <suhe@nvidia.com>
Date: Wed, 26 Jul 2017 14:23:01 -0700
Subject: gpu: nvgpu: Reorg mm HAL initialization

Reorganize HAL initialization to remove inheritance and construct
the gpu_ops struct at compile time. This patch only covers the
mm sub-module of the gpu_ops struct.

Perform HAL function assignments in hal_gxxxx.c through the
population of a chip-specific copy of gpu_ops.

Jira NVGPU-74

Change-Id: I5fd295c6473d5b4a6178c0c6be8fcf8f4c33f2e3
Signed-off-by: Sunny He <suhe@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1537754
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 33 +++++++++++++++++++++++++++++++--
 1 file changed, 31 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index a2a131da..74bc48fb 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -31,11 +31,13 @@
 #include "gk20a/flcn_gk20a.h"
 #include "gk20a/regops_gk20a.h"
 #include "gk20a/fb_gk20a.h"
+#include "gk20a/mm_gk20a.h"
 
 #include "gm20b/ltc_gm20b.h"
 #include "gm20b/gr_gm20b.h"
 #include "gm20b/fifo_gm20b.h"
 #include "gm20b/fb_gm20b.h"
+#include "gm20b/mm_gm20b.h"
 
 #include "gp10b/fb_gp10b.h"
 
@@ -55,6 +57,7 @@
 #include "gp10b/priv_ring_gp10b.h"
 #include "gp10b/fifo_gp10b.h"
 #include "gp10b/fecs_trace_gp10b.h"
+#include "gp10b/mm_gp10b.h"
 
 #include "gv11b/hal_gv11b.h"
 #include "gv11b/gr_gv11b.h"
@@ -63,7 +66,7 @@
 #include "gv11b/gv11b.h"
 #include "gv11b/ce_gv11b.h"
 #include "gv100/gr_ctx_gv100.h"
-#include "gv100/mm_gv100.h"
+#include "gv11b/mm_gv11b.h"
 #include "gv11b/pmu_gv11b.h"
 #include "gv11b/fb_gv11b.h"
 #include "gv11b/fifo_gv11b.h"
@@ -74,6 +77,7 @@
 #include "gv100.h"
 #include "hal_gv100.h"
 #include "gv100/fb_gv100.h"
+#include "gv100/mm_gv100.h"
 
 #include <nvgpu/debug.h>
 #include <nvgpu/enabled.h>
@@ -310,6 +314,32 @@ static const struct gpu_ops gv100_ops = {
 		.max_entries = gk20a_gr_max_entries,
 	},
 #endif /* CONFIG_GK20A_CTXSW_TRACE */
+	.mm = {
+		.support_sparse = gm20b_mm_support_sparse,
+		.gmmu_map = gk20a_locked_gmmu_map,
+		.gmmu_unmap = gk20a_locked_gmmu_unmap,
+		.vm_bind_channel = gk20a_vm_bind_channel,
+		.fb_flush = gk20a_mm_fb_flush,
+		.l2_invalidate = gk20a_mm_l2_invalidate,
+		.l2_flush = gv11b_mm_l2_flush,
+		.cbc_clean = gk20a_mm_cbc_clean,
+		.set_big_page_size = gm20b_mm_set_big_page_size,
+		.get_big_page_sizes = gm20b_mm_get_big_page_sizes,
+		.get_default_big_page_size = gp10b_mm_get_default_big_page_size,
+		.gpu_phys_addr = gv11b_gpu_phys_addr,
+		.get_physical_addr_bits = NULL,
+		.get_mmu_levels = gp10b_mm_get_mmu_levels,
+		.get_vidmem_size = gv100_mm_get_vidmem_size,
+		.init_pdb = gp10b_mm_init_pdb,
+		.init_mm_setup_hw = gv11b_init_mm_setup_hw,
+		.is_bar1_supported = gv11b_mm_is_bar1_supported,
+		.init_inst_block = gv11b_init_inst_block,
+		.mmu_fault_pending = gv11b_mm_mmu_fault_pending,
+		.init_bar2_vm = gb10b_init_bar2_vm,
+		.init_bar2_mm_hw_setup = gv11b_init_bar2_mm_hw_setup,
+		.remove_bar2_vm = gv11b_mm_remove_bar2_vm,
+		.fault_info_mem_destroy = gv11b_mm_fault_info_mem_destroy,
+	},
 	.pramin = {
 		.enter = gk20a_pramin_enter,
 		.exit = gk20a_pramin_exit,
@@ -446,7 +476,6 @@ int gv100_init_hal(struct gk20a *g)
 	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
 
 	gv11b_init_gr(g);
-	gv100_init_mm(gops);
 	gp106_init_pmu_ops(g);
 
 	gv11b_init_uncompressed_kind_map();
-- 
cgit v1.2.2


From cce0a55d2106865be14b3b39c083a0f55881f2a5 Mon Sep 17 00:00:00 2001
From: Sunny He <suhe@nvidia.com>
Date: Tue, 1 Aug 2017 17:12:03 -0700
Subject: gpu: nvgpu: gv11b: Reorg pmu HAL init

Reorganize HAL initialization to remove inheritance and construct
the gpu_ops struct at compile time. This patch only covers the
pmu sub-module of the gpu_ops struct.

Perform HAL function assignments in hal_gxxxx.c through the
population of a chip-specific copy of gpu_ops.

Jira NVGPU-74

Change-Id: I3f8a763a7bebf201c2242eecde7ff998aad07d0a
Signed-off-by: Sunny He <suhe@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1530983
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 51 +++++++++++++++++++++++++++++++++++--
 1 file changed, 49 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 74bc48fb..bd13ec08 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -32,19 +32,23 @@
 #include "gk20a/regops_gk20a.h"
 #include "gk20a/fb_gk20a.h"
 #include "gk20a/mm_gk20a.h"
+#include "gk20a/pmu_gk20a.h"
 
 #include "gm20b/ltc_gm20b.h"
 #include "gm20b/gr_gm20b.h"
 #include "gm20b/fifo_gm20b.h"
 #include "gm20b/fb_gm20b.h"
 #include "gm20b/mm_gm20b.h"
+#include "gm20b/pmu_gm20b.h"
+#include "gm20b/acr_gm20b.h"
 
 #include "gp10b/fb_gp10b.h"
 
 #include "gp106/clk_gp106.h"
 #include "gp106/clk_arb_gp106.h"
 #include "gp106/pmu_gp106.h"
-
+#include "gp106/acr_gp106.h"
+#include "gp106/sec2_gp106.h"
 #include "gm206/bios_gm206.h"
 #include "gp106/therm_gp106.h"
 #include "gp106/xve_gp106.h"
@@ -58,6 +62,7 @@
 #include "gp10b/fifo_gp10b.h"
 #include "gp10b/fecs_trace_gp10b.h"
 #include "gp10b/mm_gp10b.h"
+#include "gp10b/pmu_gp10b.h"
 
 #include "gv11b/hal_gv11b.h"
 #include "gv11b/gr_gv11b.h"
@@ -87,6 +92,7 @@
 #include <nvgpu/hw/gv100/hw_ram_gv100.h>
 #include <nvgpu/hw/gv100/hw_top_gv100.h>
 #include <nvgpu/hw/gv100/hw_pram_gv100.h>
+#include <nvgpu/hw/gv100/hw_pwr_gv100.h>
 
 static int gv100_get_litter_value(struct gk20a *g, int value)
 {
@@ -345,6 +351,45 @@ static const struct gpu_ops gv100_ops = {
 		.exit = gk20a_pramin_exit,
 		.data032_r = pram_data032_r,
 	},
+	.pmu = {
+		.init_wpr_region = gm20b_pmu_init_acr,
+		.load_lsfalcon_ucode = gp106_load_falcon_ucode,
+		.is_lazy_bootstrap = gp106_is_lazy_bootstrap,
+		.is_priv_load = gp106_is_priv_load,
+		.prepare_ucode = gp106_prepare_ucode_blob,
+		.pmu_setup_hw_and_bootstrap = gp106_bootstrap_hs_flcn,
+		.get_wpr = gp106_wpr_info,
+		.alloc_blob_space = gp106_alloc_blob_space,
+		.pmu_populate_loader_cfg = gp106_pmu_populate_loader_cfg,
+		.flcn_populate_bl_dmem_desc = gp106_flcn_populate_bl_dmem_desc,
+		.falcon_wait_for_halt = sec2_wait_for_halt,
+		.falcon_clear_halt_interrupt_status =
+			sec2_clear_halt_interrupt_status,
+		.init_falcon_setup_hw = init_sec2_setup_hw1,
+		.pmu_queue_tail = gk20a_pmu_queue_tail,
+		.pmu_get_queue_head = pwr_pmu_queue_head_r,
+		.pmu_mutex_release = gk20a_pmu_mutex_release,
+		.is_pmu_supported = gp106_is_pmu_supported,
+		.pmu_pg_supported_engines_list = gp106_pmu_pg_engines_list,
+		.pmu_elpg_statistics = gp106_pmu_elpg_statistics,
+		.pmu_mutex_acquire = gk20a_pmu_mutex_acquire,
+		.pmu_is_lpwr_feature_supported =
+			gp106_pmu_is_lpwr_feature_supported,
+		.pmu_msgq_tail = gk20a_pmu_msgq_tail,
+		.pmu_pg_engines_feature_list = gp106_pmu_pg_feature_list,
+		.pmu_get_queue_head_size = pwr_pmu_queue_head__size_1_v,
+		.pmu_queue_head = gk20a_pmu_queue_head,
+		.pmu_pg_param_post_init = nvgpu_lpwr_post_init,
+		.pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v,
+		.pmu_pg_init_param = gp106_pg_param_init,
+		.reset_engine = gp106_pmu_engine_reset,
+		.pmu_lpwr_disable_pg = nvgpu_lpwr_disable_pg,
+		.write_dmatrfbase = gp10b_write_dmatrfbase,
+		.pmu_mutex_size = pwr_pmu_mutex__size_1_v,
+		.is_engine_in_reset = gp106_pmu_is_engine_in_reset,
+		.pmu_get_queue_tail = pwr_pmu_queue_tail_r,
+		.pmu_lpwr_enable_pg = nvgpu_lpwr_enable_pg,
+	},
 	.clk = {
 		.init_clk_support = gp106_init_clk_support,
 		.get_crystal_clk_hz = gp106_crystal_clk_hz,
@@ -444,6 +489,7 @@ int gv100_init_hal(struct gk20a *g)
 	gops->fecs_trace = gv100_ops.fecs_trace;
 	gops->pramin = gv100_ops.pramin;
 	gops->therm = gv100_ops.therm;
+	gops->pmu = gv100_ops.pmu;
 	gops->mc = gv100_ops.mc;
 	gops->debug = gv100_ops.debug;
 	gops->dbg_session_ops = gv100_ops.dbg_session_ops;
@@ -470,13 +516,14 @@ int gv100_init_hal(struct gk20a *g)
 	__nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true);
 	__nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
 	__nvgpu_set_enabled(g, NVGPU_SEC_SECUREGPCCS, true);
+	__nvgpu_set_enabled(g, NVGPU_PMU_FECS_BOOTSTRAP_DONE, false);
 	/* for now */
 	__nvgpu_set_enabled(g, NVGPU_PMU_PSTATE, false);
 
+	g->pmu_lsf_pmu_wpr_init_done = 0;
 	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
 
 	gv11b_init_gr(g);
-	gp106_init_pmu_ops(g);
 
 	gv11b_init_uncompressed_kind_map();
 	gv11b_init_kind_attr();
-- 
cgit v1.2.2


From 2370fce04396b4bb66b679a54112731a0dbd7018 Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Fri, 18 Aug 2017 10:35:34 -0700
Subject: gpu: nvgpu: gv100: Enable gv100 fb and mm ops

Assign fb and mm ops for gv100.

Change-Id: I031031935cdb1fa33fd9f06af2f2229480740bc5
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1541339
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index bd13ec08..e3c2d1cb 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -483,9 +483,11 @@ int gv100_init_hal(struct gk20a *g)
 
 	gops->ltc = gv100_ops.ltc;
 	gops->ce2 = gv100_ops.ce2;
+	gops->fb = gv100_ops.fb;
 	gops->clock_gating = gv100_ops.clock_gating;
 	gops->fifo = gv100_ops.fifo;
 	gops->gr_ctx = gv100_ops.gr_ctx;
+	gops->mm = gv100_ops.mm;
 	gops->fecs_trace = gv100_ops.fecs_trace;
 	gops->pramin = gv100_ops.pramin;
 	gops->therm = gv100_ops.therm;
-- 
cgit v1.2.2


From 866165749a0b7b2e6b219bb26bffd69d790d97c5 Mon Sep 17 00:00:00 2001
From: Sunny He <suhe@nvidia.com>
Date: Thu, 17 Aug 2017 16:10:42 -0700
Subject: gpu: nvgpu: Reorg gr HAL initialization

Reorganize HAL initialization to remove inheritance and construct
the gpu_ops struct at compile time. This patch only covers the
gr sub-module of the gpu_ops struct.

Perform HAL function assignments in hal_gxxxx.c through the
population of a chip-specific copy of gpu_ops.

Jira NVGPU-74

Change-Id: I8feaa95a9830969221f7ac70a5ef61cdf25094c3
Signed-off-by: Sunny He <suhe@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1542988
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 149 +++++++++++++++++++++++++++++++++++-
 1 file changed, 147 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index e3c2d1cb..4f21e433 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -33,6 +33,7 @@
 #include "gk20a/fb_gk20a.h"
 #include "gk20a/mm_gk20a.h"
 #include "gk20a/pmu_gk20a.h"
+#include "gk20a/gr_gk20a.h"
 
 #include "gm20b/ltc_gm20b.h"
 #include "gm20b/gr_gm20b.h"
@@ -43,6 +44,7 @@
 #include "gm20b/acr_gm20b.h"
 
 #include "gp10b/fb_gp10b.h"
+#include "gp10b/gr_gp10b.h"
 
 #include "gp106/clk_gp106.h"
 #include "gp106/clk_arb_gp106.h"
@@ -215,6 +217,150 @@ static const struct gpu_ops gv100_ops = {
 		.isr_nonstall = gp10b_ce_nonstall_isr,
 		.get_num_pce = gv11b_ce_get_num_pce,
 	},
+	.gr = {
+		.init_gpc_mmu = gr_gv11b_init_gpc_mmu,
+		.bundle_cb_defaults = gr_gv11b_bundle_cb_defaults,
+		.cb_size_default = gr_gv11b_cb_size_default,
+		.calc_global_ctx_buffer_size =
+			gr_gv11b_calc_global_ctx_buffer_size,
+		.commit_global_attrib_cb = gr_gv11b_commit_global_attrib_cb,
+		.commit_global_bundle_cb = gr_gp10b_commit_global_bundle_cb,
+		.commit_global_cb_manager = gr_gp10b_commit_global_cb_manager,
+		.commit_global_pagepool = gr_gp10b_commit_global_pagepool,
+		.handle_sw_method = gr_gv11b_handle_sw_method,
+		.set_alpha_circular_buffer_size =
+			gr_gv11b_set_alpha_circular_buffer_size,
+		.set_circular_buffer_size = gr_gv11b_set_circular_buffer_size,
+		.enable_hww_exceptions = gr_gv11b_enable_hww_exceptions,
+		.is_valid_class = gr_gv11b_is_valid_class,
+		.is_valid_gfx_class = gr_gv11b_is_valid_gfx_class,
+		.is_valid_compute_class = gr_gv11b_is_valid_compute_class,
+		.get_sm_dsm_perf_regs = gv11b_gr_get_sm_dsm_perf_regs,
+		.get_sm_dsm_perf_ctrl_regs = gv11b_gr_get_sm_dsm_perf_ctrl_regs,
+		.init_fs_state = gr_gv11b_init_fs_state,
+		.set_hww_esr_report_mask = gv11b_gr_set_hww_esr_report_mask,
+		.falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments,
+		.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode,
+		.set_gpc_tpc_mask = gr_gv11b_set_gpc_tpc_mask,
+		.get_gpc_tpc_mask = gr_gm20b_get_gpc_tpc_mask,
+		.free_channel_ctx = gk20a_free_channel_ctx,
+		.alloc_obj_ctx = gk20a_alloc_obj_ctx,
+		.bind_ctxsw_zcull = gr_gk20a_bind_ctxsw_zcull,
+		.get_zcull_info = gr_gk20a_get_zcull_info,
+		.is_tpc_addr = gr_gm20b_is_tpc_addr,
+		.get_tpc_num = gr_gm20b_get_tpc_num,
+		.detect_sm_arch = gr_gv11b_detect_sm_arch,
+		.add_zbc_color = gr_gp10b_add_zbc_color,
+		.add_zbc_depth = gr_gp10b_add_zbc_depth,
+		.zbc_set_table = gk20a_gr_zbc_set_table,
+		.zbc_query_table = gr_gk20a_query_zbc,
+		.pmu_save_zbc = gk20a_pmu_save_zbc,
+		.add_zbc = gr_gk20a_add_zbc,
+		.pagepool_default_size = gr_gv11b_pagepool_default_size,
+		.init_ctx_state = gr_gp10b_init_ctx_state,
+		.alloc_gr_ctx = gr_gp10b_alloc_gr_ctx,
+		.free_gr_ctx = gr_gp10b_free_gr_ctx,
+		.update_ctxsw_preemption_mode =
+			gr_gp10b_update_ctxsw_preemption_mode,
+		.dump_gr_regs = gr_gv11b_dump_gr_status_regs,
+		.update_pc_sampling = gr_gm20b_update_pc_sampling,
+		.get_fbp_en_mask = gr_gm20b_get_fbp_en_mask,
+		.get_max_ltc_per_fbp = gr_gm20b_get_max_ltc_per_fbp,
+		.get_max_lts_per_ltc = gr_gm20b_get_max_lts_per_ltc,
+		.get_rop_l2_en_mask = gr_gm20b_rop_l2_en_mask,
+		.get_max_fbps_count = gr_gm20b_get_max_fbps_count,
+		.init_sm_dsm_reg_info = gv11b_gr_init_sm_dsm_reg_info,
+		.wait_empty = gr_gv11b_wait_empty,
+		.init_cyclestats = gr_gv11b_init_cyclestats,
+		.set_sm_debug_mode = gv11b_gr_set_sm_debug_mode,
+		.enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs,
+		.bpt_reg_info = gv11b_gr_bpt_reg_info,
+		.get_access_map = gr_gv11b_get_access_map,
+		.handle_fecs_error = gr_gv11b_handle_fecs_error,
+		.handle_sm_exception = gr_gk20a_handle_sm_exception,
+		.handle_tex_exception = gr_gv11b_handle_tex_exception,
+		.enable_gpc_exceptions = gr_gv11b_enable_gpc_exceptions,
+		.enable_exceptions = gr_gv11b_enable_exceptions,
+		.get_lrf_tex_ltc_dram_override = get_ecc_override_val,
+		.update_smpc_ctxsw_mode = gr_gk20a_update_smpc_ctxsw_mode,
+		.update_hwpm_ctxsw_mode = gr_gk20a_update_hwpm_ctxsw_mode,
+		.record_sm_error_state = gv11b_gr_record_sm_error_state,
+		.update_sm_error_state = gv11b_gr_update_sm_error_state,
+		.clear_sm_error_state = gm20b_gr_clear_sm_error_state,
+		.suspend_contexts = gr_gp10b_suspend_contexts,
+		.resume_contexts = gr_gk20a_resume_contexts,
+		.get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
+		.fuse_override = gp10b_gr_fuse_override,
+		.init_sm_id_table = gr_gv11b_init_sm_id_table,
+		.load_smid_config = gr_gv11b_load_smid_config,
+		.program_sm_id_numbering = gr_gv11b_program_sm_id_numbering,
+		.is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr,
+		.is_ltcn_ltss_addr = gr_gm20b_is_ltcn_ltss_addr,
+		.split_lts_broadcast_addr = gr_gm20b_split_lts_broadcast_addr,
+		.split_ltc_broadcast_addr = gr_gm20b_split_ltc_broadcast_addr,
+		.setup_rop_mapping = gr_gv11b_setup_rop_mapping,
+		.program_zcull_mapping = gr_gv11b_program_zcull_mapping,
+		.commit_global_timeslice = gr_gv11b_commit_global_timeslice,
+		.commit_inst = gr_gv11b_commit_inst,
+		.write_zcull_ptr = gr_gv11b_write_zcull_ptr,
+		.write_pm_ptr = gr_gv11b_write_pm_ptr,
+		.init_elcg_mode = gr_gv11b_init_elcg_mode,
+		.load_tpc_mask = gr_gv11b_load_tpc_mask,
+		.inval_icache = gr_gk20a_inval_icache,
+		.trigger_suspend = gv11b_gr_sm_trigger_suspend,
+		.wait_for_pause = gr_gk20a_wait_for_pause,
+		.resume_from_pause = gv11b_gr_resume_from_pause,
+		.clear_sm_errors = gr_gk20a_clear_sm_errors,
+		.tpc_enabled_exceptions = gr_gk20a_tpc_enabled_exceptions,
+		.get_esr_sm_sel = gv11b_gr_get_esr_sm_sel,
+		.sm_debugger_attached = gv11b_gr_sm_debugger_attached,
+		.suspend_single_sm = gv11b_gr_suspend_single_sm,
+		.suspend_all_sms = gv11b_gr_suspend_all_sms,
+		.resume_single_sm = gv11b_gr_resume_single_sm,
+		.resume_all_sms = gv11b_gr_resume_all_sms,
+		.get_sm_hww_warp_esr = gv11b_gr_get_sm_hww_warp_esr,
+		.get_sm_hww_global_esr = gv11b_gr_get_sm_hww_global_esr,
+		.get_sm_no_lock_down_hww_global_esr_mask =
+			gv11b_gr_get_sm_no_lock_down_hww_global_esr_mask,
+		.lock_down_sm = gv11b_gr_lock_down_sm,
+		.wait_for_sm_lock_down = gv11b_gr_wait_for_sm_lock_down,
+		.clear_sm_hww = gv11b_gr_clear_sm_hww,
+		.init_ovr_sm_dsm_perf =  gv11b_gr_init_ovr_sm_dsm_perf,
+		.get_ovr_perf_regs = gv11b_gr_get_ovr_perf_regs,
+		.disable_rd_coalesce = gm20a_gr_disable_rd_coalesce,
+		.set_boosted_ctx = gr_gp10b_set_boosted_ctx,
+		.set_preemption_mode = gr_gp10b_set_preemption_mode,
+		.set_czf_bypass = NULL,
+		.pre_process_sm_exception = gr_gv11b_pre_process_sm_exception,
+		.set_preemption_buffer_va = gr_gv11b_set_preemption_buffer_va,
+		.init_preemption_state = NULL,
+		.update_boosted_ctx = gr_gp10b_update_boosted_ctx,
+		.set_bes_crop_debug3 = gr_gp10b_set_bes_crop_debug3,
+		.create_gr_sysfs = gr_gv11b_create_sysfs,
+		.set_ctxsw_preemption_mode = gr_gp10b_set_ctxsw_preemption_mode,
+		.is_etpc_addr = gv11b_gr_pri_is_etpc_addr,
+		.egpc_etpc_priv_addr_table = gv11b_gr_egpc_etpc_priv_addr_table,
+		.handle_tpc_mpc_exception = gr_gv11b_handle_tpc_mpc_exception,
+		.zbc_s_query_table = gr_gv11b_zbc_s_query_table,
+		.load_zbc_s_default_tbl = gr_gv11b_load_stencil_default_tbl,
+		.restore_context_header = gv11b_restore_context_header,
+		.handle_gpc_gpcmmu_exception =
+			gr_gv11b_handle_gpc_gpcmmu_exception,
+		.add_zbc_type_s = gr_gv11b_add_zbc_type_s,
+		.get_egpc_base = gv11b_gr_get_egpc_base,
+		.get_egpc_etpc_num = gv11b_gr_get_egpc_etpc_num,
+		.handle_gpc_gpccs_exception =
+			gr_gv11b_handle_gpc_gpccs_exception,
+		.load_zbc_s_tbl = gr_gv11b_load_stencil_tbl,
+		.access_smpc_reg = gv11b_gr_access_smpc_reg,
+		.is_egpc_addr = gv11b_gr_pri_is_egpc_addr,
+		.add_zbc_s = gr_gv11b_add_zbc_stencil,
+		.handle_gcc_exception = gr_gv11b_handle_gcc_exception,
+		.init_sw_veid_bundle = gr_gv11b_init_sw_veid_bundle,
+		.handle_tpc_sm_ecc_exception =
+			gr_gv11b_handle_tpc_sm_ecc_exception,
+		.decode_egpc_addr = gv11b_gr_decode_egpc_addr,
+	},
 	.fb = {
 		.reset = gv100_fb_reset,
 		.init_hw = gk20a_fb_init_hw,
@@ -483,6 +629,7 @@ int gv100_init_hal(struct gk20a *g)
 
 	gops->ltc = gv100_ops.ltc;
 	gops->ce2 = gv100_ops.ce2;
+	gops->gr = gv100_ops.gr;
 	gops->fb = gv100_ops.fb;
 	gops->clock_gating = gv100_ops.clock_gating;
 	gops->fifo = gv100_ops.fifo;
@@ -525,8 +672,6 @@ int gv100_init_hal(struct gk20a *g)
 	g->pmu_lsf_pmu_wpr_init_done = 0;
 	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
 
-	gv11b_init_gr(g);
-
 	gv11b_init_uncompressed_kind_map();
 	gv11b_init_kind_attr();
 
-- 
cgit v1.2.2


From f98e3c8348d20b6542c4d27921cb9f9822aaa17a Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Wed, 6 Sep 2017 14:45:30 -0700
Subject: gpu: nvgpu: gv100: Don't assign XVE sw_init

XVE sw_init HAL is removed due to moving XVE debugfs code to
Linux module. Remove the assignment of the HAL.

Change-Id: I90beada58f87c78dc752011ea3ec2a5473f0acc1
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1553913
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Alex Waterman <alexw@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 -
 1 file changed, 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 4f21e433..cd121455 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -597,7 +597,6 @@ static const struct gpu_ops gv100_ops = {
 	},
 #endif
 	.xve = {
-		.sw_init          = xve_sw_init_gp106,
 		.get_speed        = xve_get_speed_gp106,
 		.set_speed        = xve_set_speed_gp106,
 		.available_speeds = xve_available_speeds_gp106,
-- 
cgit v1.2.2


From 52f50addc6cedf57fc3d8ff06314921499fb59e3 Mon Sep 17 00:00:00 2001
From: Deepak Nibade <dnibade@nvidia.com>
Date: Wed, 13 Sep 2017 17:35:03 +0530
Subject: gpu: nvgpu: add TSG enable/disable operations

Add TSG enable/disable operations for gv11b/gv100

To disable a TSG we continue to use gk20a_disable_tsg()

To enable a TSG, add a new API gv11b_fifo_enable_tsg(), since the TSG enable
sequence is different for Volta than for previous versions.
For Volta it is sufficient to loop over all the channels in the TSG and enable
them sequentially.

Bug 1739362

Change-Id: Id4b4684959204c6101ceda83487a41fbfcba8b5f
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1560642
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: Seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index cd121455..cc20fa43 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -397,6 +397,8 @@ static const struct gpu_ops gv100_ops = {
 		.pbdma_acquire_val = gk20a_fifo_pbdma_acquire_val,
 		.preempt_channel = gv11b_fifo_preempt_channel,
 		.preempt_tsg = gv11b_fifo_preempt_tsg,
+		.enable_tsg = gv11b_fifo_enable_tsg,
+		.disable_tsg = gk20a_disable_tsg,
 		.update_runlist = gk20a_fifo_update_runlist,
 		.trigger_mmu_fault = NULL,
 		.get_mmu_fault_info = NULL,
-- 
cgit v1.2.2


From f720b309f1ea87a301bcb216983396f3d9c55abc Mon Sep 17 00:00:00 2001
From: Deepak Nibade <dnibade@nvidia.com>
Date: Thu, 14 Sep 2017 05:48:07 -0700
Subject: gpu: nvgpu: add tsg_verify_status_faulted operation

Add new API gv11b_fifo_tsg_verify_status_faulted() and use that as
g->ops.fifo.tsg_verify_status_faulted operation for gv11b/gv100

This API checks whether the channel has ENG_FAULTED status set. If it does, the
API clears the CE method buffer in case the saved-out channel is the same as
the faulted channel. We need to write 0 to the method count to invalidate the
CE method buffer.

Also set g->ops.fifo.tsg_verify_status_ctx_reload operation for gv11b/gv100

Bug 200327095

Change-Id: I9d2b0f13faf881b30680219bbcadfd4969c4dff6
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1560643
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index cc20fa43..9a2807a2 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -399,6 +399,8 @@ static const struct gpu_ops gv100_ops = {
 		.preempt_tsg = gv11b_fifo_preempt_tsg,
 		.enable_tsg = gv11b_fifo_enable_tsg,
 		.disable_tsg = gk20a_disable_tsg,
+		.tsg_verify_status_ctx_reload = gm20b_fifo_tsg_verify_status_ctx_reload,
+		.tsg_verify_status_faulted = gv11b_fifo_tsg_verify_status_faulted,
 		.update_runlist = gk20a_fifo_update_runlist,
 		.trigger_mmu_fault = NULL,
 		.get_mmu_fault_info = NULL,
-- 
cgit v1.2.2


From 0a0da216db25e293c68b5c9c6fa88e559368dce2 Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Tue, 19 Sep 2017 12:12:49 -0700
Subject: gpu: nvgpu: Use VBIOS HAL from gp106 instead of gm206

Use VBIOS HAL from gp106 instead of gm206.

JIRA NVGPU-218

Change-Id: I835a1ce39818221f976ed5eca2bf3032317760b0
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1563741
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 9a2807a2..23ada798 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -51,7 +51,7 @@
 #include "gp106/pmu_gp106.h"
 #include "gp106/acr_gp106.h"
 #include "gp106/sec2_gp106.h"
-#include "gm206/bios_gm206.h"
+#include "gp106/bios_gp106.h"
 #include "gp106/therm_gp106.h"
 #include "gp106/xve_gp106.h"
 #include "gp106/clk_gp106.h"
@@ -622,7 +622,7 @@ static const struct gpu_ops gv100_ops = {
 	},
 	.chip_init_gpu_characteristics = gv100_init_gpu_characteristics,
 	.get_litter_value = gv100_get_litter_value,
-	.bios_init = gm206_bios_init,
+	.bios_init = gp106_bios_init,
 };
 
 int gv100_init_hal(struct gk20a *g)
-- 
cgit v1.2.2


From a24382d09788ffc8f8688a473a38d37df589b131 Mon Sep 17 00:00:00 2001
From: Mahantesh Kumbar <mkumbar@nvidia.com>
Date: Wed, 20 Sep 2017 22:34:54 +0530
Subject: gpu: nvgpu: Add support for WPR info read from FB

Update the .read_wpr_info HAL of gv11b & gv100
to point to gm20b_fb_read_wpr_info().

JIRA NVGPU-128

Change-Id: I5ece4c72dbe0f9e7827888e2a15d8b7dda6fcb42
Signed-off-by: Mahantesh Kumbar <mkumbar@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1564684
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Vijayakumar Subbu <vsubbu@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 23ada798..3dfe9e74 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -373,6 +373,7 @@ static const struct gpu_ops gv100_ops = {
 		.compressible_page_size = gp10b_fb_compressible_page_size,
 		.vpr_info_fetch = gm20b_fb_vpr_info_fetch,
 		.dump_vpr_wpr_info = gm20b_fb_dump_vpr_wpr_info,
+		.read_wpr_info = gm20b_fb_read_wpr_info,
 		.is_debug_mode_enabled = gm20b_fb_debug_mode_enabled,
 		.set_debug_mode = gm20b_fb_set_debug_mode,
 		.tlb_invalidate = gk20a_fb_tlb_invalidate,
-- 
cgit v1.2.2


From 4d5216922b288a70f7434ac8f7c6c8274cc1462b Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Thu, 21 Sep 2017 09:09:24 -0700
Subject: gpu: nvgpu: fix coverity issues in GV100 HAL

Fix value overwrite in switch statement on GV100 proj assignments

bug 200291879

Change-Id: Id25f811f820a05b3d50cc9070369fe52f65a6bf3
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1565538
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 3dfe9e74..8cf8e245 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -138,6 +138,7 @@ static int gv100_get_litter_value(struct gk20a *g, int value)
 		break;
 	case GPU_LIT_PPC_IN_GPC_BASE:
 		ret = proj_ppc_in_gpc_base_v();
+		break;
 	case GPU_LIT_PPC_IN_GPC_STRIDE:
 		ret = proj_ppc_in_gpc_stride_v();
 		break;
-- 
cgit v1.2.2


From d61643c0200983dc340d37962bb0a3ca900a3e97 Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Mon, 25 Sep 2017 08:59:28 -0700
Subject: gpu: nvgpu: gv11b: Change license for common files to MIT

Change license of OS independent source code files to MIT.

JIRA NVGPU-218

Change-Id: I93c0504f0544ee8ced4898c386b3f5fbaa6a99a9
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1567804
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: David Martinez Nieto <dmartineznie@nvidia.com>
Reviewed-by: Seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
GVS: Gerrit_Virtual_Submit
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 23 ++++++++++++++++-------
 1 file changed, 16 insertions(+), 7 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 8cf8e245..caa43a95 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -3,14 +3,23 @@
  *
  * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
  *
- * This program is free software; you can redistribute it and/or modify it
- * under the terms and conditions of the GNU General Public License,
- * version 2, as published by the Free Software Foundation.
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
  *
- * This program is distributed in the hope it will be useful, but WITHOUT
- * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
- * more details.
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
  */
 
 #include <linux/types.h>
-- 
cgit v1.2.2


From 058485d28538b033636180c11592a9088878c807 Mon Sep 17 00:00:00 2001
From: seshendra Gadagottu <sgadagottu@nvidia.com>
Date: Wed, 27 Sep 2017 14:15:02 -0700
Subject: gpu: nvgpu: gv100: disable ctxsw trace

ctxsw_trace needs modifications to work with subcontext.
Disable it for the time being.

Change-Id: I0f0e3d0653e159dca09c40c8d0b4c46643cd0496
Signed-off-by: seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1569629
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: David Martinez Nieto <dmartineznie@nvidia.com>
Tested-by: David Martinez Nieto <dmartineznie@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 28 ++++++++++++++--------------
 1 file changed, 14 insertions(+), 14 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index caa43a95..c9b9a1ca 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -465,20 +465,20 @@ static const struct gpu_ops gv100_ops = {
 	},
 #ifdef CONFIG_GK20A_CTXSW_TRACE
 	.fecs_trace = {
-		.alloc_user_buffer = gk20a_ctxsw_dev_ring_alloc,
-		.free_user_buffer = gk20a_ctxsw_dev_ring_free,
-		.mmap_user_buffer = gk20a_ctxsw_dev_mmap_buffer,
-		.init = gk20a_fecs_trace_init,
-		.deinit = gk20a_fecs_trace_deinit,
-		.enable = gk20a_fecs_trace_enable,
-		.disable = gk20a_fecs_trace_disable,
-		.is_enabled = gk20a_fecs_trace_is_enabled,
-		.reset = gk20a_fecs_trace_reset,
-		.flush = gp10b_fecs_trace_flush,
-		.poll = gk20a_fecs_trace_poll,
-		.bind_channel = gk20a_fecs_trace_bind_channel,
-		.unbind_channel = gk20a_fecs_trace_unbind_channel,
-		.max_entries = gk20a_gr_max_entries,
+		.alloc_user_buffer = NULL,
+		.free_user_buffer = NULL,
+		.mmap_user_buffer = NULL,
+		.init = NULL,
+		.deinit = NULL,
+		.enable = NULL,
+		.disable = NULL,
+		.is_enabled = NULL,
+		.reset = NULL,
+		.flush = NULL,
+		.poll = NULL,
+		.bind_channel = NULL,
+		.unbind_channel = NULL,
+		.max_entries = NULL,
 	},
 #endif /* CONFIG_GK20A_CTXSW_TRACE */
 	.mm = {
-- 
cgit v1.2.2


From dc5edb1417390b583b5ff2406e554ce0770e02ae Mon Sep 17 00:00:00 2001
From: Alex Waterman <alexw@nvidia.com>
Date: Wed, 16 Aug 2017 16:13:18 -0700
Subject: gpu: nvgpu: rename ops.mm.get_physical_addr_bits

T19x/gv100 version of same patch in kernel/nvgpu.

Change-Id: I7174864cf1e072af61609c0843da16fcafe54c02
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1566750
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 -
 1 file changed, 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index c9b9a1ca..72864c5f 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -494,7 +494,6 @@ static const struct gpu_ops gv100_ops = {
 		.get_big_page_sizes = gm20b_mm_get_big_page_sizes,
 		.get_default_big_page_size = gp10b_mm_get_default_big_page_size,
 		.gpu_phys_addr = gv11b_gpu_phys_addr,
-		.get_physical_addr_bits = NULL,
 		.get_mmu_levels = gp10b_mm_get_mmu_levels,
 		.get_vidmem_size = gv100_mm_get_vidmem_size,
 		.init_pdb = gp10b_mm_init_pdb,
-- 
cgit v1.2.2


From 19d602da31f81d9dc89a42b2bc84ce14a300773b Mon Sep 17 00:00:00 2001
From: Deepak Nibade <dnibade@nvidia.com>
Date: Tue, 3 Oct 2017 14:01:51 +0530
Subject: gpu: nvgpu: verify channel status while closing per-platform

We currently call gk20a_fifo_tsg_unbind_channel_verify_status() to verify
channel status when unbinding a channel from its TSG during close.

Add support for doing this verification per-platform, and keep it disabled
for vgpu platforms.

Bug 200327095

Change-Id: I6e2a6a09c784d24ac49477d5450b7d4b671878e3
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1572369
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 72864c5f..028c9d84 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -410,6 +410,7 @@ static const struct gpu_ops gv100_ops = {
 		.preempt_tsg = gv11b_fifo_preempt_tsg,
 		.enable_tsg = gv11b_fifo_enable_tsg,
 		.disable_tsg = gk20a_disable_tsg,
+		.tsg_verify_channel_status = gk20a_fifo_tsg_unbind_channel_verify_status,
 		.tsg_verify_status_ctx_reload = gm20b_fifo_tsg_verify_status_ctx_reload,
 		.tsg_verify_status_faulted = gv11b_fifo_tsg_verify_status_faulted,
 		.update_runlist = gk20a_fifo_update_runlist,
-- 
cgit v1.2.2


From f518304e0d8102216c7c0022cd4b66fcd844264c Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Thu, 3 Aug 2017 21:43:50 -0700
Subject: gpu: nvgpu: fix GV100 hal definitions

These changes allow GV100 to init the basic HALs to pass
nvgpu_submit_twod

(1) Allocate fault buffer from vidmem instead of sysmem to prevent coherency
issues
(2) Properly enable FB
(3) Fan control requires the execution of the pre-OS FW; without it the SKU201
is extremely noisy

 JIRA: NVGPUGV100-9

Change-Id: I9b2072737e45432f957e7faae6d33bc0ab43b817
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1539926
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: svccoveritychecker <svccoveritychecker@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 22 ++++++++++++++++------
 1 file changed, 16 insertions(+), 6 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 028c9d84..7f7ab785 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -61,6 +61,7 @@
 #include "gp106/acr_gp106.h"
 #include "gp106/sec2_gp106.h"
 #include "gp106/bios_gp106.h"
+#include "gv100/bios_gv100.h"
 #include "gp106/therm_gp106.h"
 #include "gp106/xve_gp106.h"
 #include "gp106/clk_gp106.h"
@@ -85,6 +86,10 @@
 #include "gv11b/mm_gv11b.h"
 #include "gv11b/pmu_gv11b.h"
 #include "gv11b/fb_gv11b.h"
+#include "gv100/mm_gv100.h"
+#include "gv11b/pmu_gv11b.h"
+#include "gv100/fb_gv100.h"
+#include "gv100/fifo_gv100.h"
 #include "gv11b/fifo_gv11b.h"
 #include "gv11b/gv11b_gating_reglist.h"
 #include "gv11b/regops_gv11b.h"
@@ -208,6 +213,11 @@ int gv100_init_gpu_characteristics(struct gk20a *g)
 
 
 static const struct gpu_ops gv100_ops = {
+	.bios = {
+		.init = gp106_bios_init,
+		.preos_wait_for_halt = gv100_bios_preos_wait_for_halt,
+		.preos_reload_check = gv100_bios_preos_reload_check,
+	},
 	.ltc = {
 		.determine_L2_size_bytes = gp10b_determine_L2_size_bytes,
 		.set_zbc_s_entry = gv11b_ltc_set_zbc_stencil_entry,
@@ -218,7 +228,7 @@ static const struct gpu_ops gv100_ops = {
 		.init_comptags = gp10b_ltc_init_comptags,
 		.cbc_ctrl = gm20b_ltc_cbc_ctrl,
 		.isr = gv11b_ltc_isr,
-		.cbc_fix_config = gv11b_ltc_cbc_fix_config,
+		.cbc_fix_config = NULL,
 		.flush = gm20b_flush_ltc,
 		.set_enabled = gp10b_ltc_set_enabled,
 	},
@@ -374,8 +384,7 @@ static const struct gpu_ops gv100_ops = {
 	.fb = {
 		.reset = gv100_fb_reset,
 		.init_hw = gk20a_fb_init_hw,
-		.init_fs_state = gv11b_fb_init_fs_state,
-		.init_cbc = gv11b_fb_init_cbc,
+		.init_fs_state = NULL,
 		.set_mmu_page_size = gm20b_fb_set_mmu_page_size,
 		.set_use_full_comp_tag_line =
 			gm20b_fb_set_use_full_comp_tag_line,
@@ -417,7 +426,7 @@ static const struct gpu_ops gv100_ops = {
 		.trigger_mmu_fault = NULL,
 		.get_mmu_fault_info = NULL,
 		.wait_engine_idle = gk20a_fifo_wait_engine_idle,
-		.get_num_fifos = gv11b_fifo_get_num_fifos,
+		.get_num_fifos = gv100_fifo_get_num_fifos,
 		.get_pbdma_signature = gp10b_fifo_get_pbdma_signature,
 		.set_runlist_interleave = gk20a_fifo_set_runlist_interleave,
 		.tsg_set_timeslice = gk20a_fifo_tsg_set_timeslice,
@@ -633,7 +642,6 @@ static const struct gpu_ops gv100_ops = {
 	},
 	.chip_init_gpu_characteristics = gv100_init_gpu_characteristics,
 	.get_litter_value = gv100_get_litter_value,
-	.bios_init = gp106_bios_init,
 };
 
 int gv100_init_hal(struct gk20a *g)
@@ -641,6 +649,7 @@ int gv100_init_hal(struct gk20a *g)
 	struct gpu_ops *gops = &g->ops;
 	struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics;
 
+	gops->bios = gv100_ops.bios;
 	gops->ltc = gv100_ops.ltc;
 	gops->ce2 = gv100_ops.ce2;
 	gops->gr = gv100_ops.gr;
@@ -674,7 +683,6 @@ int gv100_init_hal(struct gk20a *g)
 	gops->chip_init_gpu_characteristics =
 		gv100_ops.chip_init_gpu_characteristics;
 	gops->get_litter_value = gv100_ops.get_litter_value;
-	gops->bios_init = gv100_ops.bios_init;
 
 	__nvgpu_set_enabled(g, NVGPU_GR_USE_DMA_FOR_FW_BOOTSTRAP, true);
 	__nvgpu_set_enabled(g, NVGPU_SEC_PRIVSECURITY, true);
@@ -689,6 +697,8 @@ int gv100_init_hal(struct gk20a *g)
 	gv11b_init_uncompressed_kind_map();
 	gv11b_init_kind_attr();
 
+	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
+
 	g->name = "gv10x";
 
 	c->twod_class = FERMI_TWOD_A;
-- 
cgit v1.2.2


From e78cd6c42aec3ae18f12420fd8eb4cb58d09da2d Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Thu, 12 Oct 2017 11:35:32 -0700
Subject: gpu: nvgpu: add missing hal defines

Due to a lack of GVS coverage, some defines were left out of GV100. This change
adds them back.

JIRA: NVGPUGV100-9

Change-Id: I2f5778529dcad535bb56c33c38c097415dbf11e5
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1577998
Reviewed-by: Automatic_Commit_Validation_User
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: Seshendra Gadagottu <sgadagottu@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Nirav Patel <nipatel@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 36 +++++++++++++++++++++++++++++++-----
 1 file changed, 31 insertions(+), 5 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 7f7ab785..7457c185 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -91,6 +91,8 @@
 #include "gv100/fb_gv100.h"
 #include "gv100/fifo_gv100.h"
 #include "gv11b/fifo_gv11b.h"
+#include "gv11b/regops_gv11b.h"
+
 #include "gv11b/gv11b_gating_reglist.h"
 #include "gv11b/regops_gv11b.h"
 #include "gv11b/subctx_gv11b.h"
@@ -100,6 +102,7 @@
 #include "gv100/fb_gv100.h"
 #include "gv100/mm_gv100.h"
 
+#include <nvgpu/bus.h>
 #include <nvgpu/debug.h>
 #include <nvgpu/enabled.h>
 
@@ -156,6 +159,9 @@ static int gv100_get_litter_value(struct gk20a *g, int value)
 	case GPU_LIT_PPC_IN_GPC_STRIDE:
 		ret = proj_ppc_in_gpc_stride_v();
 		break;
+	case GPU_LIT_PPC_IN_GPC_SHARED_BASE:
+		ret = proj_ppc_in_gpc_shared_base_v();
+		break;
 	case GPU_LIT_ROP_BASE:
 		ret = proj_rop_base_v();
 		break;
@@ -180,13 +186,30 @@ static int gv100_get_litter_value(struct gk20a *g, int value)
 	case GPU_LIT_NUM_FBPAS:
 		ret = proj_scal_litter_num_fbpas_v();
 		break;
+	case GPU_LIT_FBPA_SHARED_BASE:
+		ret = proj_fbpa_shared_base_v();
+		break;
+	case GPU_LIT_FBPA_BASE:
+		ret = proj_fbpa_base_v();
+		break;
 	case GPU_LIT_FBPA_STRIDE:
 		ret = proj_fbpa_stride_v();
 		break;
 	case GPU_LIT_SM_PRI_STRIDE:
 		ret = proj_sm_stride_v();
 		break;
-
+	case GPU_LIT_SMPC_PRI_BASE:
+		ret = proj_smpc_base_v();
+		break;
+	case GPU_LIT_SMPC_PRI_SHARED_BASE:
+		ret = proj_smpc_shared_base_v();
+		break;
+	case GPU_LIT_SMPC_PRI_UNIQUE_BASE:
+		ret = proj_smpc_unique_base_v();
+		break;
+	case GPU_LIT_SMPC_PRI_STRIDE:
+		ret = proj_smpc_stride_v();
+		break;
 	default:
 		break;
 	}
@@ -553,12 +576,10 @@ static const struct gpu_ops gv100_ops = {
 		.pmu_get_queue_tail_size = pwr_pmu_queue_tail__size_1_v,
 		.pmu_pg_init_param = gp106_pg_param_init,
 		.reset_engine = gp106_pmu_engine_reset,
-		.pmu_lpwr_disable_pg = nvgpu_lpwr_disable_pg,
 		.write_dmatrfbase = gp10b_write_dmatrfbase,
 		.pmu_mutex_size = pwr_pmu_mutex__size_1_v,
 		.is_engine_in_reset = gp106_pmu_is_engine_in_reset,
 		.pmu_get_queue_tail = pwr_pmu_queue_tail_r,
-		.pmu_lpwr_enable_pg = nvgpu_lpwr_enable_pg,
 	},
 	.clk = {
 		.init_clk_support = gp106_init_clk_support,
@@ -572,6 +593,9 @@ static const struct gpu_ops gv100_ops = {
 		.get_arbiter_clk_default = gp106_get_arbiter_clk_default,
 		.get_current_pstate = nvgpu_clk_arb_get_current_pstate,
 	},
+	.regops = {
+		.apply_smpc_war = gv11b_apply_smpc_war,
+	},
 	.mc = {
 		.intr_enable = mc_gv11b_intr_enable,
 		.intr_unit_config = mc_gp10b_intr_unit_config,
@@ -601,13 +625,14 @@ static const struct gpu_ops gv100_ops = {
 			nvgpu_check_and_set_context_reservation,
 		.release_profiler_reservation =
 			nvgpu_release_profiler_reservation,
-		.perfbuffer_enable = gk20a_perfbuf_enable_locked,
-		.perfbuffer_disable = gk20a_perfbuf_disable_locked,
+		.perfbuffer_enable = NULL,
+		.perfbuffer_disable = NULL,
 	},
 	.bus = {
 		.init_hw = gk20a_bus_init_hw,
 		.isr = gk20a_bus_isr,
 		.read_ptimer = gk20a_read_ptimer,
+		.get_timestamps_zipper = nvgpu_get_timestamps_zipper,
 		.bar1_bind = NULL,
 	},
 #if defined(CONFIG_GK20A_CYCLE_STATS)
@@ -662,6 +687,7 @@ int gv100_init_hal(struct gk20a *g)
 	gops->pramin = gv100_ops.pramin;
 	gops->therm = gv100_ops.therm;
 	gops->pmu = gv100_ops.pmu;
+	gops->regops = gv100_ops.regops;
 	gops->mc = gv100_ops.mc;
 	gops->debug = gv100_ops.debug;
 	gops->dbg_session_ops = gv100_ops.dbg_session_ops;
-- 
cgit v1.2.2


From 201ccbfa8503daee9562a22f50a5b626fe4cc6a1 Mon Sep 17 00:00:00 2001
From: seshendra Gadagottu <sgadagottu@nvidia.com>
Date: Mon, 16 Oct 2017 12:14:29 -0700
Subject: gpu: nvgpu: gv11b: update dbg ops

Updated the following HAL functions for gv11b and reused
them for gv100:
perfbuffer_enable
perfbuffer_disable

These changes are needed for the following reasons:
1. Register offsets for perf_pmasys_* are changed
   for gv11b/gv100 from gk20a.
2. Updated memory type for perf_pmasys_mem_block_target
   to sys_ncoh_f().

Bug 200327596

Change-Id: Ia672ac561917c8ed36caea9cc7e74b7fc7ce8188
Signed-off-by: seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1571074
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 7457c185..2ece7be8 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -76,6 +76,7 @@
 #include "gp10b/mm_gp10b.h"
 #include "gp10b/pmu_gp10b.h"
 
+#include "gv11b/dbg_gpu_gv11b.h"
 #include "gv11b/hal_gv11b.h"
 #include "gv11b/gr_gv11b.h"
 #include "gv11b/mc_gv11b.h"
@@ -625,8 +626,8 @@ static const struct gpu_ops gv100_ops = {
 			nvgpu_check_and_set_context_reservation,
 		.release_profiler_reservation =
 			nvgpu_release_profiler_reservation,
-		.perfbuffer_enable = NULL,
-		.perfbuffer_disable = NULL,
+		.perfbuffer_enable = gv11b_perfbuf_enable_locked,
+		.perfbuffer_disable = gv11b_perfbuf_disable_locked,
 	},
 	.bus = {
 		.init_hw = gk20a_bus_init_hw,
-- 
cgit v1.2.2


From 62e133029d5a89e07e3ba5e96475c0960c0bc3dd Mon Sep 17 00:00:00 2001
From: Alex Waterman <alexw@nvidia.com>
Date: Mon, 16 Oct 2017 12:38:46 -0700
Subject: gpu: nvgpu: Refactoring nvgpu_vm functions

Change required for equivalent change on nvgpu. This is required
since a few HALs were added that must be populated for all chips.

This patch adds those HAL definitions for gv11b, gv100, and the
vgpu.

JIRA NVGPU-30
JIRA NVGPU-138

Change-Id: I65374764350a5cacce8624b15d98947fada35a4a
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1579865
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 2ece7be8..9d033d6d 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -535,6 +535,8 @@ static const struct gpu_ops gv100_ops = {
 		.is_bar1_supported = gv11b_mm_is_bar1_supported,
 		.init_inst_block = gv11b_init_inst_block,
 		.mmu_fault_pending = gv11b_mm_mmu_fault_pending,
+		.get_kind_invalid = gm20b_get_kind_invalid,
+		.get_kind_pitch = gm20b_get_kind_pitch,
 		.init_bar2_vm = gp10b_init_bar2_vm,
 		.init_bar2_mm_hw_setup = gv11b_init_bar2_mm_hw_setup,
 		.remove_bar2_vm = gv11b_mm_remove_bar2_vm,
-- 
cgit v1.2.2


From 387ecf8a6360f463a129ab569aaef921fe0a2b0e Mon Sep 17 00:00:00 2001
From: seshendra Gadagottu <sgadagottu@nvidia.com>
Date: Wed, 18 Oct 2017 11:40:46 -0700
Subject: gpu: nvgpu: gv1xx: Remove HAL for restore_context_header

gr restore_context_header is not required any more after
enabling per context va mode for subcontext. Cleaning-up
unused function pointers from gv100 and gv11b HAL.

Change-Id: I65cc7d12d3c96726d323defd99726c3e259e7e63
Signed-off-by: seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1581432
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 -
 1 file changed, 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 9d033d6d..f20d2dcf 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -387,7 +387,6 @@ static const struct gpu_ops gv100_ops = {
 		.handle_tpc_mpc_exception = gr_gv11b_handle_tpc_mpc_exception,
 		.zbc_s_query_table = gr_gv11b_zbc_s_query_table,
 		.load_zbc_s_default_tbl = gr_gv11b_load_stencil_default_tbl,
-		.restore_context_header = gv11b_restore_context_header,
 		.handle_gpc_gpcmmu_exception =
 			gr_gv11b_handle_gpc_gpcmmu_exception,
 		.add_zbc_type_s = gr_gv11b_add_zbc_type_s,
-- 
cgit v1.2.2


From ed8ac6e005d95e051bd03a182bbe0aa09a3c2266 Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Mon, 16 Oct 2017 12:24:59 -0700
Subject: gpu: nvgpu: fix smid generation of perf tables

SMID tables were generated according to the local TPC without taking
performance into consideration, and the pagepool and CB buffer sizes came from
a different chip, which made compute kernels hang with CTAs in flight.

This change ensures we are using the right sizes and adds proper enumeration
of smids.

JIRA: NVGPUGV100-36
bug 2004378

Change-Id: Ic8f50c325d6d6720cca41d9740ae4f5f51e1100a
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1581664
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index f20d2dcf..cefaf1ae 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -78,7 +78,7 @@
 
 #include "gv11b/dbg_gpu_gv11b.h"
 #include "gv11b/hal_gv11b.h"
-#include "gv11b/gr_gv11b.h"
+#include "gv100/gr_gv100.h"
 #include "gv11b/mc_gv11b.h"
 #include "gv11b/ltc_gv11b.h"
 #include "gv11b/gv11b.h"
@@ -263,8 +263,8 @@ static const struct gpu_ops gv100_ops = {
 	},
 	.gr = {
 		.init_gpc_mmu = gr_gv11b_init_gpc_mmu,
-		.bundle_cb_defaults = gr_gv11b_bundle_cb_defaults,
-		.cb_size_default = gr_gv11b_cb_size_default,
+		.bundle_cb_defaults = gr_gv100_bundle_cb_defaults,
+		.cb_size_default = gr_gv100_cb_size_default,
 		.calc_global_ctx_buffer_size =
 			gr_gv11b_calc_global_ctx_buffer_size,
 		.commit_global_attrib_cb = gr_gv11b_commit_global_attrib_cb,
@@ -285,7 +285,7 @@ static const struct gpu_ops gv100_ops = {
 		.set_hww_esr_report_mask = gv11b_gr_set_hww_esr_report_mask,
 		.falcon_load_ucode = gr_gm20b_load_ctxsw_ucode_segments,
 		.load_ctxsw_ucode = gr_gm20b_load_ctxsw_ucode,
-		.set_gpc_tpc_mask = gr_gv11b_set_gpc_tpc_mask,
+		.set_gpc_tpc_mask = gr_gv100_set_gpc_tpc_mask,
 		.get_gpc_tpc_mask = gr_gm20b_get_gpc_tpc_mask,
 		.free_channel_ctx = gk20a_free_channel_ctx,
 		.alloc_obj_ctx = gk20a_alloc_obj_ctx,
@@ -335,7 +335,7 @@ static const struct gpu_ops gv100_ops = {
 		.resume_contexts = gr_gk20a_resume_contexts,
 		.get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
 		.fuse_override = gp10b_gr_fuse_override,
-		.init_sm_id_table = gr_gv11b_init_sm_id_table,
+		.init_sm_id_table = gr_gv100_init_sm_id_table,
 		.load_smid_config = gr_gv11b_load_smid_config,
 		.program_sm_id_numbering = gr_gv11b_program_sm_id_numbering,
 		.is_ltcs_ltss_addr = gr_gm20b_is_ltcs_ltss_addr,
-- 
cgit v1.2.2


From cf70c925cd3d8e6c83feee04316b080d5f258afc Mon Sep 17 00:00:00 2001
From: seshendra Gadagottu <sgadagottu@nvidia.com>
Date: Thu, 22 Jun 2017 16:28:19 -0700
Subject: gpu: nvgpu: gv11b: update css ops

Updated the following HAL functions for css gv11b and reused
them for gv100:
enable_snapshot
disable_snapshot
check_data_available

These changes are needed for the following reasons:
1. Register offsets for perf_pmasys_* are changed
   for gv11b/gv100 from gk20a.
2. Updated memory type for perf_pmasys_mem_block_target
   based on memory aperture used for hwpm inst_block.

Bug 200327596

Change-Id: I500d17670e2f389d8d0e77884374bcc3504a41f8
Signed-off-by: seshendra Gadagottu <sgadagottu@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1507546
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index cefaf1ae..2007eee0 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -76,6 +76,7 @@
 #include "gp10b/mm_gp10b.h"
 #include "gp10b/pmu_gp10b.h"
 
+#include "gv11b/css_gr_gv11b.h"
 #include "gv11b/dbg_gpu_gv11b.h"
 #include "gv11b/hal_gv11b.h"
 #include "gv100/gr_gv100.h"
@@ -639,9 +640,9 @@ static const struct gpu_ops gv100_ops = {
 	},
 #if defined(CONFIG_GK20A_CYCLE_STATS)
 	.css = {
-		.enable_snapshot = css_hw_enable_snapshot,
-		.disable_snapshot = css_hw_disable_snapshot,
-		.check_data_available = css_hw_check_data_available,
+		.enable_snapshot = gv11b_css_hw_enable_snapshot,
+		.disable_snapshot = gv11b_css_hw_disable_snapshot,
+		.check_data_available = gv11b_css_hw_check_data_available,
 		.set_handled_snapshots = css_hw_set_handled_snapshots,
 		.allocate_perfmon_ids = css_gr_allocate_perfmon_ids,
 		.release_perfmon_ids = css_gr_release_perfmon_ids,
-- 
cgit v1.2.2


From 2904e3ac0081d4e898378f6ba667658c85547368 Mon Sep 17 00:00:00 2001
From: Mahantesh Kumbar <mkumbar@nvidia.com>
Date: Wed, 4 Oct 2017 19:41:04 +0530
Subject: gpu: nvgpu: gv100 memory unlock support

- Added a method to load the mem unlock binary into
  the nvdec falcon and execute it to perform mem unlock
  if VPR is enabled.
- Updated the .mem_unlock gv100 HAL to point to
  gv100_fb_memory_unlock().
- Updated .mem_unlock gv11b HAL to NULL.
- Added vpr info hw registers
- Added nvdec enable hw register

Change-Id: Ia4bf820ae103baede679d300d1d390fd748c919a
Signed-off-by: Mahantesh Kumbar <mkumbar@nvidia.com>
(cherry picked from commit 2e176ad9d47316bf4d001692a2ae07e6c1fb1ccb)
Reviewed-on: https://git-master.nvidia.com/r/1573101
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 2007eee0..4e05f22b 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -421,6 +421,7 @@ static const struct gpu_ops gv100_ops = {
 		.set_debug_mode = gm20b_fb_set_debug_mode,
 		.tlb_invalidate = gk20a_fb_tlb_invalidate,
 		.hub_isr = gv11b_fb_hub_isr,
+		.mem_unlock = gv100_fb_memory_unlock,
 	},
 	.fifo = {
 		.init_fifo_setup_hw = gv11b_init_fifo_setup_hw,
-- 
cgit v1.2.2


From 6114553413297dbcae637bc50ef2ff2a6c0858d1 Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Thu, 19 Oct 2017 10:12:24 -0700
Subject: gpu: nvgpu: gv100: fix timeout handling

GV100 has a larger vidmem size and a slower sideband to sysmem so timeouts
need to be adjusted to avoid false positives.

JIRA: NVGPUGV100-36

Change-Id: I3cbc19aa1158c89bc48ae1fa6ec4bc755cd9389d
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1582092
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 4e05f22b..ff852168 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -424,6 +424,7 @@ static const struct gpu_ops gv100_ops = {
 		.mem_unlock = gv100_fb_memory_unlock,
 	},
 	.fifo = {
+		.get_preempt_timeout = gv100_fifo_get_preempt_timeout,
 		.init_fifo_setup_hw = gv11b_init_fifo_setup_hw,
 		.bind_channel = channel_gm20b_bind,
 		.unbind_channel = channel_gv11b_unbind,
@@ -470,7 +471,7 @@ static const struct gpu_ops gv100_ops = {
 		.intr_0_error_mask = gv11b_fifo_intr_0_error_mask,
 		.is_preempt_pending = gv11b_fifo_is_preempt_pending,
 		.init_pbdma_intr_descs = gv11b_fifo_init_pbdma_intr_descs,
-		.reset_enable_hw = gv11b_init_fifo_reset_enable_hw,
+		.reset_enable_hw = gk20a_init_fifo_reset_enable_hw,
 		.teardown_ch_tsg = gv11b_fifo_teardown_ch_tsg,
 		.handle_sched_error = gv11b_fifo_handle_sched_error,
 		.handle_pbdma_intr_0 = gv11b_fifo_handle_pbdma_intr_0,
@@ -523,7 +524,7 @@ static const struct gpu_ops gv100_ops = {
 		.vm_bind_channel = gk20a_vm_bind_channel,
 		.fb_flush = gk20a_mm_fb_flush,
 		.l2_invalidate = gk20a_mm_l2_invalidate,
-		.l2_flush = gv11b_mm_l2_flush,
+		.l2_flush = gk20a_mm_l2_flush,
 		.cbc_clean = gk20a_mm_cbc_clean,
 		.set_big_page_size = gm20b_mm_set_big_page_size,
 		.get_big_page_sizes = gm20b_mm_get_big_page_sizes,
@@ -542,6 +543,7 @@ static const struct gpu_ops gv100_ops = {
 		.init_bar2_mm_hw_setup = gv11b_init_bar2_mm_hw_setup,
 		.remove_bar2_vm = gv11b_mm_remove_bar2_vm,
 		.fault_info_mem_destroy = gv11b_mm_fault_info_mem_destroy,
+		.get_flush_retries = gv100_mm_get_flush_retries,
 	},
 	.pramin = {
 		.enter = gk20a_pramin_enter,
-- 
cgit v1.2.2


From f8c2b77e4f64fcb4adc889bfc0bd4b9ad368ecc6 Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Fri, 20 Oct 2017 14:58:13 -0700
Subject: gpu: nvgpu: Add gv10x regops whitelist

Add regops whitelists for GV100

JIRA: NVGPUGV100-36

Change-Id: Ifeb286e2e8df056ba9afdd32f457bacf1b4813fc
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1582835
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 24 ++++++++++++++++++++++--
 1 file changed, 22 insertions(+), 2 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index ff852168..3a8dc4b1 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -96,7 +96,7 @@
 #include "gv11b/regops_gv11b.h"
 
 #include "gv11b/gv11b_gating_reglist.h"
-#include "gv11b/regops_gv11b.h"
+#include "gv100/regops_gv100.h"
 #include "gv11b/subctx_gv11b.h"
 
 #include "gv100.h"
@@ -600,7 +600,27 @@ static const struct gpu_ops gv100_ops = {
 		.get_current_pstate = nvgpu_clk_arb_get_current_pstate,
 	},
 	.regops = {
-		.apply_smpc_war = gv11b_apply_smpc_war,
+		.get_global_whitelist_ranges =
+			gv100_get_global_whitelist_ranges,
+		.get_global_whitelist_ranges_count =
+			gv100_get_global_whitelist_ranges_count,
+		.get_context_whitelist_ranges =
+			gv100_get_context_whitelist_ranges,
+		.get_context_whitelist_ranges_count =
+			gv100_get_context_whitelist_ranges_count,
+		.get_runcontrol_whitelist = gv100_get_runcontrol_whitelist,
+		.get_runcontrol_whitelist_count =
+			gv100_get_runcontrol_whitelist_count,
+		.get_runcontrol_whitelist_ranges =
+			gv100_get_runcontrol_whitelist_ranges,
+		.get_runcontrol_whitelist_ranges_count =
+			gv100_get_runcontrol_whitelist_ranges_count,
+		.get_qctl_whitelist = gv100_get_qctl_whitelist,
+		.get_qctl_whitelist_count = gv100_get_qctl_whitelist_count,
+		.get_qctl_whitelist_ranges = gv100_get_qctl_whitelist_ranges,
+		.get_qctl_whitelist_ranges_count =
+			gv100_get_qctl_whitelist_ranges_count,
+		.apply_smpc_war = gv100_apply_smpc_war,
 	},
 	.mc = {
 		.intr_enable = mc_gv11b_intr_enable,
-- 
cgit v1.2.2


From 0899e11d4bb630381607a0c245f72476e2e9209e Mon Sep 17 00:00:00 2001
From: Alex Waterman <alexw@nvidia.com>
Date: Fri, 6 Oct 2017 17:20:12 -0700
Subject: gpu: nvgpu: Cleanup generic MM code

t19x changes necessary for change in core MM code.

JIRA NVGPU-30

Change-Id: I62f419450c1a33d0826390d7cbb5ad93569f8c89
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1577265
Reviewed-by: Automatic_Commit_Validation_User
GVS: Gerrit_Virtual_Submit
Reviewed-by: David Martinez Nieto <dmartineznie@nvidia.com>
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 3a8dc4b1..1ae424df 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -535,6 +535,7 @@ static const struct gpu_ops gv100_ops = {
 		.init_pdb = gp10b_mm_init_pdb,
 		.init_mm_setup_hw = gv11b_init_mm_setup_hw,
 		.is_bar1_supported = gv11b_mm_is_bar1_supported,
+		.alloc_inst_block = gk20a_alloc_inst_block,
 		.init_inst_block = gv11b_init_inst_block,
 		.mmu_fault_pending = gv11b_mm_mmu_fault_pending,
 		.get_kind_invalid = gm20b_get_kind_invalid,
-- 
cgit v1.2.2


From 1cbb5ea0235f15180b1d4299499cab85db23c5ce Mon Sep 17 00:00:00 2001
From: Peter Daifuku <pdaifuku@nvidia.com>
Date: Fri, 13 Oct 2017 17:15:46 -0700
Subject: gpu: nvgpu: init_cyclestats fixes

- in the native case, replace calls for init_cyclestats with
  the gm20b version, as each chip had identical versions of the code.

- in the virtual case, use the vgpu version of the function in order
  to get the new max_css_buffer_size characteristic set to the mempool
  size.

JIRA ESRM-54
Bug 200296210

Change-Id: I475876cb392978fb1350ede58e37d0962ae095c3
Signed-off-by: Peter Daifuku <pdaifuku@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1578934
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 1ae424df..e8be1a43 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -316,7 +316,7 @@ static const struct gpu_ops gv100_ops = {
 		.get_max_fbps_count = gr_gm20b_get_max_fbps_count,
 		.init_sm_dsm_reg_info = gv11b_gr_init_sm_dsm_reg_info,
 		.wait_empty = gr_gv11b_wait_empty,
-		.init_cyclestats = gr_gv11b_init_cyclestats,
+		.init_cyclestats = gr_gm20b_init_cyclestats,
 		.set_sm_debug_mode = gv11b_gr_set_sm_debug_mode,
 		.enable_cde_in_fecs = gr_gm20b_enable_cde_in_fecs,
 		.bpt_reg_info = gv11b_gr_bpt_reg_info,
-- 
cgit v1.2.2


From 938785f1525ce0ae654c2be0911e15816617995d Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Mon, 23 Oct 2017 08:45:13 -0700
Subject: gpu: nvgpu: Linux specific GPU characteristics flags

Make GPU characteristics flags specific to Linux code only. The
rest of the driver is moved to using the nvgpu_is_enabled() API.

JIRA NVGPU-259

Change-Id: I46a5a90bb34f170e9e755e7683be142ed6b18cce
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1583992
GVS: Gerrit_Virtual_Submit
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index e8be1a43..e51b4446 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -107,6 +107,7 @@
 #include <nvgpu/bus.h>
 #include <nvgpu/debug.h>
 #include <nvgpu/enabled.h>
+#include <nvgpu/enabled_t19x.h>
 
 #include <nvgpu/hw/gv100/hw_proj_gv100.h>
 #include <nvgpu/hw/gv100/hw_fifo_gv100.h>
@@ -221,16 +222,13 @@ static int gv100_get_litter_value(struct gk20a *g, int value)
 
 int gv100_init_gpu_characteristics(struct gk20a *g)
 {
-	struct nvgpu_gpu_characteristics *gpu = &g->gpu_characteristics;
-
 	int err;
 
 	err = gk20a_init_gpu_characteristics(g);
 	if (err)
 		return err;
 
-	gpu->flags |=
-		NVGPU_GPU_FLAGS_SUPPORT_TSG_SUBCONTEXTS;
+	__nvgpu_set_enabled(g, NVGPU_SUPPORT_TSG_SUBCONTEXTS, true);
 
 	return 0;
 }
-- 
cgit v1.2.2


From 20294264468eecc8c1a065aa83d5f1b46ff07e7e Mon Sep 17 00:00:00 2001
From: David Nieto <dmartineznie@nvidia.com>
Date: Mon, 23 Oct 2017 14:01:28 -0700
Subject: gpu: nvgpu: gv1xx: resize patch buffer

Follow the sizing consideration in bug 1753763 to support dynamic TPC modes
and subcontexts.

bug 200350539

Change-Id: Ibbdbf02f9c2ea3f082c1b2810ae7176b0775d461
Signed-off-by: David Nieto <dmartineznie@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1584034
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 +
 1 file changed, 1 insertion(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index e51b4446..61e9e46d 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -261,6 +261,7 @@ static const struct gpu_ops gv100_ops = {
 		.get_num_pce = gv11b_ce_get_num_pce,
 	},
 	.gr = {
+		.get_patch_slots = gr_gv100_get_patch_slots,
 		.init_gpc_mmu = gr_gv11b_init_gpc_mmu,
 		.bundle_cb_defaults = gr_gv100_bundle_cb_defaults,
 		.cb_size_default = gr_gv100_cb_size_default,
-- 
cgit v1.2.2


From afd1649cfcae97e873663586d55f9a4cfd671808 Mon Sep 17 00:00:00 2001
From: Alex Waterman <alexw@nvidia.com>
Date: Thu, 26 Oct 2017 15:20:39 -0700
Subject: gpu: nvgpu: Move ctxsw_trace_gk20a.c to common/linux

Fixups for the change named in the subject, which was made in nvgpu.

JIRA NVGPU-287

Change-Id: I6c19733079061a42786b94fc48db374d715ccbef
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1586548
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 61e9e46d..0950409f 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -709,7 +709,9 @@ int gv100_init_hal(struct gk20a *g)
 	gops->fifo = gv100_ops.fifo;
 	gops->gr_ctx = gv100_ops.gr_ctx;
 	gops->mm = gv100_ops.mm;
+#ifdef CONFIG_GK20A_CTXSW_TRACE
 	gops->fecs_trace = gv100_ops.fecs_trace;
+#endif
 	gops->pramin = gv100_ops.pramin;
 	gops->therm = gv100_ops.therm;
 	gops->pmu = gv100_ops.pmu;
-- 
cgit v1.2.2


From f472922b3582dbba78b633958a4cb7b65ddb3f03 Mon Sep 17 00:00:00 2001
From: Alex Waterman <alexw@nvidia.com>
Date: Tue, 31 Oct 2017 12:23:30 -0700
Subject: gpu: nvgpu: Split ctxsw_trace API into non-Linux component

T19x component for similar change in the main nvgpu code.

JIRA NVGPU-287

Change-Id: Ib126b3d1fb562850fbb3ab89103f2a7fdaa13306
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1589430
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 0950409f..30b8e2c3 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -30,7 +30,6 @@
 
 #include "gk20a/gk20a.h"
 #include "gk20a/fifo_gk20a.h"
-#include "gk20a/ctxsw_trace_gk20a.h"
 #include "gk20a/fecs_trace_gk20a.h"
 #include "gk20a/css_gr_gk20a.h"
 #include "gk20a/mc_gk20a.h"
@@ -108,6 +107,7 @@
 #include <nvgpu/debug.h>
 #include <nvgpu/enabled.h>
 #include <nvgpu/enabled_t19x.h>
+#include <nvgpu/ctxsw_trace.h>
 
 #include <nvgpu/hw/gv100/hw_proj_gv100.h>
 #include <nvgpu/hw/gv100/hw_fifo_gv100.h>
-- 
cgit v1.2.2


From 5b368d3e46b946ed2a6b1b70ad2ac600740e582a Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Tue, 7 Nov 2017 10:47:20 -0800
Subject: gpu: nvgpu: gv1xx: Move fuse override DT handling

Move fuse override DT handling to Linux code. All the chip specific
fuse override functions did the same thing, so delete the HAL and
call the same function to read the DT overrides on all chips.

Also remove the fuse override functionality from dGPU. There are no
DT entries for PCIe devices, so it would've failed anyway.

JIRA NVGPU-259

Change-Id: Ic672e25090cdfc207d9771ab61b6cf53185113a4
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1593693
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 -
 1 file changed, 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 30b8e2c3..4ee333b5 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -334,7 +334,6 @@ static const struct gpu_ops gv100_ops = {
 		.suspend_contexts = gr_gp10b_suspend_contexts,
 		.resume_contexts = gr_gk20a_resume_contexts,
 		.get_preemption_mode_flags = gr_gp10b_get_preemption_mode_flags,
-		.fuse_override = gp10b_gr_fuse_override,
 		.init_sm_id_table = gr_gv100_init_sm_id_table,
 		.load_smid_config = gr_gv11b_load_smid_config,
 		.program_sm_id_numbering = gr_gv11b_program_sm_id_numbering,
-- 
cgit v1.2.2


From c87e85af0cd812c6e1c138d4d1e48c23e3aa6bd3 Mon Sep 17 00:00:00 2001
From: Terje Bergstrom <tbergstrom@nvidia.com>
Date: Tue, 7 Nov 2017 09:31:37 -0800
Subject: gpu: nvgpu: Return GPU classes in get_litter_value

Return GPU classes in HAL get_litter_value() instead of assigning
them to GPU characteristics at HAL initialization time.

JIRA NVGPU-259

Change-Id: I92cbadf3bd07292a8715d30843972def879795f5
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1593691
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 26 ++++++++++++++++++--------
 1 file changed, 18 insertions(+), 8 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 4ee333b5..88008e77 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -213,6 +213,24 @@ static int gv100_get_litter_value(struct gk20a *g, int value)
 	case GPU_LIT_SMPC_PRI_STRIDE:
 		ret = proj_smpc_stride_v();
 		break;
+	case GPU_LIT_TWOD_CLASS:
+		ret = FERMI_TWOD_A;
+		break;
+	case GPU_LIT_THREED_CLASS:
+		ret = VOLTA_A;
+		break;
+	case GPU_LIT_COMPUTE_CLASS:
+		ret = VOLTA_COMPUTE_A;
+		break;
+	case GPU_LIT_GPFIFO_CLASS:
+		ret = VOLTA_CHANNEL_GPFIFO_A;
+		break;
+	case GPU_LIT_I2M_CLASS:
+		ret = KEPLER_INLINE_TO_MEMORY_B;
+		break;
+	case GPU_LIT_DMA_COPY_CLASS:
+		ret = VOLTA_DMA_COPY_A;
+		break;
 	default:
 		break;
 	}
@@ -697,7 +715,6 @@ static const struct gpu_ops gv100_ops = {
 int gv100_init_hal(struct gk20a *g)
 {
 	struct gpu_ops *gops = &g->ops;
-	struct nvgpu_gpu_characteristics *c = &g->gpu_characteristics;
 
 	gops->bios = gv100_ops.bios;
 	gops->ltc = gv100_ops.ltc;
@@ -754,12 +771,5 @@ int gv100_init_hal(struct gk20a *g)
 
 	g->name = "gv10x";
 
-	c->twod_class = FERMI_TWOD_A;
-	c->threed_class = VOLTA_A;
-	c->compute_class = VOLTA_COMPUTE_A;
-	c->gpfifo_class = VOLTA_CHANNEL_GPFIFO_A;
-	c->inline_to_memory_class = KEPLER_INLINE_TO_MEMORY_B;
-	c->dma_copy_class = VOLTA_DMA_COPY_A;
-
 	return 0;
 }
-- 
cgit v1.2.2


From 98bd673a7371940f24d37ad3a6d7b426995e737e Mon Sep 17 00:00:00 2001
From: Sami Kiminki <skiminki@nvidia.com>
Date: Fri, 15 Sep 2017 18:58:58 +0300
Subject: gpu: nvgpu: Remove PTE kind code for GV100/GV11B

Remove gv11b_init_uncompressed_kind_map(), gv11b_init_kind_attr(), and
the related kind setup code. They are not needed anymore.

While we're doing these changes, remove a redundant assignment of
g->bootstrap_owner in hal_gv100.c.

Bug 1902982

Change-Id: Ib40d8f55cfbfa34143a3765c2b4913926ca021fd
Signed-off-by: Sami Kiminki <skiminki@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1560931
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 5 -----
 1 file changed, 5 deletions(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 88008e77..7f2b149b 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -764,11 +764,6 @@ int gv100_init_hal(struct gk20a *g)
 	g->pmu_lsf_pmu_wpr_init_done = 0;
 	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
 
-	gv11b_init_uncompressed_kind_map();
-	gv11b_init_kind_attr();
-
-	g->bootstrap_owner = LSF_FALCON_ID_SEC2;
-
 	g->name = "gv10x";
 
 	return 0;
-- 
cgit v1.2.2


From af5e4a1bf63037e7618adfa11a950244df5883f2 Mon Sep 17 00:00:00 2001
From: Deepak Nibade <dnibade@nvidia.com>
Date: Wed, 15 Nov 2017 15:10:51 +0530
Subject: gpu: nvgpu: deprecate TSG/CHANNEL_SET_PRIORITY IOCTLs

TSG/CHANNEL_SET_PRIORITY IOCTLs are deprecated and user space should be using
a combination of timeslice and interleave levels to decide the priority.

Hence remove the IOCTLs and all corresponding APIs.

Jira NVGPU-393

Change-Id: Idce925631653784e39864223dc418a99a7e7ca3c
Signed-off-by: Deepak Nibade <dnibade@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1598582
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c | 1 -
 1 file changed, 1 deletion(-)

(limited to 'drivers/gpu/nvgpu/gv100/hal_gv100.c')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index 7f2b149b..4044c4b5 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -449,7 +449,6 @@ static const struct gpu_ops gv100_ops = {
 		.alloc_inst = gk20a_fifo_alloc_inst,
 		.free_inst = gk20a_fifo_free_inst,
 		.setup_ramfc = channel_gv11b_setup_ramfc,
-		.channel_set_priority = gk20a_fifo_set_priority,
 		.channel_set_timeslice = gk20a_fifo_set_timeslice,
 		.default_timeslice_us = gk20a_fifo_default_timeslice_us,
 		.setup_userd = gk20a_fifo_setup_userd,
-- 
cgit v1.2.2