From ae809fddbe90bcec0d48e1213fa36cc5ba76550d Mon Sep 17 00:00:00 2001
From: Vaikundanathan S <vaikuns@nvidia.com>
Date: Tue, 28 Aug 2018 11:58:25 +0530
Subject: gpu:nvgpu: Add GV10x perf event

In case of VFE update, schedule work to set P0 clocks.
Added function nvgpu_clk_set_fll_clk_gv10x to update P0 clocks on perf event.
Fixed the MISRA issues introduced by this change, except those arising from
external functions and macros.

Bug 2331655

Change-Id: Id96c473092ee7f0b651413aefdd4b6f2f59e0b12
Signed-off-by: Vaikundanathan S <vaikuns@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1808014
Reviewed-on: https://git-master.nvidia.com/r/1813881
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
---
 drivers/gpu/nvgpu/gv100/hal_gv100.c  |   3 +
 drivers/gpu/nvgpu/gv100/perf_gv100.c | 120 +++++++++++++++++++++++++++++++++++
 drivers/gpu/nvgpu/gv100/perf_gv100.h |  36 +++++++++++
 3 files changed, 159 insertions(+)
 create mode 100644 drivers/gpu/nvgpu/gv100/perf_gv100.c
 create mode 100644 drivers/gpu/nvgpu/gv100/perf_gv100.h

(limited to 'drivers/gpu/nvgpu/gv100')

diff --git a/drivers/gpu/nvgpu/gv100/hal_gv100.c b/drivers/gpu/nvgpu/gv100/hal_gv100.c
index ee6dd436..0c64ce58 100644
--- a/drivers/gpu/nvgpu/gv100/hal_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/hal_gv100.c
@@ -107,6 +107,7 @@
 #include "gv100/pmu_gv100.h"
 #include "gv100/nvlink_gv100.h"
 #include "gv100/regops_gv100.h"
+#include "gv100/perf_gv100.h"
 
 #include <nvgpu/ptimer.h>
 #include <nvgpu/debug.h>
@@ -770,6 +771,7 @@ static const struct gpu_ops gv100_ops = {
 		.get_rate_cntr = gp106_get_rate_cntr,
 		.measure_freq = gp106_clk_measure_freq,
 		.suspend_clk_support = gp106_suspend_clk_support,
+		.perf_pmu_vfe_load = gv100_perf_pmu_vfe_load,
 	},
 	.clk_arb = {
 		.get_arbiter_clk_domains = gp106_get_arbiter_clk_domains,
@@ -981,6 +983,7 @@ int gv100_init_hal(struct gk20a *g)
 	gops->clk.get_crystal_clk_hz = gv100_ops.clk.get_crystal_clk_hz;
 	gops->clk.measure_freq = gv100_ops.clk.measure_freq;
 	gops->clk.suspend_clk_support = gv100_ops.clk.suspend_clk_support;
+	gops->clk.perf_pmu_vfe_load = gv100_ops.clk.perf_pmu_vfe_load;
 
 	/* Lone functions */
 	gops->chip_init_gpu_characteristics =
diff --git a/drivers/gpu/nvgpu/gv100/perf_gv100.c b/drivers/gpu/nvgpu/gv100/perf_gv100.c
new file mode 100644
index 00000000..f3ba78ba
--- /dev/null
+++ b/drivers/gpu/nvgpu/gv100/perf_gv100.c
@@ -0,0 +1,176 @@
+/*
+ * GV100 PERF
+ *
+ * Copyright (c) 2018, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+
+#include <nvgpu/pmu.h>
+#include <nvgpu/bug.h>
+
+#include "gk20a/gk20a.h"
+#include "gv100/perf_gv100.h"
+
+/*
+ * Worker thread body: waits for a VFE state change signalled by
+ * gv100_pmu_handle_perf_event(), then issues the PERF VFE_INVALIDATE RPC to
+ * the PMU and calls nvgpu_clk_set_fll_clk_gv10x().
+ *
+ * @arg: the struct gk20a pointer passed to nvgpu_thread_create().
+ *
+ * Loops until a stop of the worker thread is requested; always returns 0.
+ */
+static int pmu_set_boot_clk_runcb_fn(void *arg)
+{
+	struct gk20a *g = (struct gk20a *)arg;
+	struct nvgpu_pmu *pmu = &g->pmu;
+	struct nv_pmu_rpc_struct_perf_load rpc;
+	struct perf_pmupstate *perf_pmu = &g->perf_pmu;
+	struct nvgpu_vfe_invalidate *vfe_init = &perf_pmu->vfe_init;
+	int status = 0;
+
+	nvgpu_log_fn(g, "thread start");
+
+	while (true) {
+		/* Also wake up on a stop request so the thread can exit. */
+		NVGPU_COND_WAIT_INTERRUPTIBLE(&vfe_init->wq,
+			((vfe_init->state_change == true) ||
+			 nvgpu_thread_should_stop(&vfe_init->state_task)), 0);
+
+		if (nvgpu_thread_should_stop(&vfe_init->state_task)) {
+			break;
+		}
+
+		/* Consume the event before servicing it. */
+		vfe_init->state_change = false;
+
+		memset(&rpc, 0, sizeof(rpc));
+		PMU_RPC_EXECUTE_CPB(status, pmu, PERF, VFE_INVALIDATE, &rpc, 0);
+		if (status != 0) {
+			nvgpu_err(g, "Failed to execute RPC status=0x%x",
+					status);
+		}
+
+		/* The clock update is attempted even if the RPC failed. */
+		status = nvgpu_clk_set_fll_clk_gv10x(g);
+		if (status != 0) {
+			nvgpu_err(g, "Failed to set P0 clocks status=0x%x",
+					status);
+		}
+	}
+
+	return 0;
+}
+
+/*
+ * PMU PERF message handler, installed by gv100_perf_pmu_vfe_load().
+ *
+ * @g:      driver state (struct gk20a).
+ * @pmumsg: received message, interpreted as struct nv_pmu_perf_msg.
+ *
+ * A VFE callback message flags a state change and wakes the worker thread;
+ * any other message type triggers WARN_ON(). Always returns 0.
+ */
+static int gv100_pmu_handle_perf_event(struct gk20a *g, void *pmumsg)
+{
+	struct nv_pmu_perf_msg *msg = (struct nv_pmu_perf_msg *)pmumsg;
+	struct perf_pmupstate *perf_pmu = &g->perf_pmu;
+
+	nvgpu_log_fn(g, " ");
+	switch (msg->msg_type) {
+	case NV_PMU_PERF_MSG_ID_VFE_CALLBACK:
+		perf_pmu->vfe_init.state_change = true;
+		nvgpu_cond_signal(&perf_pmu->vfe_init.wq);
+		break;
+	default:
+		WARN_ON(1);
+		break;
+	}
+	return 0;
+}
+
+/*
+ * Initialise the VFE wait queue and start the worker thread that services
+ * VFE callbacks.
+ *
+ * Returns 0 on success, otherwise the error code from nvgpu_cond_init() or
+ * nvgpu_thread_create() converted to u32.
+ */
+u32 perf_pmu_init_vfe_perf_event(struct gk20a *g)
+{
+	struct perf_pmupstate *perf_pmu = &g->perf_pmu;
+	char thread_name[64];
+	int err;
+
+	nvgpu_log_fn(g, " ");
+
+	err = nvgpu_cond_init(&perf_pmu->vfe_init.wq);
+	if (err != 0) {
+		nvgpu_err(g, "failed to init nvgpu_vfe_invalidate_init cond");
+		return (u32)err;
+	}
+
+	snprintf(thread_name, sizeof(thread_name),
+				"nvgpu_vfe_invalidate_init_%s", g->name);
+
+	err = nvgpu_thread_create(&perf_pmu->vfe_init.state_task, g,
+			pmu_set_boot_clk_runcb_fn, thread_name);
+	if (err != 0) {
+		nvgpu_err(g, "failed to start nvgpu_vfe_invalidate_init thread");
+	}
+
+	return (u32)err;
+}
+
+/*
+ * Issue the PERF VFE_INVALIDATE RPC to the PMU, start the VFE event worker
+ * thread and install the PMU perf event handler.
+ *
+ * Returns the RPC status if the RPC failed, otherwise the status of
+ * perf_pmu_init_vfe_perf_event() (0 on success).
+ *
+ * NOTE(review): every call starts a new worker thread; confirm callers
+ * invoke this only once per thread lifetime.
+ */
+u32 gv100_perf_pmu_vfe_load(struct gk20a *g)
+{
+	struct nvgpu_pmu *pmu = &g->pmu;
+	struct nv_pmu_rpc_struct_perf_load rpc;
+	u32 status = 0;
+	u32 err;
+
+	memset(&rpc, 0, sizeof(rpc));
+	PMU_RPC_EXECUTE_CPB(status, pmu, PERF, VFE_INVALIDATE, &rpc, 0);
+	if (status != 0U) {
+		nvgpu_err(g, "Failed to execute RPC status=0x%x",
+			status);
+	}
+
+	/* Report a worker start-up failure unless the RPC already failed. */
+	err = perf_pmu_init_vfe_perf_event(g);
+	if ((err != 0U) && (status == 0U)) {
+		status = err;
+	}
+
+	/* Register the callback for future VFE updates. */
+	g->ops.perf.handle_pmu_perf_event = gv100_pmu_handle_perf_event;
+
+	return status;
+}
diff --git a/drivers/gpu/nvgpu/gv100/perf_gv100.h b/drivers/gpu/nvgpu/gv100/perf_gv100.h
new file mode 100644
index 00000000..e128c06a
--- /dev/null
+++ b/drivers/gpu/nvgpu/gv100/perf_gv100.h
@@ -0,0 +1,46 @@
+/*
+ * GV100 PERF
+ *
+ * Copyright (c) 2018, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ * DEALINGS IN THE SOFTWARE.
+ */
+
+#ifndef NVGPU_PERF_GV100_H
+#define NVGPU_PERF_GV100_H
+
+#include <nvgpu/pmuif/nvgpu_gpmu_cmdif.h>
+
+struct gk20a;
+
+/*
+ * Initialise the VFE wait queue and start the worker thread that services
+ * VFE callbacks. Returns 0 on success, non-zero if the thread cannot be
+ * started.
+ */
+u32 perf_pmu_init_vfe_perf_event(struct gk20a *g);
+
+/*
+ * Send the PERF VFE_INVALIDATE RPC to the PMU, start the VFE worker thread
+ * and register the PMU perf event handler. Returns a non-zero status if the
+ * RPC fails.
+ */
+u32 gv100_perf_pmu_vfe_load(struct gk20a *g);
+
+#endif /* NVGPU_PERF_GV100_H */
-- 
cgit v1.2.2