From 77e2cbab237637f71367df25384164b8c936a31a Mon Sep 17 00:00:00 2001
From: Mahantesh Kumbar
Date: Tue, 13 Jun 2017 15:21:56 +0530
Subject: gpu: nvgpu: reorganize PMU perfmon

- Moved perfmon code from pmu_gk20a.c to
  "drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c"
- Moved the related methods: perfmon init, start/stop sampling,
  load counter read/write/reset, and the perfmon event handler
- Prepended nvgpu_ to the global perfmon methods, replacing the
  gk20a_ prefix

JURA NVGPU-56
JURA NVGPU-98

Change-Id: Idbcdf63ebd76da170e609cc401b320a42110cd7b
Signed-off-by: Mahantesh Kumbar
Reviewed-on: http://git-master/r/1501418
Reviewed-by: mobile promotions
Tested-by: mobile promotions
---
 drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c | 271 +++++++++++++++++++++++++++++
 1 file changed, 271 insertions(+)
 create mode 100644 drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c

(limited to 'drivers/gpu/nvgpu/common')

diff --git a/drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c b/drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c
new file mode 100644
index 00000000..e28e53a0
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/pmu/pmu_perfmon.c
@@ -0,0 +1,271 @@
+/*
+ * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
+ * more details.
+ */
+
+#include <nvgpu/pmu.h>
+#include <nvgpu/log.h>
+#include <nvgpu/pmuif/nvgpu_gpmu_cmdif.h>
+
+#include "gk20a/gk20a.h"
+
+#ifdef CONFIG_TEGRA_19x_GPU
+#include "nvgpu_gpuid_t19x.h"
+#endif
+
+static u8 get_perfmon_id(struct nvgpu_pmu *pmu)
+{
+	struct gk20a *g = gk20a_from_pmu(pmu);
+	u32 ver = g->gpu_characteristics.arch + g->gpu_characteristics.impl;
+	u8 unit_id;
+
+	switch (ver) {
+	case GK20A_GPUID_GK20A:
+	case GK20A_GPUID_GM20B:
+		unit_id = PMU_UNIT_PERFMON;
+		break;
+	case NVGPU_GPUID_GP10B:
+	case NVGPU_GPUID_GP104:
+	case NVGPU_GPUID_GP106:
+		unit_id = PMU_UNIT_PERFMON_T18X;
+		break;
+#if defined(CONFIG_TEGRA_19x_GPU)
+	case TEGRA_19x_GPUID:
+		unit_id = PMU_UNIT_PERFMON_T18X;
+		break;
+#endif
+	default:
+		unit_id = PMU_UNIT_INVALID;
+		nvgpu_err(g, "no support for %x", ver);
+		WARN_ON(1);
+	}
+
+	return unit_id;
+}
+
+int nvgpu_pmu_init_perfmon(struct nvgpu_pmu *pmu)
+{
+	struct gk20a *g = gk20a_from_pmu(pmu);
+	struct pmu_v *pv = &g->ops.pmu_ver;
+	struct pmu_cmd cmd;
+	struct pmu_payload payload;
+	u32 seq;
+
+	nvgpu_log_fn(g, " ");
+
+	pmu->perfmon_ready = 0;
+
+	gk20a_pmu_init_perfmon_counter(g);
+
+	if (!pmu->sample_buffer)
+		pmu->sample_buffer = nvgpu_alloc(&pmu->dmem,
+						 2 * sizeof(u16));
+	if (!pmu->sample_buffer) {
+		nvgpu_err(g, "failed to allocate perfmon sample buffer");
+		return -ENOMEM;
+	}
+
+	/* init PERFMON */
+	memset(&cmd, 0, sizeof(struct pmu_cmd));
+
+	cmd.hdr.unit_id = get_perfmon_id(pmu);
+	if (cmd.hdr.unit_id == PMU_UNIT_INVALID) {
+		nvgpu_err(g, "failed to get perfmon UNIT ID, command skipped");
+		return -EINVAL;
+	}
+
+	cmd.hdr.size = PMU_CMD_HDR_SIZE + pv->get_pmu_perfmon_cmd_init_size();
+	cmd.cmd.perfmon.cmd_type = PMU_PERFMON_CMD_ID_INIT;
+	/* buffer to save counter values for pmu perfmon */
+	pv->perfmon_cmd_init_set_sample_buffer(&cmd.cmd.perfmon,
+		(u16)pmu->sample_buffer);
+	/* number of sample periods below lower threshold
+	 * before pmu triggers perfmon decrease event
+	 * TBD: = 15
+	 */
+	pv->perfmon_cmd_init_set_dec_cnt(&cmd.cmd.perfmon, 15);
+	/* index of base counter, aka. always ticking counter */
+	pv->perfmon_cmd_init_set_base_cnt_id(&cmd.cmd.perfmon, 6);
+	/* microseconds interval between pmu polls perf counters */
+	pv->perfmon_cmd_init_set_samp_period_us(&cmd.cmd.perfmon, 16700);
+	/* number of perfmon counters
+	 * counter #3 (GR and CE2) for gk20a
+	 */
+	pv->perfmon_cmd_init_set_num_cnt(&cmd.cmd.perfmon, 1);
+	/* moving average window for sample periods
+	 * TBD: = 3000000 / sample_period_us = 17
+	 */
+	pv->perfmon_cmd_init_set_mov_avg(&cmd.cmd.perfmon, 17);
+
+	memset(&payload, 0, sizeof(struct pmu_payload));
+	payload.in.buf = pv->get_perfmon_cntr_ptr(pmu);
+	payload.in.size = pv->get_perfmon_cntr_sz(pmu);
+	payload.in.offset = pv->get_perfmon_cmd_init_offsetofvar(COUNTER_ALLOC);
+
+	nvgpu_pmu_dbg(g, "cmd post PMU_PERFMON_CMD_ID_INIT");
+	gk20a_pmu_cmd_post(g, &cmd, NULL, &payload, PMU_COMMAND_QUEUE_LPQ,
+			   NULL, NULL, &seq, ~0);
+
+	return 0;
+}
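+
+/*
+ * INIT above only programs the sampling parameters; the PMU signals
+ * readiness back via PMU_PERFMON_MSG_ID_INIT_EVENT, which
+ * nvgpu_pmu_handle_perfmon_event() below uses to set perfmon_ready.
+ * Sampling itself is driven by the START/STOP commands that follow.
+ */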
+
+int nvgpu_pmu_perfmon_start_sampling(struct nvgpu_pmu *pmu)
+{
+	struct gk20a *g = gk20a_from_pmu(pmu);
+	struct pmu_v *pv = &g->ops.pmu_ver;
+	struct pmu_cmd cmd;
+	struct pmu_payload payload;
+	u32 seq;
+
+	/* PERFMON Start */
+	memset(&cmd, 0, sizeof(struct pmu_cmd));
+	cmd.hdr.unit_id = get_perfmon_id(pmu);
+	if (cmd.hdr.unit_id == PMU_UNIT_INVALID) {
+		nvgpu_err(g, "failed to get perfmon UNIT ID, command skipped");
+		return -EINVAL;
+	}
+	cmd.hdr.size = PMU_CMD_HDR_SIZE + pv->get_pmu_perfmon_cmd_start_size();
+	pv->perfmon_start_set_cmd_type(&cmd.cmd.perfmon,
+		PMU_PERFMON_CMD_ID_START);
+	pv->perfmon_start_set_group_id(&cmd.cmd.perfmon,
+		PMU_DOMAIN_GROUP_PSTATE);
+	pv->perfmon_start_set_state_id(&cmd.cmd.perfmon,
+		pmu->perfmon_state_id[PMU_DOMAIN_GROUP_PSTATE]);
+
+	pv->perfmon_start_set_flags(&cmd.cmd.perfmon,
+		PMU_PERFMON_FLAG_ENABLE_INCREASE |
+		PMU_PERFMON_FLAG_ENABLE_DECREASE |
+		PMU_PERFMON_FLAG_CLEAR_PREV);
+
+	memset(&payload, 0, sizeof(struct pmu_payload));
+
+	/* TBD: PMU_PERFMON_PCT_TO_INC * 100 */
+	pv->set_perfmon_cntr_ut(pmu, 3000); /* 30% */
+	/* TBD: PMU_PERFMON_PCT_TO_DEC * 100 */
+	pv->set_perfmon_cntr_lt(pmu, 1000); /* 10% */
+	pv->set_perfmon_cntr_valid(pmu, true);
+
+	payload.in.buf = pv->get_perfmon_cntr_ptr(pmu);
+	payload.in.size = pv->get_perfmon_cntr_sz(pmu);
+	payload.in.offset =
+		pv->get_perfmon_cmd_start_offsetofvar(COUNTER_ALLOC);
+
+	nvgpu_pmu_dbg(g, "cmd post PMU_PERFMON_CMD_ID_START");
+	gk20a_pmu_cmd_post(g, &cmd, NULL, &payload, PMU_COMMAND_QUEUE_LPQ,
+			   NULL, NULL, &seq, ~0);
+
+	return 0;
+}
+
+int nvgpu_pmu_perfmon_stop_sampling(struct nvgpu_pmu *pmu)
+{
+	struct gk20a *g = gk20a_from_pmu(pmu);
+	struct pmu_cmd cmd;
+	u32 seq;
+
+	/* PERFMON Stop */
+	memset(&cmd, 0, sizeof(struct pmu_cmd));
+	cmd.hdr.unit_id = get_perfmon_id(pmu);
+	if (cmd.hdr.unit_id == PMU_UNIT_INVALID) {
+		nvgpu_err(g, "failed to get perfmon UNIT ID, command skipped");
+		return -EINVAL;
+	}
+	cmd.hdr.size = PMU_CMD_HDR_SIZE + sizeof(struct pmu_perfmon_cmd_stop);
+	cmd.cmd.perfmon.stop.cmd_type = PMU_PERFMON_CMD_ID_STOP;
+
+	nvgpu_pmu_dbg(g, "cmd post PMU_PERFMON_CMD_ID_STOP");
+	gk20a_pmu_cmd_post(g, &cmd, NULL, NULL, PMU_COMMAND_QUEUE_LPQ,
+			   NULL, NULL, &seq, ~0);
+	return 0;
+}
+
+int nvgpu_pmu_load_norm(struct gk20a *g, u32 *load)
+{
+	*load = g->pmu.load_shadow;
+	return 0;
+}
+
+int nvgpu_pmu_load_update(struct gk20a *g)
+{
+	struct nvgpu_pmu *pmu = &g->pmu;
+	u16 load = 0;
+
+	if (!pmu->perfmon_ready) {
+		pmu->load_shadow = 0;
+		return 0;
+	}
+
+	pmu_copy_from_dmem(pmu, pmu->sample_buffer, (u8 *)&load, 2, 0);
+	pmu->load_shadow = load / 10;
+	pmu->load_avg = (((9*pmu->load_avg) + pmu->load_shadow) / 10);
+
+	return 0;
+}
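+
+/*
+ * load_shadow above keeps the most recent sample scaled down by 10, and
+ * load_avg a 9:1 exponential moving average of it. The helpers below
+ * expose the raw idle counters instead: as used here, counter #1
+ * accumulates busy cycles and counter #2 total cycles, and
+ * gk20a_busy()/gk20a_idle() hold a power reference (bailing out early if
+ * the GPU is off) while the counters are read or reset.
+ */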
+
+void nvgpu_pmu_get_load_counters(struct gk20a *g, u32 *busy_cycles,
+			u32 *total_cycles)
+{
+	if (!g->power_on || gk20a_busy(g)) {
+		*busy_cycles = 0;
+		*total_cycles = 0;
+		return;
+	}
+
+	*busy_cycles = gk20a_pmu_read_idle_counter(g, 1);
+	*total_cycles = gk20a_pmu_read_idle_counter(g, 2);
+
+	gk20a_idle(g);
+}
+
+void nvgpu_pmu_reset_load_counters(struct gk20a *g)
+{
+	if (!g->power_on || gk20a_busy(g))
+		return;
+
+	gk20a_pmu_reset_idle_counter(g, 2);
+	gk20a_pmu_reset_idle_counter(g, 1);
+
+	gk20a_idle(g);
+}
+
+int nvgpu_pmu_handle_perfmon_event(struct nvgpu_pmu *pmu,
+			struct pmu_perfmon_msg *msg)
+{
+	struct gk20a *g = gk20a_from_pmu(pmu);
+
+	nvgpu_log_fn(g, " ");
+
+	switch (msg->msg_type) {
+	case PMU_PERFMON_MSG_ID_INCREASE_EVENT:
+		nvgpu_pmu_dbg(g, "perfmon increase event: ");
+		nvgpu_pmu_dbg(g, "state_id %d, group_id %d, pct %d",
+			msg->gen.state_id, msg->gen.group_id, msg->gen.data);
+		(pmu->perfmon_events_cnt)++;
+		break;
+	case PMU_PERFMON_MSG_ID_DECREASE_EVENT:
+		nvgpu_pmu_dbg(g, "perfmon decrease event: ");
+		nvgpu_pmu_dbg(g, "state_id %d, group_id %d, pct %d",
+			msg->gen.state_id, msg->gen.group_id, msg->gen.data);
+		(pmu->perfmon_events_cnt)++;
+		break;
+	case PMU_PERFMON_MSG_ID_INIT_EVENT:
+		pmu->perfmon_ready = 1;
+		nvgpu_pmu_dbg(g, "perfmon init event");
+		break;
+	default:
+		break;
+	}
+
+	/* restart sampling */
+	if (pmu->perfmon_sampling_enabled)
+		return nvgpu_pmu_perfmon_start_sampling(pmu);
+	return 0;
+}
--
cgit v1.2.2