1 files changed, 306 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/linux/driver_common.c b/drivers/gpu/nvgpu/common/linux/driver_common.c
new file mode 100644
index 00000000..5c96b4e8
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/linux/driver_common.c
@@ -0,0 +1,306 @@
+/*
+ * Copyright (c) 2016-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+#include <linux/dma-mapping.h>
+#include <linux/firmware.h>
+#include <nvgpu/kmem.h>
+#include <nvgpu/nvgpu_common.h>
+#include <nvgpu/soc.h>
+#include <nvgpu/bug.h>
+#include "gk20a/gk20a_scale.h"
+#include "gk20a/gk20a.h"
+#include "module.h"
+#define EMC3D_DEFAULT_RATIO 750
+static void nvgpu_init_vars(struct gk20a *g)
+{
+        struct gk20a_platform *platform = dev_get_drvdata(g->dev);
+        init_waitqueue_head(&g->sw_irq_stall_last_handled_wq);
+        init_waitqueue_head(&g->sw_irq_nonstall_last_handled_wq);
+        gk20a_init_gr(g);
+        init_rwsem(&g->busy_lock);
+        nvgpu_spinlock_init(&g->mc_enable_lock);
+        nvgpu_mutex_init(&platform->railgate_lock);
+        nvgpu_mutex_init(&g->dbg_sessions_lock);
+        nvgpu_mutex_init(&g->client_lock);
+        nvgpu_mutex_init(&g->poweroff_lock);
+        g->regs_saved = g->regs;
+        g->bar1_saved = g->bar1;
+        g->emc3d_ratio = EMC3D_DEFAULT_RATIO;
+        /* Set DMA parameters to allow larger sgt lists */
+        g->dev->dma_parms = &g->dma_parms;
+        dma_set_max_seg_size(g->dev, UINT_MAX);
+        nvgpu_init_list_node(&g->pending_sema_waits);
+        nvgpu_raw_spinlock_init(&g->pending_sema_waits_lock);
+        nvgpu_init_list_node(&g->profiler_objects);
+}
+static void nvgpu_init_timeout(struct gk20a *g)
+{
+        g->gr_idle_timeout_default = CONFIG_GK20A_DEFAULT_TIMEOUT;
+        if (nvgpu_platform_is_silicon(g))
+                g->timeouts_enabled = true;
+        else if (nvgpu_platform_is_fpga(g)) {
+                g->gr_idle_timeout_default = GK20A_TIMEOUT_FPGA;
+                g->timeouts_enabled = true;
+        }
+}
+static void nvgpu_init_timeslice(struct gk20a *g)
+{
+        g->runlist_interleave = true;
+        g->timeslice_low_priority_us = 1300;
+        g->timeslice_medium_priority_us = 2600;
+        g->timeslice_high_priority_us = 5200;
+        g->min_timeslice_us = 1000;
+        g->max_timeslice_us = 50000;
+}
+static void nvgpu_init_pm_vars(struct gk20a *g)
+{
+        struct gk20a_platform *platform = dev_get_drvdata(g->dev);
+        /*
+         * Set up initial power settings. For non-slicon platforms, disable
+         * power features and for silicon platforms, read from platform data
+         */
+        g->slcg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_slcg : false;
+        g->blcg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_blcg : false;
+        g->elcg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_elcg : false;
+        g->elpg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_elpg : false;
+        g->aelpg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_aelpg : false;
+        g->mscg_enabled =
+                nvgpu_platform_is_silicon(g) ? platform->enable_mscg : false;
+        /* set default values to aelpg parameters */
+        g->pmu.aelpg_param[0] = APCTRL_SAMPLING_PERIOD_PG_DEFAULT_US;
+        g->pmu.aelpg_param[1] = APCTRL_MINIMUM_IDLE_FILTER_DEFAULT_US;
+        g->pmu.aelpg_param[2] = APCTRL_MINIMUM_TARGET_SAVING_DEFAULT_US;
+        g->pmu.aelpg_param[3] = APCTRL_POWER_BREAKEVEN_DEFAULT_US;
+        g->pmu.aelpg_param[4] = APCTRL_CYCLES_PER_SAMPLE_MAX_DEFAULT;
+}
+static void nvgpu_init_mm_vars(struct gk20a *g)
+{
+        struct gk20a_platform *platform = dev_get_drvdata(g->dev);
+        g->mm.bypass_smmu = platform->bypass_smmu;
+        g->mm.disable_bigpage = platform->disable_bigpage;
+        g->mm.vidmem_is_vidmem = platform->vidmem_is_vidmem;
+        nvgpu_mutex_init(&g->mm.tlb_lock);
+        nvgpu_mutex_init(&g->mm.priv_lock);
+}
+static int gk20a_secure_page_alloc(struct device *dev)
+{
+        struct gk20a_platform *platform = dev_get_drvdata(dev);
+        int err = 0;
+        if (platform->secure_page_alloc) {
+                err = platform->secure_page_alloc(dev);
+                if (!err)
+                        platform->secure_alloc_ready = true;
+        }
+        return err;
+}
+int nvgpu_probe(struct gk20a *g,
+                const char *debugfs_symlink,
+                const char *interface_name,
+                struct class *class)
+{
+        struct gk20a_platform *platform = dev_get_drvdata(g->dev);
+        int err = 0;
+        nvgpu_init_vars(g);
+        nvgpu_init_timeout(g);
+        nvgpu_init_timeslice(g);
+        nvgpu_init_pm_vars(g);
+        /* Initialize the platform interface. */
+        err = platform->probe(g->dev);
+        if (err) {
+                dev_err(g->dev, "platform probe failed");
+                return err;
+        }
+        /* platform probe can defer do user init only if probe succeeds */
+        err = gk20a_user_init(g->dev, interface_name, class);
+        if (err)
+                return err;
+        /* Initialise scaling */
+        if (IS_ENABLED(CONFIG_GK20A_DEVFREQ))
+                gk20a_scale_init(g->dev);
+        err = gk20a_secure_page_alloc(g->dev);
+        if (err)
+                dev_err(g->dev,
+                        "failed to allocate secure buffer %d\n", err);
+        if (platform->late_probe) {
+                err = platform->late_probe(g->dev);
+                if (err) {
+                        dev_err(g->dev, "late probe failed");
+                        return err;
+                }
+        }
+        nvgpu_init_mm_vars(g);
+        gk20a_create_sysfs(g->dev);
+        gk20a_debug_init(g->dev, debugfs_symlink);
+        g->dbg_regops_tmp_buf = nvgpu_kzalloc(g, SZ_4K);
+        if (!g->dbg_regops_tmp_buf) {
+                dev_err(g->dev, "couldn't allocate regops tmp buf");
+                return -ENOMEM;
+        }
+        g->dbg_regops_tmp_buf_ops =
+                SZ_4K / sizeof(g->dbg_regops_tmp_buf[0]);
+        g->remove_support = gk20a_remove_support;
+        kref_init(&g->refcount);
+        return 0;
+}
+static const struct firmware *do_request_firmware(struct device *dev,
+                const char *prefix, const char *fw_name, int flags)
+{
+        const struct firmware *fw;
+        char *fw_path = NULL;
+        int path_len, err;
+        if (prefix) {
+                path_len = strlen(prefix) + strlen(fw_name);
+                path_len += 2; /* for the path separator and zero terminator*/
+                fw_path = nvgpu_kzalloc(get_gk20a(dev),
+                                        sizeof(*fw_path) * path_len);
+                if (!fw_path)
+                        return NULL;
+                sprintf(fw_path, "%s/%s", prefix, fw_name);
+                fw_name = fw_path;
+        }
+#if LINUX_VERSION_CODE < KERNEL_VERSION(3,18,0)
+        err = request_firmware(&fw, fw_name, dev);
+#else
+        if (flags & NVGPU_REQUEST_FIRMWARE_NO_WARN)
+                err = request_firmware_direct(&fw, fw_name, dev);
+        else
+                err = request_firmware(&fw, fw_name, dev);
+#endif
+        nvgpu_kfree(get_gk20a(dev), fw_path);
+        if (err)
+                return NULL;
+        return fw;
+}
+/* This is a simple wrapper around request_firmware that takes 'fw_name' and
+ * applies an IP specific relative path prefix to it. The caller is
+ * responsible for calling release_firmware later. */
+const struct firmware *nvgpu_request_firmware(struct gk20a *g,
+                                              const char *fw_name,
+                                              int flags)
+{
+        struct device *dev = g->dev;
+        const struct firmware *fw;
+        /* current->fs is NULL when calling from SYS_EXIT.
+           Add a check here to prevent crash in request_firmware */
+        if (!current->fs || !fw_name)
+                return NULL;
+        BUG_ON(!g->name);
+        fw = do_request_firmware(dev, g->name, fw_name, flags);
+#ifdef CONFIG_TEGRA_GK20A
+        /* TO BE REMOVED - Support loading from legacy SOC specific path. */
+        if (!fw && !(flags & NVGPU_REQUEST_FIRMWARE_NO_SOC)) {
+                struct gk20a_platform *platform = gk20a_get_platform(dev);
+                fw = do_request_firmware(dev,
+                                platform->soc_name, fw_name, flags);
+        }
+#endif
+        return fw;
+}
+/**
+ * cyclic_delta - Returns delta of cyclic integers a and b.
+ *
+ * @a - First integer
+ * @b - Second integer
+ *
+ * Note: if a is ahead of b, delta is positive.
+ */
+static int cyclic_delta(int a, int b)
+{
+        return a - b;
+}
+/**
+ * nvgpu_wait_for_deferred_interrupts - Wait for interrupts to complete
+ *
+ * @g - The GPU to wait on.
+ *
+ * Waits until all interrupt handlers that have been scheduled to run have
+ * completed.
+ */
+void nvgpu_wait_for_deferred_interrupts(struct gk20a *g)
+{
+        int stall_irq_threshold = atomic_read(&g->hw_irq_stall_count);
+        int nonstall_irq_threshold = atomic_read(&g->hw_irq_nonstall_count);
+        /* wait until all stalling irqs are handled */
+        wait_event(g->sw_irq_stall_last_handled_wq,
+                   cyclic_delta(stall_irq_threshold,
+                                atomic_read(&g->sw_irq_stall_last_handled))
+                   <= 0);
+        /* wait until all non-stalling irqs are handled */
+        wait_event(g->sw_irq_nonstall_last_handled_wq,
+                   cyclic_delta(nonstall_irq_threshold,
+                                atomic_read(&g->sw_irq_nonstall_last_handled))
+                   <= 0);
+}

diff --git a/drivers/gpu/nvgpu/common/linux/driver_common.c b/drivers/gpu/nvgpu/common/linux/driver_common.c new file mode 100644 index 00000000..5c96b4e8 --- /dev/null +++ b/drivers/gpu/nvgpu/common/linux/driver_common.c
@@ -0,0 +1,306 @@
	1	/*
	2	* Copyright (c) 2016-2017, NVIDIA CORPORATION. All rights reserved.
	3	*
	4	* This program is free software; you can redistribute it and/or modify it
	5	* under the terms and conditions of the GNU General Public License,
	6	* version 2, as published by the Free Software Foundation.
	7	*
	8	* This program is distributed in the hope it will be useful, but WITHOUT
	9	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	10	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
	11	* more details.
	12	*
	13	* You should have received a copy of the GNU General Public License
	14	* along with this program. If not, see <http://www.gnu.org/licenses/>.
	15	*/
	16
	17	#include <linux/dma-mapping.h>
	18	#include <linux/firmware.h>
	19
	20	#include <nvgpu/kmem.h>
	21	#include <nvgpu/nvgpu_common.h>
	22	#include <nvgpu/soc.h>
	23	#include <nvgpu/bug.h>
	24
	25	#include "gk20a/gk20a_scale.h"
	26	#include "gk20a/gk20a.h"
	27	#include "module.h"
	28
	29	#define EMC3D_DEFAULT_RATIO 750
	30
	31	static void nvgpu_init_vars(struct gk20a *g)
	32	{
	33	struct gk20a_platform *platform = dev_get_drvdata(g->dev);
	34
	35	init_waitqueue_head(&g->sw_irq_stall_last_handled_wq);
	36	init_waitqueue_head(&g->sw_irq_nonstall_last_handled_wq);
	37	gk20a_init_gr(g);
	38
	39	init_rwsem(&g->busy_lock);
	40
	41	nvgpu_spinlock_init(&g->mc_enable_lock);
	42
	43	nvgpu_mutex_init(&platform->railgate_lock);
	44	nvgpu_mutex_init(&g->dbg_sessions_lock);
	45	nvgpu_mutex_init(&g->client_lock);
	46	nvgpu_mutex_init(&g->poweroff_lock);
	47
	48	g->regs_saved = g->regs;
	49	g->bar1_saved = g->bar1;
	50
	51	g->emc3d_ratio = EMC3D_DEFAULT_RATIO;
	52
	53	/* Set DMA parameters to allow larger sgt lists */
	54	g->dev->dma_parms = &g->dma_parms;
	55	dma_set_max_seg_size(g->dev, UINT_MAX);
	56
	57	nvgpu_init_list_node(&g->pending_sema_waits);
	58	nvgpu_raw_spinlock_init(&g->pending_sema_waits_lock);
	59
	60	nvgpu_init_list_node(&g->profiler_objects);
	61	}
	62
	63	static void nvgpu_init_timeout(struct gk20a *g)
	64	{
	65	g->gr_idle_timeout_default = CONFIG_GK20A_DEFAULT_TIMEOUT;
	66	if (nvgpu_platform_is_silicon(g))
	67	g->timeouts_enabled = true;
	68	else if (nvgpu_platform_is_fpga(g)) {
	69	g->gr_idle_timeout_default = GK20A_TIMEOUT_FPGA;
	70	g->timeouts_enabled = true;
	71	}
	72	}
	73
	74	static void nvgpu_init_timeslice(struct gk20a *g)
	75	{
	76	g->runlist_interleave = true;
	77
	78	g->timeslice_low_priority_us = 1300;
	79	g->timeslice_medium_priority_us = 2600;
	80	g->timeslice_high_priority_us = 5200;
	81
	82	g->min_timeslice_us = 1000;
	83	g->max_timeslice_us = 50000;
	84	}
	85
	86	static void nvgpu_init_pm_vars(struct gk20a *g)
	87	{
	88	struct gk20a_platform *platform = dev_get_drvdata(g->dev);
	89
	90	/*
	91	* Set up initial power settings. For non-slicon platforms, disable
	92	* power features and for silicon platforms, read from platform data
	93	*/
	94	g->slcg_enabled =
	95	nvgpu_platform_is_silicon(g) ? platform->enable_slcg : false;
	96	g->blcg_enabled =
	97	nvgpu_platform_is_silicon(g) ? platform->enable_blcg : false;
	98	g->elcg_enabled =
	99	nvgpu_platform_is_silicon(g) ? platform->enable_elcg : false;
	100	g->elpg_enabled =
	101	nvgpu_platform_is_silicon(g) ? platform->enable_elpg : false;
	102	g->aelpg_enabled =
	103	nvgpu_platform_is_silicon(g) ? platform->enable_aelpg : false;
	104	g->mscg_enabled =
	105	nvgpu_platform_is_silicon(g) ? platform->enable_mscg : false;
	106
	107	/* set default values to aelpg parameters */
	108	g->pmu.aelpg_param[0] = APCTRL_SAMPLING_PERIOD_PG_DEFAULT_US;
	109	g->pmu.aelpg_param[1] = APCTRL_MINIMUM_IDLE_FILTER_DEFAULT_US;
	110	g->pmu.aelpg_param[2] = APCTRL_MINIMUM_TARGET_SAVING_DEFAULT_US;
	111	g->pmu.aelpg_param[3] = APCTRL_POWER_BREAKEVEN_DEFAULT_US;
	112	g->pmu.aelpg_param[4] = APCTRL_CYCLES_PER_SAMPLE_MAX_DEFAULT;
	113	}
	114
	115	static void nvgpu_init_mm_vars(struct gk20a *g)
	116	{
	117	struct gk20a_platform *platform = dev_get_drvdata(g->dev);
	118
	119	g->mm.bypass_smmu = platform->bypass_smmu;
	120	g->mm.disable_bigpage = platform->disable_bigpage;
	121	g->mm.vidmem_is_vidmem = platform->vidmem_is_vidmem;
	122
	123	nvgpu_mutex_init(&g->mm.tlb_lock);
	124	nvgpu_mutex_init(&g->mm.priv_lock);
	125	}
	126
	127	static int gk20a_secure_page_alloc(struct device *dev)
	128	{
	129	struct gk20a_platform *platform = dev_get_drvdata(dev);
	130	int err = 0;
	131
	132	if (platform->secure_page_alloc) {
	133	err = platform->secure_page_alloc(dev);
	134	if (!err)
	135	platform->secure_alloc_ready = true;
	136	}
	137
	138	return err;
	139	}
	140
	141	int nvgpu_probe(struct gk20a *g,
	142	const char *debugfs_symlink,
	143	const char *interface_name,
	144	struct class *class)
	145	{
	146	struct gk20a_platform *platform = dev_get_drvdata(g->dev);
	147	int err = 0;
	148
	149	nvgpu_init_vars(g);
	150	nvgpu_init_timeout(g);
	151	nvgpu_init_timeslice(g);
	152	nvgpu_init_pm_vars(g);
	153
	154	/* Initialize the platform interface. */
	155	err = platform->probe(g->dev);
	156	if (err) {
	157	dev_err(g->dev, "platform probe failed");
	158	return err;
	159	}
	160
	161	/* platform probe can defer do user init only if probe succeeds */
	162	err = gk20a_user_init(g->dev, interface_name, class);
	163	if (err)
	164	return err;
	165
	166
	167	/* Initialise scaling */
	168	if (IS_ENABLED(CONFIG_GK20A_DEVFREQ))
	169	gk20a_scale_init(g->dev);
	170
	171	err = gk20a_secure_page_alloc(g->dev);
	172	if (err)
	173	dev_err(g->dev,
	174	"failed to allocate secure buffer %d\n", err);
	175
	176	if (platform->late_probe) {
	177	err = platform->late_probe(g->dev);
	178	if (err) {
	179	dev_err(g->dev, "late probe failed");
	180	return err;
	181	}
	182	}
	183
	184	nvgpu_init_mm_vars(g);
	185
	186	gk20a_create_sysfs(g->dev);
	187	gk20a_debug_init(g->dev, debugfs_symlink);
	188
	189	g->dbg_regops_tmp_buf = nvgpu_kzalloc(g, SZ_4K);
	190	if (!g->dbg_regops_tmp_buf) {
	191	dev_err(g->dev, "couldn't allocate regops tmp buf");
	192	return -ENOMEM;
	193	}
	194	g->dbg_regops_tmp_buf_ops =
	195	SZ_4K / sizeof(g->dbg_regops_tmp_buf[0]);
	196
	197	g->remove_support = gk20a_remove_support;
	198
	199	kref_init(&g->refcount);
	200
	201	return 0;
	202	}
	203
	204	static const struct firmware do_request_firmware(struct device dev,
	205	const char prefix, const char fw_name, int flags)
	206	{
	207	const struct firmware *fw;
	208	char *fw_path = NULL;
	209	int path_len, err;
	210
	211	if (prefix) {
	212	path_len = strlen(prefix) + strlen(fw_name);
	213	path_len += 2; /* for the path separator and zero terminator*/
	214
	215	fw_path = nvgpu_kzalloc(get_gk20a(dev),
	216	sizeof(fw_path) path_len);
	217	if (!fw_path)
	218	return NULL;
	219
	220	sprintf(fw_path, "%s/%s", prefix, fw_name);
	221	fw_name = fw_path;
	222	}
	223
	224	#if LINUX_VERSION_CODE < KERNEL_VERSION(3,18,0)
	225	err = request_firmware(&fw, fw_name, dev);
	226	#else
	227	if (flags & NVGPU_REQUEST_FIRMWARE_NO_WARN)
	228	err = request_firmware_direct(&fw, fw_name, dev);
	229	else
	230	err = request_firmware(&fw, fw_name, dev);
	231	#endif
	232
	233	nvgpu_kfree(get_gk20a(dev), fw_path);
	234	if (err)
	235	return NULL;
	236	return fw;
	237	}
	238
	239	/* This is a simple wrapper around request_firmware that takes 'fw_name' and
	240	* applies an IP specific relative path prefix to it. The caller is
	241	* responsible for calling release_firmware later. */
	242	const struct firmware nvgpu_request_firmware(struct gk20a g,
	243	const char *fw_name,
	244	int flags)
	245	{
	246	struct device *dev = g->dev;
	247	const struct firmware *fw;
	248
	249	/* current->fs is NULL when calling from SYS_EXIT.
	250	Add a check here to prevent crash in request_firmware */
	251	if (!current->fs \|\| !fw_name)
	252	return NULL;
	253
	254	BUG_ON(!g->name);
	255	fw = do_request_firmware(dev, g->name, fw_name, flags);
	256
	257	#ifdef CONFIG_TEGRA_GK20A
	258	/* TO BE REMOVED - Support loading from legacy SOC specific path. */
	259	if (!fw && !(flags & NVGPU_REQUEST_FIRMWARE_NO_SOC)) {
	260	struct gk20a_platform *platform = gk20a_get_platform(dev);
	261	fw = do_request_firmware(dev,
	262	platform->soc_name, fw_name, flags);
	263	}
	264	#endif
	265
	266	return fw;
	267	}
	268
	269	/**
	270	* cyclic_delta - Returns delta of cyclic integers a and b.
	271	*
	272	* @a - First integer
	273	* @b - Second integer
	274	*
	275	* Note: if a is ahead of b, delta is positive.
	276	*/
	277	static int cyclic_delta(int a, int b)
	278	{
	279	return a - b;
	280	}
	281
	282	/**
	283	* nvgpu_wait_for_deferred_interrupts - Wait for interrupts to complete
	284	*
	285	* @g - The GPU to wait on.
	286	*
	287	* Waits until all interrupt handlers that have been scheduled to run have
	288	* completed.
	289	*/
	290	void nvgpu_wait_for_deferred_interrupts(struct gk20a *g)
	291	{
	292	int stall_irq_threshold = atomic_read(&g->hw_irq_stall_count);
	293	int nonstall_irq_threshold = atomic_read(&g->hw_irq_nonstall_count);
	294
	295	/* wait until all stalling irqs are handled */
	296	wait_event(g->sw_irq_stall_last_handled_wq,
	297	cyclic_delta(stall_irq_threshold,
	298	atomic_read(&g->sw_irq_stall_last_handled))
	299	<= 0);
	300
	301	/* wait until all non-stalling irqs are handled */
	302	wait_event(g->sw_irq_nonstall_last_handled_wq,
	303	cyclic_delta(nonstall_irq_threshold,
	304	atomic_read(&g->sw_irq_nonstall_last_handled))
	305	<= 0);
	306	}