summaryrefslogtreecommitdiffstats
path: root/drivers/gpu/nvgpu/common/linux/driver_common.c
diff options
context:
space:
mode:
Diffstat (limited to 'drivers/gpu/nvgpu/common/linux/driver_common.c')
-rw-r--r--drivers/gpu/nvgpu/common/linux/driver_common.c306
1 files changed, 306 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/linux/driver_common.c b/drivers/gpu/nvgpu/common/linux/driver_common.c
new file mode 100644
index 00000000..5c96b4e8
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/linux/driver_common.c
@@ -0,0 +1,306 @@
1/*
2 * Copyright (c) 2016-2017, NVIDIA CORPORATION. All rights reserved.
3 *
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms and conditions of the GNU General Public License,
6 * version 2, as published by the Free Software Foundation.
7 *
8 * This program is distributed in the hope it will be useful, but WITHOUT
9 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
11 * more details.
12 *
13 * You should have received a copy of the GNU General Public License
14 * along with this program. If not, see <http://www.gnu.org/licenses/>.
15 */
16
17#include <linux/dma-mapping.h>
18#include <linux/firmware.h>
19
20#include <nvgpu/kmem.h>
21#include <nvgpu/nvgpu_common.h>
22#include <nvgpu/soc.h>
23#include <nvgpu/bug.h>
24
25#include "gk20a/gk20a_scale.h"
26#include "gk20a/gk20a.h"
27#include "module.h"
28
29#define EMC3D_DEFAULT_RATIO 750
30
31static void nvgpu_init_vars(struct gk20a *g)
32{
33 struct gk20a_platform *platform = dev_get_drvdata(g->dev);
34
35 init_waitqueue_head(&g->sw_irq_stall_last_handled_wq);
36 init_waitqueue_head(&g->sw_irq_nonstall_last_handled_wq);
37 gk20a_init_gr(g);
38
39 init_rwsem(&g->busy_lock);
40
41 nvgpu_spinlock_init(&g->mc_enable_lock);
42
43 nvgpu_mutex_init(&platform->railgate_lock);
44 nvgpu_mutex_init(&g->dbg_sessions_lock);
45 nvgpu_mutex_init(&g->client_lock);
46 nvgpu_mutex_init(&g->poweroff_lock);
47
48 g->regs_saved = g->regs;
49 g->bar1_saved = g->bar1;
50
51 g->emc3d_ratio = EMC3D_DEFAULT_RATIO;
52
53 /* Set DMA parameters to allow larger sgt lists */
54 g->dev->dma_parms = &g->dma_parms;
55 dma_set_max_seg_size(g->dev, UINT_MAX);
56
57 nvgpu_init_list_node(&g->pending_sema_waits);
58 nvgpu_raw_spinlock_init(&g->pending_sema_waits_lock);
59
60 nvgpu_init_list_node(&g->profiler_objects);
61}
62
63static void nvgpu_init_timeout(struct gk20a *g)
64{
65 g->gr_idle_timeout_default = CONFIG_GK20A_DEFAULT_TIMEOUT;
66 if (nvgpu_platform_is_silicon(g))
67 g->timeouts_enabled = true;
68 else if (nvgpu_platform_is_fpga(g)) {
69 g->gr_idle_timeout_default = GK20A_TIMEOUT_FPGA;
70 g->timeouts_enabled = true;
71 }
72}
73
74static void nvgpu_init_timeslice(struct gk20a *g)
75{
76 g->runlist_interleave = true;
77
78 g->timeslice_low_priority_us = 1300;
79 g->timeslice_medium_priority_us = 2600;
80 g->timeslice_high_priority_us = 5200;
81
82 g->min_timeslice_us = 1000;
83 g->max_timeslice_us = 50000;
84}
85
86static void nvgpu_init_pm_vars(struct gk20a *g)
87{
88 struct gk20a_platform *platform = dev_get_drvdata(g->dev);
89
90 /*
91 * Set up initial power settings. For non-slicon platforms, disable
92 * power features and for silicon platforms, read from platform data
93 */
94 g->slcg_enabled =
95 nvgpu_platform_is_silicon(g) ? platform->enable_slcg : false;
96 g->blcg_enabled =
97 nvgpu_platform_is_silicon(g) ? platform->enable_blcg : false;
98 g->elcg_enabled =
99 nvgpu_platform_is_silicon(g) ? platform->enable_elcg : false;
100 g->elpg_enabled =
101 nvgpu_platform_is_silicon(g) ? platform->enable_elpg : false;
102 g->aelpg_enabled =
103 nvgpu_platform_is_silicon(g) ? platform->enable_aelpg : false;
104 g->mscg_enabled =
105 nvgpu_platform_is_silicon(g) ? platform->enable_mscg : false;
106
107 /* set default values to aelpg parameters */
108 g->pmu.aelpg_param[0] = APCTRL_SAMPLING_PERIOD_PG_DEFAULT_US;
109 g->pmu.aelpg_param[1] = APCTRL_MINIMUM_IDLE_FILTER_DEFAULT_US;
110 g->pmu.aelpg_param[2] = APCTRL_MINIMUM_TARGET_SAVING_DEFAULT_US;
111 g->pmu.aelpg_param[3] = APCTRL_POWER_BREAKEVEN_DEFAULT_US;
112 g->pmu.aelpg_param[4] = APCTRL_CYCLES_PER_SAMPLE_MAX_DEFAULT;
113}
114
115static void nvgpu_init_mm_vars(struct gk20a *g)
116{
117 struct gk20a_platform *platform = dev_get_drvdata(g->dev);
118
119 g->mm.bypass_smmu = platform->bypass_smmu;
120 g->mm.disable_bigpage = platform->disable_bigpage;
121 g->mm.vidmem_is_vidmem = platform->vidmem_is_vidmem;
122
123 nvgpu_mutex_init(&g->mm.tlb_lock);
124 nvgpu_mutex_init(&g->mm.priv_lock);
125}
126
127static int gk20a_secure_page_alloc(struct device *dev)
128{
129 struct gk20a_platform *platform = dev_get_drvdata(dev);
130 int err = 0;
131
132 if (platform->secure_page_alloc) {
133 err = platform->secure_page_alloc(dev);
134 if (!err)
135 platform->secure_alloc_ready = true;
136 }
137
138 return err;
139}
140
141int nvgpu_probe(struct gk20a *g,
142 const char *debugfs_symlink,
143 const char *interface_name,
144 struct class *class)
145{
146 struct gk20a_platform *platform = dev_get_drvdata(g->dev);
147 int err = 0;
148
149 nvgpu_init_vars(g);
150 nvgpu_init_timeout(g);
151 nvgpu_init_timeslice(g);
152 nvgpu_init_pm_vars(g);
153
154 /* Initialize the platform interface. */
155 err = platform->probe(g->dev);
156 if (err) {
157 dev_err(g->dev, "platform probe failed");
158 return err;
159 }
160
161 /* platform probe can defer do user init only if probe succeeds */
162 err = gk20a_user_init(g->dev, interface_name, class);
163 if (err)
164 return err;
165
166
167 /* Initialise scaling */
168 if (IS_ENABLED(CONFIG_GK20A_DEVFREQ))
169 gk20a_scale_init(g->dev);
170
171 err = gk20a_secure_page_alloc(g->dev);
172 if (err)
173 dev_err(g->dev,
174 "failed to allocate secure buffer %d\n", err);
175
176 if (platform->late_probe) {
177 err = platform->late_probe(g->dev);
178 if (err) {
179 dev_err(g->dev, "late probe failed");
180 return err;
181 }
182 }
183
184 nvgpu_init_mm_vars(g);
185
186 gk20a_create_sysfs(g->dev);
187 gk20a_debug_init(g->dev, debugfs_symlink);
188
189 g->dbg_regops_tmp_buf = nvgpu_kzalloc(g, SZ_4K);
190 if (!g->dbg_regops_tmp_buf) {
191 dev_err(g->dev, "couldn't allocate regops tmp buf");
192 return -ENOMEM;
193 }
194 g->dbg_regops_tmp_buf_ops =
195 SZ_4K / sizeof(g->dbg_regops_tmp_buf[0]);
196
197 g->remove_support = gk20a_remove_support;
198
199 kref_init(&g->refcount);
200
201 return 0;
202}
203
204static const struct firmware *do_request_firmware(struct device *dev,
205 const char *prefix, const char *fw_name, int flags)
206{
207 const struct firmware *fw;
208 char *fw_path = NULL;
209 int path_len, err;
210
211 if (prefix) {
212 path_len = strlen(prefix) + strlen(fw_name);
213 path_len += 2; /* for the path separator and zero terminator*/
214
215 fw_path = nvgpu_kzalloc(get_gk20a(dev),
216 sizeof(*fw_path) * path_len);
217 if (!fw_path)
218 return NULL;
219
220 sprintf(fw_path, "%s/%s", prefix, fw_name);
221 fw_name = fw_path;
222 }
223
224#if LINUX_VERSION_CODE < KERNEL_VERSION(3,18,0)
225 err = request_firmware(&fw, fw_name, dev);
226#else
227 if (flags & NVGPU_REQUEST_FIRMWARE_NO_WARN)
228 err = request_firmware_direct(&fw, fw_name, dev);
229 else
230 err = request_firmware(&fw, fw_name, dev);
231#endif
232
233 nvgpu_kfree(get_gk20a(dev), fw_path);
234 if (err)
235 return NULL;
236 return fw;
237}
238
239/* This is a simple wrapper around request_firmware that takes 'fw_name' and
240 * applies an IP specific relative path prefix to it. The caller is
241 * responsible for calling release_firmware later. */
242const struct firmware *nvgpu_request_firmware(struct gk20a *g,
243 const char *fw_name,
244 int flags)
245{
246 struct device *dev = g->dev;
247 const struct firmware *fw;
248
249 /* current->fs is NULL when calling from SYS_EXIT.
250 Add a check here to prevent crash in request_firmware */
251 if (!current->fs || !fw_name)
252 return NULL;
253
254 BUG_ON(!g->name);
255 fw = do_request_firmware(dev, g->name, fw_name, flags);
256
257#ifdef CONFIG_TEGRA_GK20A
258 /* TO BE REMOVED - Support loading from legacy SOC specific path. */
259 if (!fw && !(flags & NVGPU_REQUEST_FIRMWARE_NO_SOC)) {
260 struct gk20a_platform *platform = gk20a_get_platform(dev);
261 fw = do_request_firmware(dev,
262 platform->soc_name, fw_name, flags);
263 }
264#endif
265
266 return fw;
267}
268
269/**
270 * cyclic_delta - Returns delta of cyclic integers a and b.
271 *
272 * @a - First integer
273 * @b - Second integer
274 *
275 * Note: if a is ahead of b, delta is positive.
276 */
277static int cyclic_delta(int a, int b)
278{
279 return a - b;
280}
281
282/**
283 * nvgpu_wait_for_deferred_interrupts - Wait for interrupts to complete
284 *
285 * @g - The GPU to wait on.
286 *
287 * Waits until all interrupt handlers that have been scheduled to run have
288 * completed.
289 */
290void nvgpu_wait_for_deferred_interrupts(struct gk20a *g)
291{
292 int stall_irq_threshold = atomic_read(&g->hw_irq_stall_count);
293 int nonstall_irq_threshold = atomic_read(&g->hw_irq_nonstall_count);
294
295 /* wait until all stalling irqs are handled */
296 wait_event(g->sw_irq_stall_last_handled_wq,
297 cyclic_delta(stall_irq_threshold,
298 atomic_read(&g->sw_irq_stall_last_handled))
299 <= 0);
300
301 /* wait until all non-stalling irqs are handled */
302 wait_event(g->sw_irq_nonstall_last_handled_wq,
303 cyclic_delta(nonstall_irq_threshold,
304 atomic_read(&g->sw_irq_nonstall_last_handled))
305 <= 0);
306}