gpu: nvgpu: Add bus HAL

Add bus HAL and move all bus-related hardware sequencing to that file: BAR1 binding, timer access, and interrupt handling.

Change-Id: Ibc5f5797dc338de10749b446a7bdbcae600fecb4
Signed-off-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-on: http://git-master/r/1323353
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
author: Terje Bergstrom <tbergstrom@nvidia.com> 2017-03-17 14:09:44 -0400
committer: mobile promotions <svcmobile_promotions@nvidia.com> 2017-03-23 11:44:07 -0400
commit: 4492c62ffe9398bd4457f6f1c2773e40afe909fb (patch)
tree: 5d792f81d97844278f4eca665a8b4778fa93dc35
parent: 33f637585ecd617a9f4423f56e2aa6df0691ac64 (diff)
21 files changed, 306 insertions, 177 deletions
diff --git a/drivers/gpu/nvgpu/Makefile.nvgpu b/drivers/gpu/nvgpu/Makefile.nvgpu
index 3852e728..9cf5195b 100644
--- a/drivers/gpu/nvgpu/Makefile.nvgpu
+++ b/drivers/gpu/nvgpu/Makefile.nvgpu
@@ -34,6 +34,7 @@ nvgpu-y := \
        common/semaphore.o \
        common/vbios/bios.o \
        gk20a/gk20a.o \
+        gk20a/bus_gk20a.o \
        gk20a/sched_gk20a.o \
        gk20a/as_gk20a.o \
        gk20a/ctrl_gk20a.o \
@@ -67,6 +68,7 @@ nvgpu-y := \
        gk20a/mc_gk20a.o \
        gk20a/sim_gk20a.o \
        gm20b/hal_gm20b.o \
+        gm20b/bus_gm20b.o \
        gm20b/ltc_gm20b.o \
        gm20b/ce2_gm20b.o \
        gm20b/gr_gm20b.o \
diff --git a/drivers/gpu/nvgpu/clk/clk_arb.c b/drivers/gpu/nvgpu/clk/clk_arb.c
index 30447d3e..fc821235 100644
--- a/drivers/gpu/nvgpu/clk/clk_arb.c
+++ b/drivers/gpu/nvgpu/clk/clk_arb.c
@@ -1062,7 +1062,7 @@ static void nvgpu_clk_arb_run_arbiter_cb(struct work_struct *work)
                goto exit_arb;
 #ifdef CONFIG_DEBUG_FS
-        g->ops.read_ptimer(g, &t0);
+        g->ops.bus.read_ptimer(g, &t0);
 #endif
        /* Only one arbiter should be running */
@@ -1248,7 +1248,7 @@ static void nvgpu_clk_arb_run_arbiter_cb(struct work_struct *work)
        wake_up_interruptible(&arb->request_wq);
 #ifdef CONFIG_DEBUG_FS
-        g->ops.read_ptimer(g, &t1);
+        g->ops.bus.read_ptimer(g, &t1);
        debug = arb->debug == &arb->debug_pool[0] ?
                &arb->debug_pool[1] : &arb->debug_pool[0];
diff --git a/drivers/gpu/nvgpu/clk/clk_mclk.c b/drivers/gpu/nvgpu/clk/clk_mclk.c
index c2e9b35c..e5452051 100644
--- a/drivers/gpu/nvgpu/clk/clk_mclk.c
+++ b/drivers/gpu/nvgpu/clk/clk_mclk.c
@@ -2311,7 +2311,7 @@ int clk_mclkseq_change_mclk_gddr5(struct gk20a *g, u16 val)
        pseq_cmd->cmd_type = NV_PMU_SEQ_CMD_ID_RUN_SCRIPT;
 #ifdef CONFIG_DEBUG_FS
-        g->ops.read_ptimer(g, &t0);
+        g->ops.bus.read_ptimer(g, &t0);
 #endif
        if (speed == gk20a_mclk_high_speed) {
@@ -2362,7 +2362,7 @@ int clk_mclkseq_change_mclk_gddr5(struct gk20a *g, u16 val)
        mclk->speed = speed;
 #ifdef CONFIG_DEBUG_FS
-        g->ops.read_ptimer(g, &t1);
+        g->ops.bus.read_ptimer(g, &t1);
        nvgpu_mutex_acquire(&mclk->data_lock);
        mclk->switch_num++;
diff --git a/drivers/gpu/nvgpu/gk20a/bus_gk20a.c b/drivers/gpu/nvgpu/gk20a/bus_gk20a.c
new file mode 100644
index 00000000..fda1f80e
--- /dev/null
+++ b/drivers/gpu/nvgpu/gk20a/bus_gk20a.c
@@ -0,0 +1,156 @@
+/*
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+#include <soc/tegra/chip-id.h>
+#include <nvgpu/page_allocator.h>
+#include "gk20a.h"
+#include <nvgpu/hw/gk20a/hw_bus_gk20a.h>
+#include <nvgpu/hw/gk20a/hw_mc_gk20a.h>
+#include <nvgpu/hw/gk20a/hw_gr_gk20a.h>
+#include <nvgpu/hw/gk20a/hw_timer_gk20a.h>
+/*
+ * Program the PRI timeout register and the PBUS interrupt enables.
+ *
+ * On silicon the PRI timeout is written enabled, with the period taken from
+ * the platform's default_pri_timeout when that is non-zero and 0x186A0
+ * otherwise, and the PRI squash, FECS error and PRI timeout bits are set in
+ * bus_intr_en_0. On every other platform the timeout is written disabled
+ * (period 0x186A0) and bus_intr_en_0 is cleared.
+ */
+void gk20a_bus_init_hw(struct gk20a *g)
+{
+        struct gk20a_platform *platform = gk20a_get_platform(g->dev);
+        u32 pri_timeout;
+        u32 intr_en;
+
+        if (tegra_platform_is_silicon()) {
+                pri_timeout = timer_pri_timeout_period_f(
+                                platform->default_pri_timeout ?
+                                        platform->default_pri_timeout :
+                                        0x186A0) |
+                        timer_pri_timeout_en_en_enabled_f();
+                intr_en = bus_intr_en_0_pri_squash_m() |
+                        bus_intr_en_0_pri_fecserr_m() |
+                        bus_intr_en_0_pri_timeout_m();
+        } else {
+                pri_timeout = timer_pri_timeout_period_f(0x186A0) |
+                        timer_pri_timeout_en_en_disabled_f();
+                intr_en = 0x0;
+        }
+
+        /* The PRI timeout is programmed before the interrupt enables. */
+        gk20a_writel(g, timer_pri_timeout_r(), pri_timeout);
+        gk20a_writel(g, bus_intr_en_0_r(), intr_en);
+}
+/*
+ * PBUS interrupt service routine.
+ *
+ * Samples bus_intr_0. If any of the PRI squash, FECS error or PRI timeout
+ * bits are pending, the PMC enable register and the PTIMER PRI timeout
+ * save/errcode registers are dumped to the interrupt debug log and the two
+ * save registers are zeroed. Pending bits outside that set are reported as
+ * unhandled. Finally the sampled value is written back to bus_intr_0.
+ */
+void gk20a_bus_isr(struct gk20a *g)
+{
+        const u32 pri_err_mask = bus_intr_0_pri_squash_m() |
+                                 bus_intr_0_pri_fecserr_m() |
+                                 bus_intr_0_pri_timeout_m();
+        u32 val, err_code;
+
+        val = gk20a_readl(g, bus_intr_0_r());
+        if (val & pri_err_mask) {
+                gk20a_dbg(gpu_dbg_intr, "pmc_enable : 0x%x",
+                        gk20a_readl(g, mc_enable_r()));
+                gk20a_dbg(gpu_dbg_intr, "NV_PBUS_INTR_0 : 0x%x", val);
+                gk20a_dbg(gpu_dbg_intr,
+                        "NV_PTIMER_PRI_TIMEOUT_SAVE_0: 0x%x\n",
+                        gk20a_readl(g, timer_pri_timeout_save_0_r()));
+                gk20a_dbg(gpu_dbg_intr,
+                        "NV_PTIMER_PRI_TIMEOUT_SAVE_1: 0x%x\n",
+                        gk20a_readl(g, timer_pri_timeout_save_1_r()));
+                err_code = gk20a_readl(g, timer_pri_timeout_fecs_errcode_r());
+                gk20a_dbg(gpu_dbg_intr,
+                        "NV_PTIMER_PRI_TIMEOUT_FECS_ERRCODE: 0x%x\n",
+                        err_code);
+                /* For this specific FECS error code also dump GPC0 FS state. */
+                if (err_code == 0xbadf13)
+                        gk20a_dbg(gpu_dbg_intr,
+                        "NV_PGRAPH_PRI_GPC0_GPCCS_FS_GPC: 0x%x\n",
+                        gk20a_readl(g, gr_gpc0_fs_gpc_r()));
+                gk20a_writel(g, timer_pri_timeout_save_0_r(), 0);
+                gk20a_writel(g, timer_pri_timeout_save_1_r(), 0);
+        }
+
+        /*
+         * Only bits that the branch above does not cover are unhandled;
+         * a plain "if (val)" would also flag the PRI errors just dumped.
+         */
+        if (val & ~pri_err_mask)
+                gk20a_dbg(gpu_dbg_intr,
+                        "Unhandled pending pbus interrupt\n");
+
+        /*
+         * Write every sampled bit back, serviced or not.
+         * NOTE(review): presumably write-one-to-clear - confirm against
+         * the bus_intr_0 register description.
+         */
+        gk20a_writel(g, bus_intr_0_r(), val);
+}
+/*
+ * Read the 64-bit GPU timer into *value.
+ *
+ * The timer is exposed as two 32-bit registers. The high word is read
+ * before and after the low word; a sample is accepted only when both high
+ * reads agree, otherwise the low word wrapped in between and the read is
+ * retried with the newer high word as the reference. At most three
+ * attempts are made.
+ *
+ * Returns 0 on success, -EINVAL if value is NULL, or -EBUSY if no
+ * consistent sample was obtained.
+ */
+int gk20a_read_ptimer(struct gk20a *g, u64 *value)
+{
+        unsigned int attempts_left = 3;
+        u32 hi_before;
+
+        if (!value)
+                return -EINVAL;
+
+        /* reference high word for the first attempt */
+        hi_before = gk20a_readl(g, timer_time_1_r());
+
+        while (attempts_left--) {
+                u32 lo = gk20a_readl(g, timer_time_0_r());
+                u32 hi_after = gk20a_readl(g, timer_time_1_r());
+
+                if (hi_after != hi_before) {
+                        /* low word wrapped between the reads, try again */
+                        hi_before = hi_after;
+                        continue;
+                }
+
+                *value = ((u64)hi_after << 32) | lo;
+                return 0;
+        }
+
+        /* ran out of attempts */
+        gk20a_err(dev_from_gk20a(g), "failed to read ptimer");
+        return -EBUSY;
+}
+/*
+ * Point the BAR1 block register at the given instance block.
+ *
+ * The instance block address is shifted down by
+ * bar1_instance_block_shift_gk20a() and written, together with the aperture
+ * target selected by gk20a_aperture_mask() and the virtual mode field, to
+ * bus_bar1_block. Always returns 0.
+ */
+static int gk20a_bus_bar1_bind(struct gk20a *g, struct mem_desc *bar1_inst)
+{
+        u64 inst_addr = gk20a_mm_inst_block_addr(g, bar1_inst);
+        u32 inst_ptr = (u32)(inst_addr >>
+                             bar1_instance_block_shift_gk20a());
+        u32 bar1_block;
+
+        gk20a_dbg_info("bar1 inst block ptr: 0x%08x", inst_ptr);
+
+        bar1_block = gk20a_aperture_mask(g, bar1_inst,
+                        bus_bar1_block_target_sys_mem_ncoh_f(),
+                        bus_bar1_block_target_vid_mem_f());
+        bar1_block |= bus_bar1_block_mode_virtual_f();
+        bar1_block |= bus_bar1_block_ptr_f(inst_ptr);
+
+        gk20a_writel(g, bus_bar1_block_r(), bar1_block);
+
+        return 0;
+}
+/* Install the gk20a implementations of all four bus HAL hooks in gops. */
+void gk20a_init_bus(struct gpu_ops *gops)
+{
+        gops->bus.bar1_bind = gk20a_bus_bar1_bind;
+        gops->bus.read_ptimer = gk20a_read_ptimer;
+        gops->bus.isr = gk20a_bus_isr;
+        gops->bus.init_hw = gk20a_bus_init_hw;
+}
diff --git a/drivers/gpu/nvgpu/gk20a/bus_gk20a.h b/drivers/gpu/nvgpu/gk20a/bus_gk20a.h
new file mode 100644
index 00000000..01526f06
--- /dev/null
+++ b/drivers/gpu/nvgpu/gk20a/bus_gk20a.h
@@ -0,0 +1,29 @@
+/*
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+#ifndef BUS_GK20A_H
+#define BUS_GK20A_H
+struct gk20a;
+struct gpu_ops;
+struct mem_desc;
+void gk20a_init_bus(struct gpu_ops *gops); /* fills in gops->bus */
+void gk20a_bus_isr(struct gk20a *g); /* PBUS interrupt handler */
+int gk20a_read_ptimer(struct gk20a *g, u64 *value); /* 0 or -errno */
+void gk20a_bus_init_hw(struct gk20a *g); /* PRI timeout + bus intr enables */
+#endif /* BUS_GK20A_H */
diff --git a/drivers/gpu/nvgpu/gk20a/ctrl_gk20a.c b/drivers/gpu/nvgpu/gk20a/ctrl_gk20a.c
index e6626c4a..67971369 100644
--- a/drivers/gpu/nvgpu/gk20a/ctrl_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/ctrl_gk20a.c
@@ -725,7 +725,7 @@ static int nvgpu_gpu_get_gpu_time(
        if (err)
                return err;
-        err = g->ops.read_ptimer(g, &time);
+        err = g->ops.bus.read_ptimer(g, &time);
        if (!err)
                args->gpu_timestamp = time;
diff --git a/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c b/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
index 4ad2abd6..0736a03b 100644
--- a/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/ctxsw_trace_gk20a.c
@@ -686,7 +686,7 @@ void gk20a_ctxsw_trace_channel_reset(struct gk20a *g, struct channel_gk20a *ch)
        if (!g->ctxsw_trace)
                return;
-        g->ops.read_ptimer(g, &entry.timestamp);
+        g->ops.bus.read_ptimer(g, &entry.timestamp);
        gk20a_ctxsw_trace_write(g, &entry);
        gk20a_ctxsw_trace_wake_up(g, 0);
 #endif
@@ -706,7 +706,7 @@ void gk20a_ctxsw_trace_tsg_reset(struct gk20a *g, struct tsg_gk20a *tsg)
        if (!g->ctxsw_trace)
                return;
-        g->ops.read_ptimer(g, &entry.timestamp);
+        g->ops.bus.read_ptimer(g, &entry.timestamp);
        gk20a_ctxsw_trace_write(g, &entry);
        gk20a_ctxsw_trace_wake_up(g, 0);
 #endif
diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.c b/drivers/gpu/nvgpu/gk20a/gk20a.c
index 76484dd5..72528758 100644
--- a/drivers/gpu/nvgpu/gk20a/gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/gk20a.c
@@ -57,6 +57,7 @@
 #include "hal.h"
 #include "vgpu/vgpu.h"
 #include "pci.h"
+#include "bus_gk20a.h"
 #ifdef CONFIG_ARCH_TEGRA_18x_SOC
 #include "pstate/pstate.h"
 #endif
@@ -70,11 +71,8 @@
 #endif
 #include <nvgpu/hw/gk20a/hw_mc_gk20a.h>
-#include <nvgpu/hw/gk20a/hw_timer_gk20a.h>
-#include <nvgpu/hw/gk20a/hw_bus_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_top_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_ltc_gk20a.h>
-#include <nvgpu/hw/gk20a/hw_gr_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_fb_gk20a.h>
@@ -330,42 +328,6 @@ static irqreturn_t gk20a_intr_isr_nonstall(int irq, void *dev_id)
        return g->ops.mc.isr_nonstall(g);
 }
-void gk20a_pbus_isr(struct gk20a *g)
-{
-        u32 val, err_code;
-        val = gk20a_readl(g, bus_intr_0_r());
-        if (val & (bus_intr_0_pri_squash_m() |
-                        bus_intr_0_pri_fecserr_m() |
-                        bus_intr_0_pri_timeout_m())) {
-                gk20a_dbg(gpu_dbg_intr, "pmc_enable : 0x%x",
-                        gk20a_readl(g, mc_enable_r()));
-                gk20a_dbg(gpu_dbg_intr, "NV_PBUS_INTR_0 : 0x%x", val);
-                gk20a_dbg(gpu_dbg_intr,
-                        "NV_PTIMER_PRI_TIMEOUT_SAVE_0: 0x%x\n",
-                        gk20a_readl(g, timer_pri_timeout_save_0_r()));
-                gk20a_dbg(gpu_dbg_intr,
-                        "NV_PTIMER_PRI_TIMEOUT_SAVE_1: 0x%x\n",
-                        gk20a_readl(g, timer_pri_timeout_save_1_r()));
-                err_code = gk20a_readl(g, timer_pri_timeout_fecs_errcode_r());
-                gk20a_dbg(gpu_dbg_intr,
-                        "NV_PTIMER_PRI_TIMEOUT_FECS_ERRCODE: 0x%x\n",
-                        err_code);
-                if (err_code == 0xbadf13)
-                        gk20a_dbg(gpu_dbg_intr,
-                        "NV_PGRAPH_PRI_GPC0_GPCCS_FS_GPC: 0x%x\n",
-                        gk20a_readl(g, gr_gpc0_fs_gpc_r()));
-                gk20a_writel(g, timer_pri_timeout_save_0_r(), 0);
-                gk20a_writel(g, timer_pri_timeout_save_1_r(), 0);
-        }
-        if (val)
-                gk20a_dbg(gpu_dbg_intr,
-                        "Unhandled pending pbus interrupt\n");
-        gk20a_writel(g, bus_intr_0_r(), val);
-}
 static irqreturn_t gk20a_intr_thread_stall(int irq, void *dev_id)
 {
        struct gk20a *g = dev_id;
@@ -596,13 +558,7 @@ int gk20a_pm_finalize_poweron(struct device *dev)
        if (err)
                goto done;
-        if (!tegra_platform_is_silicon())
+        g->ops.bus.init_hw(g);
-                gk20a_writel(g, bus_intr_en_0_r(), 0x0);
-        else
-                gk20a_writel(g, bus_intr_en_0_r(),
-                                bus_intr_en_0_pri_squash_m() |
-                                bus_intr_en_0_pri_fecserr_m() |
-                                bus_intr_en_0_pri_timeout_m());
        if (g->ops.clk.disable_slowboot)
                g->ops.clk.disable_slowboot(g);
@@ -630,22 +586,6 @@ int gk20a_pm_finalize_poweron(struct device *dev)
                }
        }
-        /* enable pri timeout only on silicon */
-        if (tegra_platform_is_silicon()) {
-                gk20a_writel(g,
-                        timer_pri_timeout_r(),
-                        timer_pri_timeout_period_f(
-                                platform->default_pri_timeout ?
-                                        platform->default_pri_timeout :
-                                                                0x186A0) |
-                        timer_pri_timeout_en_en_enabled_f());
-        } else {
-                gk20a_writel(g,
-                        timer_pri_timeout_r(),
-                        timer_pri_timeout_period_f(0x186A0) |
-                        timer_pri_timeout_en_en_disabled_f());
-        }
        err = gk20a_init_fifo_reset_enable_hw(g);
        if (err) {
                gk20a_err(dev, "failed to reset gk20a fifo");
@@ -1910,46 +1850,6 @@ int gk20a_init_gpu_characteristics(struct gk20a *g)
        return 0;
 }
-int gk20a_read_ptimer(struct gk20a *g, u64 *value)
-{
-        const unsigned int max_iterations = 3;
-        unsigned int i = 0;
-        u32 gpu_timestamp_hi_prev = 0;
-        if (!value)
-                return -EINVAL;
-        /* Note. The GPU nanosecond timer consists of two 32-bit
-         * registers (high & low). To detect a possible low register
-         * wrap-around between the reads, we need to read the high
-         * register before and after low. The wraparound happens
-         * approximately once per 4 secs. */
-        /* get initial gpu_timestamp_hi value */
-        gpu_timestamp_hi_prev = gk20a_readl(g, timer_time_1_r());
-        for (i = 0; i < max_iterations; ++i) {
-                u32 gpu_timestamp_hi = 0;
-                u32 gpu_timestamp_lo = 0;
-                gpu_timestamp_lo = gk20a_readl(g, timer_time_0_r());
-                gpu_timestamp_hi = gk20a_readl(g, timer_time_1_r());
-                if (gpu_timestamp_hi == gpu_timestamp_hi_prev) {
-                        *value = (((u64)gpu_timestamp_hi) << 32) |
-                                gpu_timestamp_lo;
-                        return 0;
-                }
-                /* wrap-around detected, retry */
-                gpu_timestamp_hi_prev = gpu_timestamp_hi;
-        }
-        /* too many iterations, bail out */
-        gk20a_err(dev_from_gk20a(g), "failed to read ptimer");
-        return -EBUSY;
-}
 /*
 * Free the gk20a struct.
 */
diff --git a/drivers/gpu/nvgpu/gk20a/gk20a.h b/drivers/gpu/nvgpu/gk20a/gk20a.h
index 7c836b3c..8d03cc9a 100644
--- a/drivers/gpu/nvgpu/gk20a/gk20a.h
+++ b/drivers/gpu/nvgpu/gk20a/gk20a.h
@@ -629,7 +629,6 @@ struct gpu_ops {
                                struct vm_gk20a *vm);
                u64 (*get_iova_addr)(struct gk20a *g, struct scatterlist *sgl,
                                         u32 flags);
-                int (*bar1_bind)(struct gk20a *g, struct mem_desc *bar1_inst);
                size_t (*get_vidmem_size)(struct gk20a *g);
                void (*init_inst_block)(struct mem_desc *inst_block,
                                struct vm_gk20a *vm, u32 big_page_size);
@@ -773,7 +772,13 @@ struct gpu_ops {
        int (*get_litter_value)(struct gk20a *g, int value);
        int (*chip_init_gpu_characteristics)(struct gk20a *g);
-        int (*read_ptimer)(struct gk20a *g, u64 *value);
+        struct {
+                void (*init_hw)(struct gk20a *g);
+                void (*isr)(struct gk20a *g);
+                int (*read_ptimer)(struct gk20a *g, u64 *value);
+                int (*bar1_bind)(struct gk20a *g, struct mem_desc *bar1_inst);
+        } bus;
        int (*bios_init)(struct gk20a *g);
@@ -1417,8 +1422,6 @@ int gk20a_wait_for_idle(struct device *dev);
 int gk20a_init_gpu_characteristics(struct gk20a *g);
-void gk20a_pbus_isr(struct gk20a *g);
 int gk20a_user_init(struct device *dev, const char *interface_name,
                    struct class *class);
 void gk20a_user_deinit(struct device *dev, struct class *class);
@@ -1435,7 +1438,6 @@ static inline u32 scale_ptimer(u32 timeout , u32 scale10x)
                return (timeout * 10) / scale10x;
 }
-int gk20a_read_ptimer(struct gk20a *g, u64 *value);
 extern struct class nvgpu_class;
 #define INTERFACE_NAME "nvhost%s-gpu"
diff --git a/drivers/gpu/nvgpu/gk20a/hal_gk20a.c b/drivers/gpu/nvgpu/gk20a/hal_gk20a.c
index 23725b8b..1e4fffdc 100644
--- a/drivers/gpu/nvgpu/gk20a/hal_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/hal_gk20a.c
@@ -16,6 +16,7 @@
 */
 #include "hal_gk20a.h"
+#include "bus_gk20a.h"
 #include "ltc_gk20a.h"
 #include "fb_gk20a.h"
 #include "gk20a.h"
@@ -147,6 +148,7 @@ int gk20a_init_hal(struct gk20a *g)
        gops->privsecurity = 0;
        gops->securegpccs = 0;
        gops->pmupstate = false;
+        gk20a_init_bus(gops);
        gk20a_init_mc(gops);
        gk20a_init_ltc(gops);
        gk20a_init_gr_ops(gops);
@@ -169,7 +171,6 @@ int gk20a_init_hal(struct gk20a *g)
        gops->name = "gk20a";
        gops->chip_init_gpu_characteristics = gk20a_init_gpu_characteristics;
        gops->get_litter_value = gk20a_get_litter_value;
-        gops->read_ptimer = gk20a_read_ptimer;
        c->twod_class = FERMI_TWOD_A;
        c->threed_class = KEPLER_C;
diff --git a/drivers/gpu/nvgpu/gk20a/mc_gk20a.c b/drivers/gpu/nvgpu/gk20a/mc_gk20a.c
index a1861b0d..e51c4a29 100644
--- a/drivers/gpu/nvgpu/gk20a/mc_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mc_gk20a.c
@@ -150,7 +150,7 @@ irqreturn_t mc_gk20a_intr_thread_stall(struct gk20a *g)
        if (mc_intr_0 & mc_intr_0_ltc_pending_f())
                g->ops.ltc.isr(g);
        if (mc_intr_0 & mc_intr_0_pbus_pending_f())
-                gk20a_pbus_isr(g);
+                g->ops.bus.isr(g);
        /* sync handled irq counter before re-enabling interrupts */
        atomic_set(&g->sw_irq_stall_last_handled, hw_irq_count);
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
index eaf8f74a..b9217c2c 100644
--- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.c
@@ -42,12 +42,13 @@
 #include "mm_gk20a.h"
 #include "fence_gk20a.h"
 #include "kind_gk20a.h"
+#include "bus_gk20a.h"
 #include <nvgpu/hw/gk20a/hw_gmmu_gk20a.h>
-#include <nvgpu/hw/gk20a/hw_bus_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_ram_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_pram_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_mc_gk20a.h>
+#include <nvgpu/hw/gk20a/hw_bus_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_flush_gk20a.h>
 #include <nvgpu/hw/gk20a/hw_ltc_gk20a.h>
@@ -1087,8 +1088,8 @@ int gk20a_init_mm_setup_hw(struct gk20a *g)
        g->ops.fb.init_hw(g);
-        if (g->ops.mm.bar1_bind)
+        if (g->ops.bus.bar1_bind)
-                g->ops.mm.bar1_bind(g, &mm->bar1.inst_block);
+                g->ops.bus.bar1_bind(g, &mm->bar1.inst_block);
        if (g->ops.mm.init_bar2_mm_hw_setup) {
                err = g->ops.mm.init_bar2_mm_hw_setup(g);
@@ -1103,23 +1104,6 @@ int gk20a_init_mm_setup_hw(struct gk20a *g)
        return 0;
 }
-static int gk20a_mm_bar1_bind(struct gk20a *g, struct mem_desc *bar1_inst)
-{
-        u64 iova = gk20a_mm_inst_block_addr(g, bar1_inst);
-        u32 ptr_v = (u32)(iova >> bar1_instance_block_shift_gk20a());
-        gk20a_dbg_info("bar1 inst block ptr: 0x%08x", ptr_v);
-        gk20a_writel(g, bus_bar1_block_r(),
-                     gk20a_aperture_mask(g, bar1_inst,
-                       bus_bar1_block_target_sys_mem_ncoh_f(),
-                       bus_bar1_block_target_vid_mem_f()) |
-                     bus_bar1_block_mode_virtual_f() |
-                     bus_bar1_block_ptr_f(ptr_v));
-        return 0;
-}
 int gk20a_init_mm_support(struct gk20a *g)
 {
        u32 err;
@@ -5447,7 +5431,6 @@ void gk20a_init_mm(struct gpu_ops *gops)
        gops->mm.get_mmu_levels = gk20a_mm_get_mmu_levels;
        gops->mm.init_pdb = gk20a_mm_init_pdb;
        gops->mm.init_mm_setup_hw = gk20a_init_mm_setup_hw;
-        gops->mm.bar1_bind = gk20a_mm_bar1_bind;
        gops->mm.init_inst_block = gk20a_init_inst_block;
        gops->mm.is_bar1_supported = gk20a_mm_is_bar1_supported;
        gops->mm.mmu_fault_pending = gk20a_fifo_mmu_fault_pending;
diff --git a/drivers/gpu/nvgpu/gm20b/bus_gm20b.c b/drivers/gpu/nvgpu/gm20b/bus_gm20b.c
new file mode 100644
index 00000000..68a4b15f
--- /dev/null
+++ b/drivers/gpu/nvgpu/gm20b/bus_gm20b.c
@@ -0,0 +1,64 @@
+/*
+ * GM20B BUS
+ *
+ * Copyright (c) 2014-2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ */
+#include <linux/delay.h>
+#include <nvgpu/timers.h>
+#include "bus_gm20b.h"
+#include "gk20a/gk20a.h"
+#include "gk20a/bus_gk20a.h"
+#include <nvgpu/hw/gm20b/hw_bus_gm20b.h>
+/*
+ * Bind the BAR1 instance block and wait for the bind to settle.
+ *
+ * Writes bus_bar1_block exactly like the gk20a variant, then polls
+ * bus_bind_status every 5 us until neither the BAR1 pending nor the BAR1
+ * outstanding field is set, bounded by an nvgpu_timeout initialised with
+ * 1000 and NVGPU_TIMER_RETRY_TIMER.
+ *
+ * Returns 0 when the bind completed, -EINVAL when the timeout expired.
+ */
+static int gm20b_bus_bar1_bind(struct gk20a *g, struct mem_desc *bar1_inst)
+{
+        struct nvgpu_timeout timeout;
+        u64 inst_addr = gk20a_mm_inst_block_addr(g, bar1_inst);
+        u32 inst_ptr = (u32)(inst_addr >>
+                             bar1_instance_block_shift_gk20a());
+        u32 bar1_block;
+
+        gk20a_dbg_info("bar1 inst block ptr: 0x%08x", inst_ptr);
+
+        bar1_block = gk20a_aperture_mask(g, bar1_inst,
+                        bus_bar1_block_target_sys_mem_ncoh_f(),
+                        bus_bar1_block_target_vid_mem_f());
+        bar1_block |= bus_bar1_block_mode_virtual_f();
+        bar1_block |= bus_bar1_block_ptr_f(inst_ptr);
+        gk20a_writel(g, bus_bar1_block_r(), bar1_block);
+
+        nvgpu_timeout_init(g, &timeout, 1000, NVGPU_TIMER_RETRY_TIMER);
+        for (;;) {
+                u32 status = gk20a_readl(g, bus_bind_status_r());
+
+                /* done once nothing is pending or outstanding for BAR1 */
+                if (!bus_bind_status_bar1_pending_v(status) &&
+                    !bus_bind_status_bar1_outstanding_v(status))
+                        break;
+
+                udelay(5);
+                if (nvgpu_timeout_expired(&timeout))
+                        break;
+        }
+
+        return nvgpu_timeout_peek_expired(&timeout) ? -EINVAL : 0;
+}
+/*
+ * Install the gm20b bus HAL hooks in gops: the gk20a implementations for
+ * init_hw, isr and read_ptimer, and the gm20b BAR1 bind that waits for
+ * completion.
+ */
+void gm20b_init_bus(struct gpu_ops *gops)
+{
+        gops->bus.bar1_bind = gm20b_bus_bar1_bind;
+        gops->bus.read_ptimer = gk20a_read_ptimer;
+        gops->bus.isr = gk20a_bus_isr;
+        gops->bus.init_hw = gk20a_bus_init_hw;
+}
diff --git a/drivers/gpu/nvgpu/gm20b/bus_gm20b.h b/drivers/gpu/nvgpu/gm20b/bus_gm20b.h
new file mode 100644
index 00000000..853e50a6
--- /dev/null
+++ b/drivers/gpu/nvgpu/gm20b/bus_gm20b.h
@@ -0,0 +1,23 @@
+/*
+ * GM20B BUS
+ *
+ * Copyright (c) 2017, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ */
+#ifndef _NVGPU_GM20B_BUS
+#define _NVGPU_GM20B_BUS
+struct gpu_ops;
+void gm20b_init_bus(struct gpu_ops *gops); /* fills in gops->bus for gm20b */
+#endif /* _NVGPU_GM20B_BUS */
diff --git a/drivers/gpu/nvgpu/gm20b/hal_gm20b.c b/drivers/gpu/nvgpu/gm20b/hal_gm20b.c
index ad041f67..684f5731 100644
--- a/drivers/gpu/nvgpu/gm20b/hal_gm20b.c
+++ b/drivers/gpu/nvgpu/gm20b/hal_gm20b.c
@@ -18,6 +18,7 @@
 #include "gk20a/gk20a.h"
 #include "gk20a/dbg_gpu_gk20a.h"
 #include "gk20a/css_gr_gk20a.h"
+#include "bus_gm20b.h"
 #include "ltc_gm20b.h"
 #include "ce2_gm20b.h"
@@ -215,6 +216,7 @@ int gm20b_init_hal(struct gk20a *g)
                }
        }
 #endif
+        gm20b_init_bus(gops);
        gm20b_init_mc(gops);
        gm20b_init_ltc(gops);
        gm20b_init_gr(gops);
@@ -238,7 +240,6 @@ int gm20b_init_hal(struct gk20a *g)
        gops->name = "gm20b";
        gops->chip_init_gpu_characteristics = gk20a_init_gpu_characteristics;
        gops->get_litter_value = gm20b_get_litter_value;
-        gops->read_ptimer = gk20a_read_ptimer;
        c->twod_class = FERMI_TWOD_A;
        c->threed_class = MAXWELL_B;
diff --git a/drivers/gpu/nvgpu/gm20b/mm_gm20b.c b/drivers/gpu/nvgpu/gm20b/mm_gm20b.c
index 18f9eec1..949a5c5d 100644
--- a/drivers/gpu/nvgpu/gm20b/mm_gm20b.c
+++ b/drivers/gpu/nvgpu/gm20b/mm_gm20b.c
@@ -13,17 +13,12 @@
 * more details.
 */
-#include <linux/delay.h>
 #include "gk20a/gk20a.h"
 #include "mm_gm20b.h"
-#include <nvgpu/timers.h>
 #include <nvgpu/hw/gm20b/hw_gmmu_gm20b.h>
 #include <nvgpu/hw/gm20b/hw_ram_gm20b.h>
-#include <nvgpu/hw/gm20b/hw_bus_gm20b.h>
 static void gm20b_mm_set_big_page_size(struct gk20a *g,
                                struct mem_desc *mem, int size)
@@ -55,34 +50,6 @@ static bool gm20b_mm_support_sparse(struct gk20a *g)
        return true;
 }
-static int gm20b_mm_bar1_bind(struct gk20a *g, struct mem_desc *bar1_inst)
-{
-        int retry = 1000;
-        u64 iova = gk20a_mm_inst_block_addr(g, bar1_inst);
-        u32 ptr_v = (u32)(iova >> bar1_instance_block_shift_gk20a());
-        gk20a_dbg_info("bar1 inst block ptr: 0x%08x", ptr_v);
-        gk20a_writel(g, bus_bar1_block_r(),
-                     gk20a_aperture_mask(g, bar1_inst,
-                       bus_bar1_block_target_sys_mem_ncoh_f(),
-                       bus_bar1_block_target_vid_mem_f()) |
-                     bus_bar1_block_mode_virtual_f() |
-                     bus_bar1_block_ptr_f(ptr_v));
-        do {
-                u32 val = gk20a_readl(g, bus_bind_status_r());
-                u32 pending = bus_bind_status_bar1_pending_v(val);
-                u32 outstanding = bus_bind_status_bar1_outstanding_v(val);
-                if (!pending && !outstanding)
-                        break;
-                udelay(5);
-                retry--;
-        } while (retry >= 0 || !tegra_platform_is_silicon());
-        return retry ? -EINVAL : 0;
-}
 static bool gm20b_mm_is_bar1_supported(struct gk20a *g)
 {
        return true;
@@ -107,7 +74,6 @@ void gm20b_init_mm(struct gpu_ops *gops)
        gops->mm.get_mmu_levels = gk20a_mm_get_mmu_levels;
        gops->mm.init_pdb = gk20a_mm_init_pdb;
        gops->mm.init_mm_setup_hw = gk20a_init_mm_setup_hw;
-        gops->mm.bar1_bind = gm20b_mm_bar1_bind;
        gops->mm.is_bar1_supported = gm20b_mm_is_bar1_supported;
        gops->mm.init_inst_block = gk20a_init_inst_block;
        gops->mm.mmu_fault_pending = gk20a_fifo_mmu_fault_pending;
diff --git a/drivers/gpu/nvgpu/gp106/hal_gp106.c b/drivers/gpu/nvgpu/gp106/hal_gp106.c
index a05b71ab..36f72b12 100644
--- a/drivers/gpu/nvgpu/gp106/hal_gp106.c
+++ b/drivers/gpu/nvgpu/gp106/hal_gp106.c
@@ -21,6 +21,7 @@
 #include "gk20a/gk20a.h"
 #include "gk20a/dbg_gpu_gk20a.h"
 #include "gk20a/css_gr_gk20a.h"
+#include "gk20a/bus_gk20a.h"
 #include "gp10b/gr_gp10b.h"
 #include "gp10b/fecs_trace_gp10b.h"
@@ -223,6 +224,7 @@ int gp106_init_hal(struct gk20a *g)
        gops->privsecurity = 1;
        gops->securegpccs = 1;
        gops->pmupstate = true;
+        gk20a_init_bus(gops);
        gp10b_init_mc(gops);
        gp106_init_gr(gops);
        gp10b_init_fecs_trace_ops(gops);
@@ -251,7 +253,6 @@ int gp106_init_hal(struct gk20a *g)
        gops->get_litter_value = gp106_get_litter_value;
        gops->chip_init_gpu_characteristics = gp106_init_gpu_characteristics;
        gops->gr_ctx.use_dma_for_fw_bootstrap = true;
-        gops->read_ptimer = gk20a_read_ptimer;
        c->twod_class = FERMI_TWOD_A;
        c->threed_class = PASCAL_B;
diff --git a/drivers/gpu/nvgpu/gp10b/hal_gp10b.c b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c
index 62a19abd..245d2d26 100644
--- a/drivers/gpu/nvgpu/gp10b/hal_gp10b.c
+++ b/drivers/gpu/nvgpu/gp10b/hal_gp10b.c
@@ -21,6 +21,7 @@
 #include "gk20a/gk20a.h"
 #include "gk20a/dbg_gpu_gk20a.h"
 #include "gk20a/css_gr_gk20a.h"
+#include "gk20a/bus_gk20a.h"
 #include "gp10b/gr_gp10b.h"
 #include "gp10b/fecs_trace_gp10b.h"
@@ -232,6 +233,7 @@ int gp10b_init_hal(struct gk20a *g)
        }
 #endif
+        gk20a_init_bus(gops);
        gp10b_init_mc(gops);
        gp10b_init_gr(gops);
        gp10b_init_fecs_trace_ops(gops);
@@ -254,7 +256,6 @@ int gp10b_init_hal(struct gk20a *g)
        gops->name = "gp10b";
        gops->chip_init_gpu_characteristics = gp10b_init_gpu_characteristics;
        gops->get_litter_value = gp10b_get_litter_value;
-        gops->read_ptimer = gk20a_read_ptimer;
        c->twod_class = FERMI_TWOD_A;
        c->threed_class = PASCAL_A;
diff --git a/drivers/gpu/nvgpu/gp10b/mc_gp10b.c b/drivers/gpu/nvgpu/gp10b/mc_gp10b.c
index fc0e6553..547169ed 100644
--- a/drivers/gpu/nvgpu/gp10b/mc_gp10b.c
+++ b/drivers/gpu/nvgpu/gp10b/mc_gp10b.c
@@ -162,7 +162,7 @@ irqreturn_t mc_gp10b_intr_thread_stall(struct gk20a *g)
        if (mc_intr_0 & mc_intr_ltc_pending_f())
                g->ops.ltc.isr(g);
        if (mc_intr_0 & mc_intr_pbus_pending_f())
-                gk20a_pbus_isr(g);
+                g->ops.bus.isr(g);
        /* sync handled irq counter before re-enabling interrupts */
        atomic_set(&g->sw_irq_stall_last_handled, hw_irq_count);
diff --git a/drivers/gpu/nvgpu/gp10b/mm_gp10b.c b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
index 26facbe3..a5322bad 100644
--- a/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
+++ b/drivers/gpu/nvgpu/gp10b/mm_gp10b.c
@@ -45,7 +45,7 @@ static int gp10b_init_mm_setup_hw(struct gk20a *g)
                     (g->ops.mm.get_iova_addr(g, g->mm.sysmem_flush.sgt->sgl, 0)
                     >> 8ULL));
-        g->ops.mm.bar1_bind(g, inst_block);
+        g->ops.bus.bar1_bind(g, inst_block);
        if (g->ops.mm.init_bar2_mm_hw_setup) {
                err = g->ops.mm.init_bar2_mm_hw_setup(g);
diff --git a/drivers/gpu/nvgpu/vgpu/vgpu.c b/drivers/gpu/nvgpu/vgpu/vgpu.c
index 2d7417f0..72606952 100644
--- a/drivers/gpu/nvgpu/vgpu/vgpu.c
+++ b/drivers/gpu/nvgpu/vgpu/vgpu.c
@@ -362,7 +362,7 @@ void vgpu_init_hal_common(struct gk20a *g)
        vgpu_init_css_ops(gops);
 #endif
        gops->chip_init_gpu_characteristics = vgpu_init_gpu_characteristics;
-        gops->read_ptimer = vgpu_read_ptimer;
+        gops->bus.read_ptimer = vgpu_read_ptimer;
 }
 static int vgpu_init_hal(struct gk20a *g)
author	Terje Bergstrom <tbergstrom@nvidia.com>	2017-03-17 14:09:44 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2017-03-23 11:44:07 -0400
commit	4492c62ffe9398bd4457f6f1c2773e40afe909fb (patch)
tree	5d792f81d97844278f4eca665a8b4778fa93dc35
parent	33f637585ecd617a9f4423f56e2aa6df0691ac64 (diff)