summaryrefslogtreecommitdiffstats
path: root/drivers/gpu/nvgpu/gv11b/gr_gv11b.c
diff options
context:
space:
mode:
authorDeepak Nibade <dnibade@nvidia.com>2018-04-02 05:41:02 -0400
committermobile promotions <svcmobile_promotions@nvidia.com>2018-04-03 11:23:08 -0400
commit4b8432a663e12c915acec9043ab8493b30471188 (patch)
tree6654069e3801f0d7a89e876b6683807739fbaf31 /drivers/gpu/nvgpu/gv11b/gr_gv11b.c
parentd02ae4f1e94fbeb9401bde9d34044792e213c54b (diff)
gpu: nvgpu: fix address table for GPCS_TPC6 broadcast conversion
In gr_gk20a_create_priv_addr_table() and gv11b_gr_egpc_etpc_priv_addr_table(), we create a table of unicast addresses from broadcast addresses For GPC boardcast addresses like NV_PGRAPH_PRI_EGPCS_ETPC6_SM_*, we generate the table assuming there are 7 TPCs in all the GPCs But this is incorrect in some cases like GV100 where GPC0/1 have only 6 TPCs And hence we end up generating registers which do not exist Fix this by explicitly checking the number of TPCs and ensuring that address generated is belongs to valid TPC Bug 200400376 Jira NVGPU-564 Change-Id: I65d7d6cd7f0bf16171eb54ed71f1f3840ade3495 Signed-off-by: Deepak Nibade <dnibade@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/1686806 Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com> GVS: Gerrit_Virtual_Submit Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com> Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Diffstat (limited to 'drivers/gpu/nvgpu/gv11b/gr_gv11b.c')
-rw-r--r--drivers/gpu/nvgpu/gv11b/gr_gv11b.c15
1 files changed, 11 insertions, 4 deletions
diff --git a/drivers/gpu/nvgpu/gv11b/gr_gv11b.c b/drivers/gpu/nvgpu/gv11b/gr_gv11b.c
index e0c60efb..7f6d1906 100644
--- a/drivers/gpu/nvgpu/gv11b/gr_gv11b.c
+++ b/drivers/gpu/nvgpu/gv11b/gr_gv11b.c
@@ -3979,6 +3979,7 @@ void gv11b_gr_egpc_etpc_priv_addr_table(struct gk20a *g, u32 addr,
3979 u32 gpc, u32 broadcast_flags, u32 *priv_addr_table, u32 *t) 3979 u32 gpc, u32 broadcast_flags, u32 *priv_addr_table, u32 *t)
3980{ 3980{
3981 u32 gpc_num, tpc_num; 3981 u32 gpc_num, tpc_num;
3982 u32 priv_addr, gpc_addr;
3982 3983
3983 nvgpu_log_info(g, "addr=0x%x", addr); 3984 nvgpu_log_info(g, "addr=0x%x", addr);
3984 3985
@@ -4017,10 +4018,16 @@ void gv11b_gr_egpc_etpc_priv_addr_table(struct gk20a *g, u32 addr,
4017 g, gpc_num, tpc_num, addr, 4018 g, gpc_num, tpc_num, addr,
4018 priv_addr_table, t); 4019 priv_addr_table, t);
4019 } else { 4020 } else {
4020 priv_addr_table[*t] = 4021 priv_addr = pri_egpc_addr(g,
4021 pri_egpc_addr(g, 4022 pri_gpccs_addr_mask(addr),
4022 pri_gpccs_addr_mask(addr), 4023 gpc_num);
4023 gpc_num); 4024
4025 gpc_addr = pri_gpccs_addr_mask(priv_addr);
4026 tpc_num = g->ops.gr.get_tpc_num(g, gpc_addr);
4027 if (tpc_num >= g->gr.gpc_tpc_count[gpc_num])
4028 continue;
4029
4030 priv_addr_table[*t] = priv_addr;
4024 nvgpu_log_info(g, "priv_addr_table[%d]:%#08x", 4031 nvgpu_log_info(g, "priv_addr_table[%d]:%#08x",
4025 *t, priv_addr_table[*t]); 4032 *t, priv_addr_table[*t]);
4026 (*t)++; 4033 (*t)++;