summaryrefslogtreecommitdiffstats
path: root/drivers/gpu/nvgpu/gv100/gr_gv100.c
diff options
context:
space:
mode:
authorVaibhav Kachore <vkachore@nvidia.com>2018-07-03 07:51:13 -0400
committermobile promotions <svcmobile_promotions@nvidia.com>2018-07-10 21:14:16 -0400
commit503d489dba278136ea0e4241d000018682989da5 (patch)
tree29b95d43aaf47b50f2abda9a4e16153afe070c25 /drivers/gpu/nvgpu/gv100/gr_gv100.c
parente14fdcd8f1f4125da697433b1744b1e4e4f15b09 (diff)
gpu: nvgpu: Initialize hwpm perfmons (engine_sel)
- For Mode-E ctxsw it is required that engine_sel is set to 0xFFFFFFFF. - Default 0 is a valid signal and causes problems. Bug 2106999 Change-Id: I5cdb4441a8e6d7e8133c31a9e361b54611dd2995 Signed-off-by: Vaibhav Kachore <vkachore@nvidia.com> Reviewed-on: https://git-master.nvidia.com/r/1770755 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Diffstat (limited to 'drivers/gpu/nvgpu/gv100/gr_gv100.c')
-rw-r--r--drivers/gpu/nvgpu/gv100/gr_gv100.c87
1 files changed, 87 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/gv100/gr_gv100.c b/drivers/gpu/nvgpu/gv100/gr_gv100.c
index b1b1cee6..5f891ce5 100644
--- a/drivers/gpu/nvgpu/gv100/gr_gv100.c
+++ b/drivers/gpu/nvgpu/gv100/gr_gv100.c
@@ -39,6 +39,7 @@
39#include <nvgpu/hw/gv100/hw_fuse_gv100.h> 39#include <nvgpu/hw/gv100/hw_fuse_gv100.h>
40#include <nvgpu/hw/gv100/hw_top_gv100.h> 40#include <nvgpu/hw/gv100/hw_top_gv100.h>
41#include <nvgpu/hw/gv100/hw_ctxsw_prog_gv100.h> 41#include <nvgpu/hw/gv100/hw_ctxsw_prog_gv100.h>
42#include <nvgpu/hw/gv100/hw_perf_gv100.h>
42 43
43 44
44/* 45/*
@@ -459,3 +460,89 @@ u32 gr_gv100_get_hw_accessor_stream_out_mode()
459{ 460{
460 return ctxsw_prog_main_image_pm_mode_stream_out_ctxsw_f(); 461 return ctxsw_prog_main_image_pm_mode_stream_out_ctxsw_f();
461} 462}
463
464static void gr_gv100_set_pmm_register(struct gk20a *g, u32 offset, u32 val,
465 u32 num_chiplets, u32 num_perfmons)
466{
467 u32 perfmon_index = 0;
468 u32 chiplet_index = 0;
469 u32 reg_offset = 0;
470 u32 chiplet_stride = g->ops.gr.get_pmm_per_chiplet_offset();
471
472 for (chiplet_index = 0; chiplet_index < num_chiplets; chiplet_index++) {
473 for (perfmon_index = 0; perfmon_index < num_perfmons;
474 perfmon_index++) {
475 reg_offset = offset + perfmon_index * perf_pmmgpc_perdomain_offset_v() +
476 chiplet_index * chiplet_stride;
477 nvgpu_writel(g, reg_offset, val);
478 }
479 }
480
481}
482
483static void gr_gv100_get_num_hwpm_perfmon(struct gk20a *g, int *num_sys_perfmon,
484 int *num_fbp_perfmon, int *num_gpc_perfmon)
485{
486 int err;
487 u32 buf_offset_lo, buf_offset_addr, num_offsets;
488 u32 perfmon_index = 0;
489
490 for (perfmon_index = 0; perfmon_index < perf_pmmsys_engine_sel__size_1_v();
491 perfmon_index++) {
492 err = gr_gk20a_get_pm_ctx_buffer_offsets(g,
493 perf_pmmsys_engine_sel_r(perfmon_index),
494 1,
495 &buf_offset_lo,
496 &buf_offset_addr,
497 &num_offsets);
498 if (err) {
499 break;
500 }
501 }
502 *num_sys_perfmon = perfmon_index;
503
504 for (perfmon_index = 0; perfmon_index < perf_pmmfbp_engine_sel__size_1_v();
505 perfmon_index++) {
506 err = gr_gk20a_get_pm_ctx_buffer_offsets(g,
507 perf_pmmfbp_engine_sel_r(perfmon_index),
508 1,
509 &buf_offset_lo,
510 &buf_offset_addr,
511 &num_offsets);
512 if (err) {
513 break;
514 }
515 }
516 *num_fbp_perfmon = perfmon_index;
517
518 for (perfmon_index = 0; perfmon_index < perf_pmmgpc_engine_sel__size_1_v();
519 perfmon_index++) {
520 err = gr_gk20a_get_pm_ctx_buffer_offsets(g,
521 perf_pmmgpc_engine_sel_r(perfmon_index),
522 1,
523 &buf_offset_lo,
524 &buf_offset_addr,
525 &num_offsets);
526 if (err) {
527 break;
528 }
529 }
530 *num_gpc_perfmon = perfmon_index;
531}
532
533void gr_gv100_init_hwpm_pmm_register(struct gk20a *g)
534{
535 int num_sys_perfmon = 0;
536 int num_fbp_perfmon = 0;
537 int num_gpc_perfmon = 0;
538
539 gr_gv100_get_num_hwpm_perfmon(g, &num_sys_perfmon,
540 &num_fbp_perfmon, &num_gpc_perfmon);
541
542 gr_gv100_set_pmm_register(g, perf_pmmsys_engine_sel_r(0),
543 1, 0xFFFFFFFF, num_sys_perfmon);
544 gr_gv100_set_pmm_register(g, perf_pmmsys_engine_sel_r(0),
545 nvgpu_get_litter_value(g, GPU_LIT_NUM_FBPS), 0xFFFFFFFF, num_fbp_perfmon);
546 gr_gv100_set_pmm_register(g, perf_pmmsys_engine_sel_r(0),
547 nvgpu_get_litter_value(g, GPU_LIT_NUM_GPCS), 0xFFFFFFFF, num_gpc_perfmon);
548}