From 54e783959b5d3622556bbf34a3a7ad8e481d9e25 Mon Sep 17 00:00:00 2001
From: Joshua Bakita <jbakita@cs.unc.edu>
Date: Thu, 26 Aug 2021 18:53:29 -0400
Subject: Use procfs instead of dmesg to print runlist

`cat /proc/runlist` to print the current runlist.

Also break nvdebug.c into nvdebug_entry.c, runlist.c, and
runlist_procfs.c.
---
 nvdebug.c | 278 --------------------------------------------------------------
 1 file changed, 278 deletions(-)
 delete mode 100644 nvdebug.c

(limited to 'nvdebug.c')

diff --git a/nvdebug.c b/nvdebug.c
deleted file mode 100644
index 31a797e..0000000
--- a/nvdebug.c
+++ /dev/null
@@ -1,278 +0,0 @@
-/* Copyright 2021 Joshua Bakita
- * SPDX-License-Identifier: MIT
- */
-
-/* TODO
- * - Add /proc /sys or debugfs interface
- * - Add API to trigger a preemption
- */
-
-#include <linux/module.h>
-#include <linux/kernel.h>
-#include <linux/device.h>
-#include <linux/kallsyms.h>
-#include <linux/iommu.h> // For struct iommu_domain
-#include <asm/io.h>
-
-/* Currently used symbols:
- * - struct gk20a;
- * - struct nvgpu_os_linux;
- * - void nvgpu_writel(struct gk20a *g, u32 reg_addr, u32 value);
- */
-#include <nvgpu/io.h>
-#include <nvgpu/gk20a.h>
-#include <os/linux/os_linux.h>
-
-#include "nvdebug.h"
-
-MODULE_LICENSE("GPL"); // LIAR
-MODULE_AUTHOR("Joshua Bakita");
-MODULE_DESCRIPTION("A scheduling debugging module for NVIDIA GPUs");
-MODULE_SOFTDEP("pre: nvgpu"); // We only support the Jetson boards for now
-
-// Bus types are global symbols in the kernel
-extern struct bus_type platform_bus_type;
-
-static inline struct gk20a *get_gk20a(struct device *dev) {
-	// XXX: Only works because gk20a* is the first member of gk20a_platform
-	return *((struct gk20a**)dev_get_drvdata(dev));
-}
-
-// Functionally identical to nvgpu_readl()
-// (except we don't try to resolve situations where regs is NULL)
-static inline u32 nvdebug_readl(struct gk20a* g, u32 r) {
-	struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-	if (unlikely(!g_os->regs)) {
-		printk(KERN_ERR "[nvdebug] Attempted nvgpu_readl on non-existent registers!\n");
-		return -1;
-	}
-	return readl(g_os->regs + r);
-}
-
-// Functionally identical to nvgpu_writel()
-static inline void nvdebug_writel(struct gk20a* g, u32 r, u32 v) {
-	struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-	if (unlikely(!g_os->regs)) {
-		printk(KERN_ERR "[nvdebug] Attempted nvgpu_writel on non-existent registers!\n");
-		return;
-	}	
-	writel_relaxed(v, g_os->regs + r);
-	wmb();
-}
-/*
-#define RUNLIST_PROCFS_NAME "runlist"
-
-static const struct seq_operations runlist_file_seq_ops = {
-	.start = 
-	.next =
-	.stop =
-	.show =
-};
-
-static const struct file_operations runlist_file_ops = {
-	.read = 
-*/
-/*static void read_bytes(struct gk20a *g, void* target, u32 start, u32 num_bytes) {
-	u32 *output = target;
-	u32 i;
-	// Read u32s from the GPU
-	for (i = 0; i < num_bytes; i += 4) {
-		output[i/4] = _nvgpu_readl(g, start + i);
-		printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-	}
-}
-
-static void read_bytes(void* target, void* start, u32 num_bytes) {
-	u32 *output = target;
-	u32 i;
-	// Read u32s from the GPU
-	for (i = 0; i < num_bytes; i += 4) {
-		output[i/4] = readl(start + i);
-		printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-	}
-}*/
-
-/*
-  +---- TSG Entry %d ----+
-  | Scale: %d            |
-  | Timeout: %d          |
-  +----------------------+
-
-
-
-
-
-
-*/
-
-#define PRE KERN_INFO "[nvdebug] "
-
-static void nvdebug_print_tsg(struct entry_tsg* tsg) {
-	if (tsg->entry_type != ENTRY_TYPE_TSG) {
-		printk(KERN_WARNING "[nvdebug] Attempted to print non-TSG in nvdebug_print_tsg()!\n");
-		return;
-	}
-	printk(PRE "+---- TSG Entry %-2d----+", tsg->tsgid);
-	printk(PRE "| Scale: %-13d|", tsg->timeslice_scale);
-	printk(PRE "| Timeout: %-11d|", tsg->timeslice_timeout);
-	printk(PRE "+---------------------+");
-}
-
-static void nvdebug_print_chan(struct runlist_chan* chan) {
-	char* loc_txt;
-	u64 inst_ptr;
-	if (chan->entry_type != ENTRY_TYPE_CHAN) {
-		printk(KERN_WARNING "[nvdebug] Attempted to print non-channel in nvdebug_print_channel()!\n");
-		return;
-	}
-	switch (chan->inst_target) {
-		case TARGET_VID_MEM:
-			loc_txt = "VID_MEM";
-			break;
-		case TARGET_SYS_MEM_COHERENT:
-			loc_txt = "SYS_MEM_COHERENT";
-			break;
-		case TARGET_SYS_MEM_NONCOHERENT:
-			loc_txt = "SYS_MEM_NONCOHERENT";
-			break;
-		default:
-			printk(KERN_WARNING "[nvdebug] Invalid aperture in runlist channel!\n");
-			return;
-	}
-	// Reconstruct pointer to channel instance block
-	inst_ptr = chan->inst_ptr_hi;
-	inst_ptr <<= 32;
-	inst_ptr |= chan->inst_ptr_lo << 12;
-
-	printk(PRE "  +- Channel Entry %-4d-+", chan->chid);
-	printk(PRE "  | Runqueue Selector: %d|", chan->runqueue_selector);
-	printk(PRE "  | Instance PTR:       |");
-	printk(PRE "  | %#018llx  |", inst_ptr);
-	printk(PRE "  | %-20s|", loc_txt);
-	printk(PRE "  +---------------------+");
-}
-
-#define for_chan_in_tsg(chan, tsg) \
-	for (chan = (struct runlist_chan*)(tsg + 1); \
-	     (void*)chan < (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length; \
-	     chan++)
-
-#define next_tsg(tsg) \
-	(void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length
-
-static void nvdebug_print_runlist(struct entry_tsg* head, runlist_info_t rl_info) {
-	int rl_idx = 0;
-	struct runlist_chan* chan;
-	printk(PRE "tsg->tsg_length: %d\n", head->tsg_length);
-	printk(PRE "rl_info.len: %d\n", rl_info.len);
-	while (rl_idx < rl_info.len) {
-		nvdebug_print_tsg(head);
-		for_chan_in_tsg(chan, head) {
-			nvdebug_print_chan(chan);
-		}
-		rl_idx += 1 + head->tsg_length;
-		head = next_tsg(head);
-	}
-}
-
-static int __init nvdebug_init(void) {
-	struct device *dev = NULL;
-	struct device *temp_dev;
-	struct gk20a *g;
-	struct entry_tsg head;
-	runlist_base_t rl_base;
-	runlist_info_t rl_info;
-	u64 runlist_iova;
-	// Get the last device that matches our name
-	while ((temp_dev = bus_find_device_by_name(&platform_bus_type, dev, "17000000.gv11b"))) {
-		printk(KERN_INFO "Found a matching device\n");
-		dev = temp_dev;
-	}
-	if (!dev)
-		return -EIO;
-	g = get_gk20a(dev);
-	// This address seems to not be:
-	// - A GPU address (type is sysmem_coherent)
-	// - A physical address (dereferencing after ioremap crashes)
-	// - A kernel virtual address (dereferencing segfaults)
-	// So maybe it's some sort of custom thing? This is an address that the GPU
-	// can use, so it would make most sense for it to be a physical address.
-	//
-	// BUT, it can't possibly be a physical address, as it would refer to an
-	// address greater than the maximum one on our system (by a lot!).
-	// Maybe I'm reading the runlist base wrong?
-	// Aha, the driver calls it runlist_iova. Sounds like runlist I/O virtual
-	// address! So, what's this I/O address space? All I know is that it's what
-	// nvgpu_mem_get_addr() returns. That function returns the result of either:
-	// - gpu_phys_addr which is  __nvgpu_sgl_phys on our platform which (?)
-	//   converts an IPA to a PA?
-	// - nvgpu_mem_iommu_translate
-	//
-	// The original memory is allocated with nvgpu_dma_alloc_flags_sys(), which
-	// returns SYSMEM.
-	//
-	// To convert a physical address to a IOMMU address, we add a bit
-	//
-	// BUT, it turns out that it IS JUST A PHYSICAL ADDRESS! It wasn't working
-	// before because the GPU had simply gone to sleep and invalidated its
-	// register state, so nvgpu_readl() was simply returning garbage.
-
-	printk(KERN_INFO "[nvdebug] Pulling runlist base address from %x\n", NV_PFIFO_RUNLIST_BASE);
-	printk(KERN_INFO "[nvdebug] Using struct gk20a* of %px\n", g);
-	printk(KERN_INFO "[nvdebug] g->name: %s, g->power_on: %d, g->sw_ready: %d, g->is_virtual %d\n", g->name, g->power_on, g->sw_ready, g->is_virtual);
-	struct nvgpu_os_linux *l = container_of(g, struct nvgpu_os_linux, g);
-	printk(KERN_INFO "[nvdebug] l->regs %px, l->regs_saved %px\n", l->regs, l->regs_saved);
-	if (!l->regs)
-		return -EIO;
-	rl_base.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST_BASE);
-	rl_info.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST);
-	runlist_iova = ((u64)rl_base.ptr) << 12;
-	printk(KERN_INFO "[nvdebug] Runlist ptr: %x, type: %d, raw: %x, IOVA: %px\n", rl_base.ptr, rl_base.type, rl_base.raw, (void*)runlist_iova);
-	// Segfaults
-	//u32 attempted_read = ioread32(runlist_iova);
-	//printk(KERN_INFO "[nvdebug] first word of runlist: %0x\n", attempted_read);
-
-	// Errors out
-	//u32* virt_rt_addr = ioremap(phys_rl_addr, sizeof(struct entry_tsg));
-	//printk(KERN_INFO "[nvdebug] Runlist virt_addr: %px\n", virt_rt_addr);
-
-	/* Overcomplicated?
-	struct iommu_domain *domain = iommu_get_domain_for_dev(dev);
-	if (!domain) {
-		printk(KERN_INFO "[nvdebug] No IOMMU domain!\n");
-		return -EIO;
-	}
-	u64 phys_addr = platform_bus_type.iommu_ops->iova_to_phys(domain, runlist_iova);
-	printk(KERN_INFO "[nvdebug] Runlist PA: %px\n", phys_addr);
-	*/
-
-	printk(KERN_INFO "[nvdebug] Runlist phys_to_virt:   %px\n", (void*)phys_to_virt(runlist_iova));
-	printk(KERN_INFO "[nvdebug] Runlist *phys_to_virt:  %x\n", *(u32*)phys_to_virt(runlist_iova));
-	head = *(struct entry_tsg*)phys_to_virt(runlist_iova);
-	nvdebug_print_runlist((struct entry_tsg*)phys_to_virt(runlist_iova), rl_info);
-	//nvdebug_print_tsg(&head);
-	//nvdebug_print_chan((struct runlist_chan*)(phys_to_virt(runlist_iova) + sizeof(struct entry_tsg)));
-	//printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-	//printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-	//printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-	//printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-	//printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-
-	//printk(KERN_INFO "[nvdebug] Mem base phys: %p\n", (void*)virt_to_phys((void*)0xffffffc000000000ULL));
-	//printk(KERN_INFO "[nvdebug] Mem end phys: %p\n", (void*)virt_to_phys((void*)0xffffffc400000000ULL));
-	//printk(KERN_INFO "[nvdebug] Runlist *virt_addr: %x\n", readl(virt_rt_addr)); // This crashes
-	//read_bytes(&head, virt_rt_addr, sizeof(struct entry_tsg));
-	/*printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-	printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-	printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-	printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-	printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-	*/return 0;
-}
-
-static void __exit nvdebug_exit(void) {
-	printk(KERN_INFO "[nvdebug] Exiting...\n");
-}
-
-module_init(nvdebug_init);
-module_exit(nvdebug_exit);
-- 
cgit v1.2.2