From 54e783959b5d3622556bbf34a3a7ad8e481d9e25 Mon Sep 17 00:00:00 2001
From: Joshua Bakita <jbakita@cs.unc.edu>
Date: Thu, 26 Aug 2021 18:53:29 -0400
Subject: Use procfs instead of dmesg to print runlist

`cat /proc/runlist` to print the current runlist.

Also break nvdebug.c into nvdebug_entry.c, runlist.c, and
runlist_procfs.c.
---
 Makefile         |   1 +
 nvdebug.c        | 278 -------------------------------------------------------
 nvdebug.h        |  49 ++++++++++
 nvdebug_entry.c  |  40 ++++++++
 runlist.c        | 106 +++++++++++++++++++++
 runlist_procfs.c | 102 ++++++++++++++++++++
 6 files changed, 298 insertions(+), 278 deletions(-)
 delete mode 100644 nvdebug.c
 create mode 100644 nvdebug_entry.c
 create mode 100644 runlist.c
 create mode 100644 runlist_procfs.c

diff --git a/Makefile b/Makefile
index cc14996..5d61177 100644
--- a/Makefile
+++ b/Makefile
@@ -1,4 +1,5 @@
 obj-m += nvdebug.o
+nvdebug-objs = runlist_procfs.o runlist.o nvdebug_entry.o
 
 # TODO: Avoid needing to distribute NVIDIA's headers (at least they're MIT...)
 #ccflags-y += -I$(PWD)/include
diff --git a/nvdebug.c b/nvdebug.c
deleted file mode 100644
index 31a797e..0000000
--- a/nvdebug.c
+++ /dev/null
@@ -1,278 +0,0 @@
-/* Copyright 2021 Joshua Bakita
- * SPDX-License-Identifier: MIT
- */
-
-/* TODO
- * - Add /proc /sys or debugfs interface
- * - Add API to trigger a preemption
- */
-
-#include <linux/module.h>
-#include <linux/kernel.h>
-#include <linux/device.h>
-#include <linux/kallsyms.h>
-#include <linux/iommu.h> // For struct iommu_domain
-#include <asm/io.h>
-
-/* Currently used symbols:
- * - struct gk20a;
- * - struct nvgpu_os_linux;
- * - void nvgpu_writel(struct gk20a *g, u32 reg_addr, u32 value);
- */
-#include <nvgpu/io.h>
-#include <nvgpu/gk20a.h>
-#include <os/linux/os_linux.h>
-
-#include "nvdebug.h"
-
-MODULE_LICENSE("GPL"); // LIAR
-MODULE_AUTHOR("Joshua Bakita");
-MODULE_DESCRIPTION("A scheduling debugging module for NVIDIA GPUs");
-MODULE_SOFTDEP("pre: nvgpu"); // We only support the Jetson boards for now
-
-// Bus types are global symbols in the kernel
-extern struct bus_type platform_bus_type;
-
-static inline struct gk20a *get_gk20a(struct device *dev) {
-	// XXX: Only works because gk20a* is the first member of gk20a_platform
-	return *((struct gk20a**)dev_get_drvdata(dev));
-}
-
-// Functionally identical to nvgpu_readl()
-// (except we don't try to resolve situations where regs is NULL)
-static inline u32 nvdebug_readl(struct gk20a* g, u32 r) {
-	struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-	if (unlikely(!g_os->regs)) {
-		printk(KERN_ERR "[nvdebug] Attempted nvgpu_readl on non-existent registers!\n");
-		return -1;
-	}
-	return readl(g_os->regs + r);
-}
-
-// Functionally identical to nvgpu_writel()
-static inline void nvdebug_writel(struct gk20a* g, u32 r, u32 v) {
-	struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-	if (unlikely(!g_os->regs)) {
-		printk(KERN_ERR "[nvdebug] Attempted nvgpu_writel on non-existent registers!\n");
-		return;
-	}	
-	writel_relaxed(v, g_os->regs + r);
-	wmb();
-}
-/*
-#define RUNLIST_PROCFS_NAME "runlist"
-
-static const struct seq_operations runlist_file_seq_ops = {
-	.start = 
-	.next =
-	.stop =
-	.show =
-};
-
-static const struct file_operations runlist_file_ops = {
-	.read = 
-*/
-/*static void read_bytes(struct gk20a *g, void* target, u32 start, u32 num_bytes) {
-	u32 *output = target;
-	u32 i;
-	// Read u32s from the GPU
-	for (i = 0; i < num_bytes; i += 4) {
-		output[i/4] = _nvgpu_readl(g, start + i);
-		printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-	}
-}
-
-static void read_bytes(void* target, void* start, u32 num_bytes) {
-	u32 *output = target;
-	u32 i;
-	// Read u32s from the GPU
-	for (i = 0; i < num_bytes; i += 4) {
-		output[i/4] = readl(start + i);
-		printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-	}
-}*/
-
-/*
-  +---- TSG Entry %d ----+
-  | Scale: %d            |
-  | Timeout: %d          |
-  +----------------------+
-
-
-
-
-
-
-*/
-
-#define PRE KERN_INFO "[nvdebug] "
-
-static void nvdebug_print_tsg(struct entry_tsg* tsg) {
-	if (tsg->entry_type != ENTRY_TYPE_TSG) {
-		printk(KERN_WARNING "[nvdebug] Attempted to print non-TSG in nvdebug_print_tsg()!\n");
-		return;
-	}
-	printk(PRE "+---- TSG Entry %-2d----+", tsg->tsgid);
-	printk(PRE "| Scale: %-13d|", tsg->timeslice_scale);
-	printk(PRE "| Timeout: %-11d|", tsg->timeslice_timeout);
-	printk(PRE "+---------------------+");
-}
-
-static void nvdebug_print_chan(struct runlist_chan* chan) {
-	char* loc_txt;
-	u64 inst_ptr;
-	if (chan->entry_type != ENTRY_TYPE_CHAN) {
-		printk(KERN_WARNING "[nvdebug] Attempted to print non-channel in nvdebug_print_channel()!\n");
-		return;
-	}
-	switch (chan->inst_target) {
-		case TARGET_VID_MEM:
-			loc_txt = "VID_MEM";
-			break;
-		case TARGET_SYS_MEM_COHERENT:
-			loc_txt = "SYS_MEM_COHERENT";
-			break;
-		case TARGET_SYS_MEM_NONCOHERENT:
-			loc_txt = "SYS_MEM_NONCOHERENT";
-			break;
-		default:
-			printk(KERN_WARNING "[nvdebug] Invalid aperture in runlist channel!\n");
-			return;
-	}
-	// Reconstruct pointer to channel instance block
-	inst_ptr = chan->inst_ptr_hi;
-	inst_ptr <<= 32;
-	inst_ptr |= chan->inst_ptr_lo << 12;
-
-	printk(PRE "  +- Channel Entry %-4d-+", chan->chid);
-	printk(PRE "  | Runqueue Selector: %d|", chan->runqueue_selector);
-	printk(PRE "  | Instance PTR:       |");
-	printk(PRE "  | %#018llx  |", inst_ptr);
-	printk(PRE "  | %-20s|", loc_txt);
-	printk(PRE "  +---------------------+");
-}
-
-#define for_chan_in_tsg(chan, tsg) \
-	for (chan = (struct runlist_chan*)(tsg + 1); \
-	     (void*)chan < (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length; \
-	     chan++)
-
-#define next_tsg(tsg) \
-	(void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length
-
-static void nvdebug_print_runlist(struct entry_tsg* head, runlist_info_t rl_info) {
-	int rl_idx = 0;
-	struct runlist_chan* chan;
-	printk(PRE "tsg->tsg_length: %d\n", head->tsg_length);
-	printk(PRE "rl_info.len: %d\n", rl_info.len);
-	while (rl_idx < rl_info.len) {
-		nvdebug_print_tsg(head);
-		for_chan_in_tsg(chan, head) {
-			nvdebug_print_chan(chan);
-		}
-		rl_idx += 1 + head->tsg_length;
-		head = next_tsg(head);
-	}
-}
-
-static int __init nvdebug_init(void) {
-	struct device *dev = NULL;
-	struct device *temp_dev;
-	struct gk20a *g;
-	struct entry_tsg head;
-	runlist_base_t rl_base;
-	runlist_info_t rl_info;
-	u64 runlist_iova;
-	// Get the last device that matches our name
-	while ((temp_dev = bus_find_device_by_name(&platform_bus_type, dev, "17000000.gv11b"))) {
-		printk(KERN_INFO "Found a matching device\n");
-		dev = temp_dev;
-	}
-	if (!dev)
-		return -EIO;
-	g = get_gk20a(dev);
-	// This address seems to not be:
-	// - A GPU address (type is sysmem_coherent)
-	// - A physical address (dereferencing after ioremap crashes)
-	// - A kernel virtual address (dereferencing segfaults)
-	// So maybe it's some sort of custom thing? This is an address that the GPU
-	// can use, so it would make most sense for it to be a physical address.
-	//
-	// BUT, it can't possibly be a physical address, as it would refer to an
-	// address greater than the maximum one on our system (by a lot!).
-	// Maybe I'm reading the runlist base wrong?
-	// Aha, the driver calls it runlist_iova. Sounds like runlist I/O virtual
-	// address! So, what's this I/O address space? All I know is that it's what
-	// nvgpu_mem_get_addr() returns. That function returns the result of either:
-	// - gpu_phys_addr which is  __nvgpu_sgl_phys on our platform which (?)
-	//   converts an IPA to a PA?
-	// - nvgpu_mem_iommu_translate
-	//
-	// The original memory is allocated with nvgpu_dma_alloc_flags_sys(), which
-	// returns SYSMEM.
-	//
-	// To convert a physical address to a IOMMU address, we add a bit
-	//
-	// BUT, it turns out that it IS JUST A PHYSICAL ADDRESS! It wasn't working
-	// before because the GPU had simply gone to sleep and invalidated its
-	// register state, so nvgpu_readl() was simply returning garbage.
-
-	printk(KERN_INFO "[nvdebug] Pulling runlist base address from %x\n", NV_PFIFO_RUNLIST_BASE);
-	printk(KERN_INFO "[nvdebug] Using struct gk20a* of %px\n", g);
-	printk(KERN_INFO "[nvdebug] g->name: %s, g->power_on: %d, g->sw_ready: %d, g->is_virtual %d\n", g->name, g->power_on, g->sw_ready, g->is_virtual);
-	struct nvgpu_os_linux *l = container_of(g, struct nvgpu_os_linux, g);
-	printk(KERN_INFO "[nvdebug] l->regs %px, l->regs_saved %px\n", l->regs, l->regs_saved);
-	if (!l->regs)
-		return -EIO;
-	rl_base.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST_BASE);
-	rl_info.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST);
-	runlist_iova = ((u64)rl_base.ptr) << 12;
-	printk(KERN_INFO "[nvdebug] Runlist ptr: %x, type: %d, raw: %x, IOVA: %px\n", rl_base.ptr, rl_base.type, rl_base.raw, (void*)runlist_iova);
-	// Segfaults
-	//u32 attempted_read = ioread32(runlist_iova);
-	//printk(KERN_INFO "[nvdebug] first word of runlist: %0x\n", attempted_read);
-
-	// Errors out
-	//u32* virt_rt_addr = ioremap(phys_rl_addr, sizeof(struct entry_tsg));
-	//printk(KERN_INFO "[nvdebug] Runlist virt_addr: %px\n", virt_rt_addr);
-
-	/* Overcomplicated?
-	struct iommu_domain *domain = iommu_get_domain_for_dev(dev);
-	if (!domain) {
-		printk(KERN_INFO "[nvdebug] No IOMMU domain!\n");
-		return -EIO;
-	}
-	u64 phys_addr = platform_bus_type.iommu_ops->iova_to_phys(domain, runlist_iova);
-	printk(KERN_INFO "[nvdebug] Runlist PA: %px\n", phys_addr);
-	*/
-
-	printk(KERN_INFO "[nvdebug] Runlist phys_to_virt:   %px\n", (void*)phys_to_virt(runlist_iova));
-	printk(KERN_INFO "[nvdebug] Runlist *phys_to_virt:  %x\n", *(u32*)phys_to_virt(runlist_iova));
-	head = *(struct entry_tsg*)phys_to_virt(runlist_iova);
-	nvdebug_print_runlist((struct entry_tsg*)phys_to_virt(runlist_iova), rl_info);
-	//nvdebug_print_tsg(&head);
-	//nvdebug_print_chan((struct runlist_chan*)(phys_to_virt(runlist_iova) + sizeof(struct entry_tsg)));
-	//printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-	//printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-	//printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-	//printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-	//printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-
-	//printk(KERN_INFO "[nvdebug] Mem base phys: %p\n", (void*)virt_to_phys((void*)0xffffffc000000000ULL));
-	//printk(KERN_INFO "[nvdebug] Mem end phys: %p\n", (void*)virt_to_phys((void*)0xffffffc400000000ULL));
-	//printk(KERN_INFO "[nvdebug] Runlist *virt_addr: %x\n", readl(virt_rt_addr)); // This crashes
-	//read_bytes(&head, virt_rt_addr, sizeof(struct entry_tsg));
-	/*printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-	printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-	printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-	printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-	printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-	*/return 0;
-}
-
-static void __exit nvdebug_exit(void) {
-	printk(KERN_INFO "[nvdebug] Exiting...\n");
-}
-
-module_init(nvdebug_init);
-module_exit(nvdebug_exit);
diff --git a/nvdebug.h b/nvdebug.h
index aa5d0cf..b4ff0a4 100644
--- a/nvdebug.h
+++ b/nvdebug.h
@@ -2,6 +2,10 @@
  * SPDX-License-Identifier: MIT
  */
 
+// TODO(jbakita): Don't depend on these.
+#include <nvgpu/gk20a.h>  // For struct gk20a
+#include <os/linux/os_linux.h>  // For struct nvgpu_os_linux
+
 /* Runlist Channel
   A timeslice group (TSG) is composed of channels. Each channel is a FIFO queue
   of GPU commands. These commands are typically queued from userspace.
@@ -125,3 +129,48 @@ typedef union {
 	} __attribute__((packed));
 	uint32_t raw;
 } runlist_info_t;
+
+// TODO(jbakita): Maybe put the above GPU types in a different file.
+
+#define for_chan_in_tsg(chan, tsg) /* Visit each channel entry after tsg; tsg is evaluated repeatedly */ \
+	for ((chan) = (struct runlist_chan*)((tsg) + 1); \
+	     (void*)(chan) < (void*)((tsg) + 1) + sizeof(struct runlist_chan) * (tsg)->tsg_length; \
+	     (chan)++)
+
+#define next_tsg(tsg) /* Address just past tsg and its tsg_length channel entries, as void* */ \
+	((void*)((tsg) + 1) + sizeof(struct runlist_chan) * (tsg)->tsg_length)
+
+struct runlist_iter { // Cursor over a runlist; filled in by get_runlist_iter()
+	struct entry_tsg *curr_tsg; // TSG entry the cursor currently points at
+	runlist_info_t rl_info; // Value read from the NV_PFIFO_RUNLIST register
+};
+
+// Defined in runlist.c. Fills in rl_iter; returns 0 on success or -EIO on failure.
+int get_runlist_iter(struct runlist_iter *rl_iter);
+
+static inline struct gk20a *get_gk20a(struct device *dev) { // dev's driver data -> struct gk20a*
+        // XXX: Only works because gk20a* is the first member of gk20a_platform
+        return *((struct gk20a**)dev_get_drvdata(dev));
+}
+
+// Functionally identical to nvgpu_readl(), except that a NULL regs mapping is
+// logged and (u32)-1 is returned instead of trying to resolve the situation.
+static inline u32 nvdebug_readl(struct gk20a *g, u32 r) {
+	struct nvgpu_os_linux *os_priv = container_of(g, struct nvgpu_os_linux, g);
+	if (likely(os_priv->regs))
+		return readl(os_priv->regs + r);
+	// No register mapping is available, so there is nothing to read
+	printk(KERN_ERR "[nvdebug] Attempted nvgpu_readl on non-existent registers!\n");
+	return -1;
+}
+
+// Functionally identical to nvgpu_writel(); logs and skips the write if regs is NULL
+static inline void nvdebug_writel(struct gk20a *g, u32 r, u32 v) {
+	struct nvgpu_os_linux *os_priv = container_of(g, struct nvgpu_os_linux, g);
+	if (likely(os_priv->regs)) {
+		writel_relaxed(v, os_priv->regs + r);
+		wmb();
+		return;
+	}
+	printk(KERN_ERR "[nvdebug] Attempted nvgpu_writel on non-existent registers!\n");
+}
diff --git a/nvdebug_entry.c b/nvdebug_entry.c
new file mode 100644
index 0000000..148bd3f
--- /dev/null
+++ b/nvdebug_entry.c
@@ -0,0 +1,40 @@
+/* Copyright 2021 Joshua Bakita
+ * SPDX-License-Identifier: MIT
+ */
+
+/* TODO
+ * - Add sysfs trigger for a preemption
+ */
+
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/proc_fs.h> // So we can set up entries in /proc
+
+#include "nvdebug.h"
+
+// LIAR. But without this we can't use GPL-only exported symbols like
+// platform_bus_type or bus_find_device_by_name...
+MODULE_LICENSE("GPL");
+MODULE_AUTHOR("Joshua Bakita");
+MODULE_DESCRIPTION("A scheduling debugging module for NVIDIA GPUs");
+MODULE_SOFTDEP("pre: nvgpu"); // We only support the Jetson boards for now
+
+extern const struct file_operations runlist_file_ops;
+
+// Module load hook: create the read-only /proc/runlist entry backed by runlist_file_ops.
+int __init nvdebug_init(void) {
+	// If creation fails nothing was registered, so there is no entry to remove
+	if (!proc_create("runlist", 0444, NULL, &runlist_file_ops)) {
+		printk(KERN_ERR "[nvdebug] Unable to initialize procfs entries!\n");
+		return -ENOMEM;
+	}
+	return 0;
+}
+
+static void __exit nvdebug_exit(void) { // Module unload hook
+	remove_proc_entry("runlist", NULL); // Take down the "runlist" procfs entry
+	printk(KERN_INFO "[nvdebug] Exiting...\n");
+}
+
+module_init(nvdebug_init);
+module_exit(nvdebug_exit);
diff --git a/runlist.c b/runlist.c
new file mode 100644
index 0000000..8691b51
--- /dev/null
+++ b/runlist.c
@@ -0,0 +1,106 @@
+#include <linux/device.h>  // For struct device, bus_find_device*()
+//#include <linux/iommu.h>  // For struct iommu_domain
+#include <linux/kernel.h>  // Kernel types
+#include <asm/io.h>
+
+#include "nvdebug.h"
+
+// Bus types are global symbols in the kernel
+extern struct bus_type platform_bus_type;
+
+/* get_runlist_iter() - Locate the GPU's current runlist and point rl_iter at it.
+ * @rl_iter: Iterator to fill in. On success, curr_tsg points at the first
+ *           entry of the runlist and rl_info holds the value read from the
+ *           NV_PFIFO_RUNLIST register.
+ *
+ * Looks up the "17000000.gv11b" platform device, reads the runlist base and
+ * runlist info registers, and maps the runlist base to a kernel virtual
+ * address with phys_to_virt(). Progress is logged with printk() on each call.
+ *
+ * Return: 0 on success, or -EIO if no matching device exists or the GPU
+ *         register mapping (l->regs) is NULL.
+ */
+int get_runlist_iter(struct runlist_iter *rl_iter) {
+	struct device *dev = NULL;
+	struct device *temp_dev;
+	struct gk20a *g;
+	struct nvgpu_os_linux *l;
+	runlist_base_t rl_base;
+	runlist_info_t rl_info;
+	u64 runlist_iova;
+	int err = 0;
+
+	// Get the last device that matches our name. Every successful lookup
+	// returns a device with its reference count raised, so release the
+	// previous match once it has served as the starting point of the search.
+	while ((temp_dev = bus_find_device_by_name(&platform_bus_type, dev, "17000000.gv11b"))) {
+		put_device(dev); // No-op when dev is NULL
+		dev = temp_dev;
+		printk(KERN_INFO "[nvdebug] Found a matching device %s\n", dev_name(dev));
+	}
+	if (!dev)
+		return -EIO;
+
+	g = get_gk20a(dev);
+	l = container_of(g, struct nvgpu_os_linux, g);
+
+	// Background on the address stored in NV_PFIFO_RUNLIST_BASE.
+	//
+	// At first, this address seemed to not be:
+	// - A GPU address (type is sysmem_coherent)
+	// - A physical address (dereferencing after ioremap crashes)
+	// - A kernel virtual address (dereferencing segfaults)
+	// It is an address that the GPU can use, so it would make most sense for
+	// it to be a physical address, yet it appeared to refer to an address far
+	// greater than the maximum one on our system.
+	//
+	// The driver calls it runlist_iova, which sounds like a runlist I/O
+	// virtual address; it is what nvgpu_mem_get_addr() returns. That function
+	// returns the result of either:
+	// - gpu_phys_addr, which is __nvgpu_sgl_phys on our platform and (?)
+	//   converts an IPA to a PA
+	// - nvgpu_mem_iommu_translate
+	// The original memory is allocated with nvgpu_dma_alloc_flags_sys(), which
+	// returns SYSMEM.
+	// To convert a physical address to a IOMMU address, we add a bit
+	//
+	// BUT, it turns out that it IS JUST A PHYSICAL ADDRESS! It wasn't working
+	// before because the GPU had simply gone to sleep and invalidated its
+	// register state, so nvgpu_readl() was simply returning garbage.
+	//
+	// Approaches that were tried on this address and abandoned:
+	// - ioread32(runlist_iova): segfaults
+	// - ioremap() of the address: errors out
+	// - iommu_get_domain_for_dev() + iova_to_phys(): overcomplicated
+
+	printk(KERN_INFO "[nvdebug] Pulling runlist base address from %x\n", NV_PFIFO_RUNLIST_BASE);
+	printk(KERN_INFO "[nvdebug] Using struct gk20a* of %px\n", g);
+	printk(KERN_INFO "[nvdebug] g->name: %s, g->power_on: %d, g->sw_ready: %d, g->is_virtual %d\n",
+		g->name, g->power_on, g->sw_ready, g->is_virtual);
+	printk(KERN_INFO "[nvdebug] l->regs %px, l->regs_saved %px\n", l->regs, l->regs_saved);
+	if (!l->regs) {
+		// Without a register mapping there is nothing to read
+		err = -EIO;
+		goto out_put_device;
+	}
+
+	rl_base.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST_BASE);
+	rl_info.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST);
+	// The ptr field is shifted left by 12 bits to form the full address
+	runlist_iova = ((u64)rl_base.ptr) << 12;
+	printk(KERN_INFO "[nvdebug] Runlist ptr: %x, type: %d, raw: %x, IOVA: %px\n",
+		rl_base.ptr, rl_base.type, rl_base.raw, (void*)runlist_iova);
+	printk(KERN_INFO "[nvdebug] Runlist phys_to_virt:   %px\n", (void*)phys_to_virt(runlist_iova));
+	printk(KERN_INFO "[nvdebug] Runlist *phys_to_virt:  %x\n", *(u32*)phys_to_virt(runlist_iova));
+
+	// Hand the caller a cursor positioned on the first runlist entry
+	rl_iter->curr_tsg = (struct entry_tsg*)phys_to_virt(runlist_iova);
+	rl_iter->rl_info = rl_info;
+
+out_put_device:
+	// Drop the reference taken by bus_find_device_by_name().
+	// NOTE(review): this assumes the lifetime of the gk20a state and of the
+	// runlist memory does not depend on holding this reference - confirm.
+	put_device(dev);
+	return err;
+}
diff --git a/runlist_procfs.c b/runlist_procfs.c
new file mode 100644
index 0000000..2107bd4
--- /dev/null
+++ b/runlist_procfs.c
@@ -0,0 +1,102 @@
+#include <linux/seq_file.h> // For seq_* functions and types
+
+#include "nvdebug.h"
+
+#define RUNLIST_PROCFS_NAME "runlist"
+
+// seq_file .start: fetch the runlist when a traversal begins (*pos == 0).
+// NOTE(review): rl_iter is one static object shared by all readers, and a
+// restart at a non-zero *pos ends the output early - confirm both are intended.
+static void *runlist_file_seq_start(struct seq_file *s, loff_t *pos) {
+	static struct runlist_iter rl_iter;
+	// When called with *pos != 0, we already traversed the runlist
+	if (*pos != 0)
+		return NULL;
+	// *pos == 0 for first call after read of file
+	if (get_runlist_iter(&rl_iter) != 0)
+		return NULL;
+	return &rl_iter;
+}
+
+// seq_file .next: step the iterator past the current TSG and all of its channels.
+static void* runlist_file_seq_next(struct seq_file *s, void *raw_rl_iter,
+				   loff_t *pos) {
+	struct runlist_iter *iter = raw_rl_iter;
+	struct entry_tsg *tsg = iter->curr_tsg;
+	// One entry for the TSG itself, plus one per channel listed under it
+	*pos += 1 + tsg->tsg_length;
+	// rl_info.len is the num of tsg entries + total num of channel entries
+	if (*pos >= iter->rl_info.len)
+		return NULL;
+	iter->curr_tsg = next_tsg(tsg);
+	return iter;
+}
+
+static void runlist_file_seq_stop(struct seq_file *s, void *raw_rl_iter) {
+	// seq_file .stop: intentionally empty, this function releases nothing
+}
+
+// seq_file .show: print the current TSG entry followed by each of its channels.
+// Returns 0 on success, or -EIO on an unexpected entry type or aperture.
+static int runlist_file_seq_show(struct seq_file *s, void *raw_rl_iter) {
+	struct entry_tsg* tsg = ((struct runlist_iter*)raw_rl_iter)->curr_tsg;
+	struct runlist_chan* chan;
+	if (tsg->entry_type != ENTRY_TYPE_TSG) {
+		printk(KERN_WARNING "[nvdebug] Attempted to print non-TSG in nvdebug_print_tsg()!\n");
+		return -EIO;
+	}
+	seq_printf(s, "+---- TSG Entry %-2d----+\n", tsg->tsgid);
+	seq_printf(s, "| Scale: %-13d|\n", tsg->timeslice_scale);
+	seq_printf(s, "| Timeout: %-11d|\n", tsg->timeslice_timeout);
+	seq_printf(s, "+---------------------+\n");
+	for_chan_in_tsg(chan, tsg) {
+		char* loc_txt;
+		u64 instance_ptr;
+		if (chan->entry_type != ENTRY_TYPE_CHAN) {
+			printk(KERN_WARNING "[nvdebug] Attempted to print non-channel in nvdebug_print_channel()!\n");
+			return -EIO;
+		}
+		switch (chan->inst_target) {
+			case TARGET_VID_MEM:
+				loc_txt = "VID_MEM";
+				break;
+			case TARGET_SYS_MEM_COHERENT:
+				loc_txt = "SYS_MEM_COHERENT";
+				break;
+			case TARGET_SYS_MEM_NONCOHERENT:
+				loc_txt = "SYS_MEM_NONCOHERENT";
+				break;
+			default:
+				printk(KERN_WARNING "[nvdebug] Invalid aperture in runlist channel!\n");
+				return -EIO;
+		}
+		// Reconstruct pointer to channel instance block. Each half is widened
+		// to 64 bits first so that neither shift is done in a narrower type.
+		instance_ptr = ((u64)chan->inst_ptr_hi << 32) | ((u64)chan->inst_ptr_lo << 12);
+		seq_printf(s, "  +- Channel Entry %-4d-+\n", chan->chid);
+		seq_printf(s, "  | Runqueue Selector: %d|\n", chan->runqueue_selector);
+		seq_printf(s, "  | Instance PTR:       |\n");
+		seq_printf(s, "  | %#018llx  |\n", instance_ptr);
+		seq_printf(s, "  | %-20s|\n", loc_txt);
+		seq_printf(s, "  +---------------------+\n");
+	}
+	return 0;
+}
+
+static const struct seq_operations runlist_file_seq_ops = { // Iterator callbacks for the runlist file
+        .start = runlist_file_seq_start, // Fetches the runlist when *pos == 0
+        .next = runlist_file_seq_next, // Advances to the following TSG entry
+        .stop = runlist_file_seq_stop, // Empty; does no cleanup
+        .show = runlist_file_seq_show, // Prints one TSG and its channels
+};
+
+static int runlist_file_open(struct inode *inode, struct file *f) { // .open handler
+	return seq_open(f, &runlist_file_seq_ops); // Attach the seq_file callbacks to f
+}
+
+const struct file_operations runlist_file_ops = { // Passed to proc_create() in nvdebug_entry.c
+	.open = runlist_file_open, // Sets up the seq_file iterator
+	.read = seq_read, // Stock seq_file helper
+	.llseek = seq_lseek, // Stock seq_file helper
+	.release = seq_release, // Stock seq_file helper
+};
-- 
cgit v1.2.2