6 files changed, 298 insertions, 278 deletions
diff --git a/Makefile b/Makefile
index cc14996..5d61177 100644
--- a/Makefile
+++ b/Makefile
@@ -1,4 +1,5 @@
 obj-m += nvdebug.o
+nvdebug-objs = runlist_procfs.o runlist.o nvdebug_entry.o
 # TODO: Avoid needing to distribute NVIDIA's headers (at least they're MIT...)
 #ccflags-y += -I$(PWD)/include
diff --git a/nvdebug.c b/nvdebug.c
deleted file mode 100644
index 31a797e..0000000
--- a/nvdebug.c
+++ /dev/null
@@ -1,278 +0,0 @@
-/* Copyright 2021 Joshua Bakita
- * SPDX-License-Identifier: MIT
- */
-/* TODO
- * - Add /proc /sys or debugfs interface
- * - Add API to trigger a preemption
- */
-#include <linux/module.h>
-#include <linux/kernel.h>
-#include <linux/device.h>
-#include <linux/kallsyms.h>
-#include <linux/iommu.h> // For struct iommu_domain
-#include <asm/io.h>
-/* Currently used symbols:
- * - struct gk20a;
- * - struct nvgpu_os_linux;
- * - void nvgpu_writel(struct gk20a *g, u32 reg_addr, u32 value);
- */
-#include <nvgpu/io.h>
-#include <nvgpu/gk20a.h>
-#include <os/linux/os_linux.h>
-#include "nvdebug.h"
-MODULE_LICENSE("GPL"); // LIAR
-MODULE_AUTHOR("Joshua Bakita");
-MODULE_DESCRIPTION("A scheduling debugging module for NVIDIA GPUs");
-MODULE_SOFTDEP("pre: nvgpu"); // We only support the Jetson boards for now
-// Bus types are global symbols in the kernel
-extern struct bus_type platform_bus_type;
-static inline struct gk20a *get_gk20a(struct device *dev) {
-        // XXX: Only works because gk20a* is the first member of gk20a_platform
-        return *((struct gk20a**)dev_get_drvdata(dev));
-}
-// Functionally identical to nvgpu_readl()
-// (except we don't try to resolve situations where regs is NULL)
-static inline u32 nvdebug_readl(struct gk20a* g, u32 r) {
-        struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-        if (unlikely(!g_os->regs)) {
-                printk(KERN_ERR "[nvdebug] Attempted nvgpu_readl on non-existent registers!\n");
-                return -1;
-        }
-        return readl(g_os->regs + r);
-}
-// Functionally identical to nvgpu_writel()
-static inline void nvdebug_writel(struct gk20a* g, u32 r, u32 v) {
-        struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
-        if (unlikely(!g_os->regs)) {
-                printk(KERN_ERR "[nvdebug] Attempted nvgpu_writel on non-existent registers!\n");
-                return;
-        }       
-        writel_relaxed(v, g_os->regs + r);
-        wmb();
-}
-/*
-#define RUNLIST_PROCFS_NAME "runlist"
-static const struct seq_operations runlist_file_seq_ops = {
-        .start = 
-        .next =
-        .stop =
-        .show =
-};
-static const struct file_operations runlist_file_ops = {
-        .read = 
-*/
-/*static void read_bytes(struct gk20a *g, void* target, u32 start, u32 num_bytes) {
-        u32 *output = target;
-        u32 i;
-        // Read u32s from the GPU
-        for (i = 0; i < num_bytes; i += 4) {
-                output[i/4] = _nvgpu_readl(g, start + i);
-                printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-        }
-}
-static void read_bytes(void* target, void* start, u32 num_bytes) {
-        u32 *output = target;
-        u32 i;
-        // Read u32s from the GPU
-        for (i = 0; i < num_bytes; i += 4) {
-                output[i/4] = readl(start + i);
-                printk(KERN_INFO "[nvdebug] U32 %d: %0x\n", i, output[i/4]);
-        }
-}*/
-/*
-  +---- TSG Entry %d ----+
-  | Scale: %d            |
-  | Timeout: %d          |
-  +----------------------+
-*/
-#define PRE KERN_INFO "[nvdebug] "
-static void nvdebug_print_tsg(struct entry_tsg* tsg) {
-        if (tsg->entry_type != ENTRY_TYPE_TSG) {
-                printk(KERN_WARNING "[nvdebug] Attempted to print non-TSG in nvdebug_print_tsg()!\n");
-                return;
-        }
-        printk(PRE "+---- TSG Entry %-2d----+", tsg->tsgid);
-        printk(PRE "| Scale: %-13d|", tsg->timeslice_scale);
-        printk(PRE "| Timeout: %-11d|", tsg->timeslice_timeout);
-        printk(PRE "+---------------------+");
-}
-static void nvdebug_print_chan(struct runlist_chan* chan) {
-        char* loc_txt;
-        u64 inst_ptr;
-        if (chan->entry_type != ENTRY_TYPE_CHAN) {
-                printk(KERN_WARNING "[nvdebug] Attempted to print non-channel in nvdebug_print_channel()!\n");
-                return;
-        }
-        switch (chan->inst_target) {
-                case TARGET_VID_MEM:
-                        loc_txt = "VID_MEM";
-                        break;
-                case TARGET_SYS_MEM_COHERENT:
-                        loc_txt = "SYS_MEM_COHERENT";
-                        break;
-                case TARGET_SYS_MEM_NONCOHERENT:
-                        loc_txt = "SYS_MEM_NONCOHERENT";
-                        break;
-                default:
-                        printk(KERN_WARNING "[nvdebug] Invalid aperture in runlist channel!\n");
-                        return;
-        }
-        // Reconstruct pointer to channel instance block
-        inst_ptr = chan->inst_ptr_hi;
-        inst_ptr <<= 32;
-        inst_ptr |= chan->inst_ptr_lo << 12;
-        printk(PRE "  +- Channel Entry %-4d-+", chan->chid);
-        printk(PRE "  | Runqueue Selector: %d|", chan->runqueue_selector);
-        printk(PRE "  | Instance PTR:       |");
-        printk(PRE "  | %#018llx  |", inst_ptr);
-        printk(PRE "  | %-20s|", loc_txt);
-        printk(PRE "  +---------------------+");
-}
-#define for_chan_in_tsg(chan, tsg) \
-        for (chan = (struct runlist_chan*)(tsg + 1); \
-             (void*)chan < (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length; \
-             chan++)
-#define next_tsg(tsg) \
-        (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length
-static void nvdebug_print_runlist(struct entry_tsg* head, runlist_info_t rl_info) {
-        int rl_idx = 0;
-        struct runlist_chan* chan;
-        printk(PRE "tsg->tsg_length: %d\n", head->tsg_length);
-        printk(PRE "rl_info.len: %d\n", rl_info.len);
-        while (rl_idx < rl_info.len) {
-                nvdebug_print_tsg(head);
-                for_chan_in_tsg(chan, head) {
-                        nvdebug_print_chan(chan);
-                }
-                rl_idx += 1 + head->tsg_length;
-                head = next_tsg(head);
-        }
-}
-static int __init nvdebug_init(void) {
-        struct device *dev = NULL;
-        struct device *temp_dev;
-        struct gk20a *g;
-        struct entry_tsg head;
-        runlist_base_t rl_base;
-        runlist_info_t rl_info;
-        u64 runlist_iova;
-        // Get the last device that matches our name
-        while ((temp_dev = bus_find_device_by_name(&platform_bus_type, dev, "17000000.gv11b"))) {
-                printk(KERN_INFO "Found a matching device\n");
-                dev = temp_dev;
-        }
-        if (!dev)
-                return -EIO;
-        g = get_gk20a(dev);
-        // This address seems to not be:
-        // - A GPU address (type is sysmem_coherent)
-        // - A physical address (dereferencing after ioremap crashes)
-        // - A kernel virtual address (dereferencing segfaults)
-        // So maybe it's some sort of custom thing? This is an address that the GPU
-        // can use, so it would make most sense for it to be a physical address.
-        //
-        // BUT, it can't possibly be a physical address, as it would refer to an
-        // address greater than the maximum one on our system (by a lot!).
-        // Maybe I'm reading the runlist base wrong?
-        // Aha, the driver calls it runlist_iova. Sounds like runlist I/O virtual
-        // address! So, what's this I/O address space? All I know is that it's what
-        // nvgpu_mem_get_addr() returns. That function returns the result of either:
-        // - gpu_phys_addr which is  __nvgpu_sgl_phys on our platform which (?)
-        //   converts an IPA to a PA?
-        // - nvgpu_mem_iommu_translate
-        //
-        // The original memory is allocated with nvgpu_dma_alloc_flags_sys(), which
-        // returns SYSMEM.
-        //
-        // To convert a physical address to a IOMMU address, we add a bit
-        //
-        // BUT, it turns out that it IS JUST A PHYSICAL ADDRESS! It wasn't working
-        // before because the GPU had simply gone to sleep and invalidated its
-        // register state, so nvgpu_readl() was simply returning garbage.
-        printk(KERN_INFO "[nvdebug] Pulling runlist base address from %x\n", NV_PFIFO_RUNLIST_BASE);
-        printk(KERN_INFO "[nvdebug] Using struct gk20a* of %px\n", g);
-        printk(KERN_INFO "[nvdebug] g->name: %s, g->power_on: %d, g->sw_ready: %d, g->is_virtual %d\n", g->name, g->power_on, g->sw_ready, g->is_virtual);
-        struct nvgpu_os_linux *l = container_of(g, struct nvgpu_os_linux, g);
-        printk(KERN_INFO "[nvdebug] l->regs %px, l->regs_saved %px\n", l->regs, l->regs_saved);
-        if (!l->regs)
-                return -EIO;
-        rl_base.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST_BASE);
-        rl_info.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST);
-        runlist_iova = ((u64)rl_base.ptr) << 12;
-        printk(KERN_INFO "[nvdebug] Runlist ptr: %x, type: %d, raw: %x, IOVA: %px\n", rl_base.ptr, rl_base.type, rl_base.raw, (void*)runlist_iova);
-        // Segfaults
-        //u32 attempted_read = ioread32(runlist_iova);
-        //printk(KERN_INFO "[nvdebug] first word of runlist: %0x\n", attempted_read);
-        // Errors out
-        //u32* virt_rt_addr = ioremap(phys_rl_addr, sizeof(struct entry_tsg));
-        //printk(KERN_INFO "[nvdebug] Runlist virt_addr: %px\n", virt_rt_addr);
-        /* Overcomplicated?
-        struct iommu_domain *domain = iommu_get_domain_for_dev(dev);
-        if (!domain) {
-                printk(KERN_INFO "[nvdebug] No IOMMU domain!\n");
-                return -EIO;
-        }
-        u64 phys_addr = platform_bus_type.iommu_ops->iova_to_phys(domain, runlist_iova);
-        printk(KERN_INFO "[nvdebug] Runlist PA: %px\n", phys_addr);
-        */
-        printk(KERN_INFO "[nvdebug] Runlist phys_to_virt:   %px\n", (void*)phys_to_virt(runlist_iova));
-        printk(KERN_INFO "[nvdebug] Runlist *phys_to_virt:  %x\n", *(u32*)phys_to_virt(runlist_iova));
-        head = *(struct entry_tsg*)phys_to_virt(runlist_iova);
-        nvdebug_print_runlist((struct entry_tsg*)phys_to_virt(runlist_iova), rl_info);
-        //nvdebug_print_tsg(&head);
-        //nvdebug_print_chan((struct runlist_chan*)(phys_to_virt(runlist_iova) + sizeof(struct entry_tsg)));
-        //printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-        //printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-        //printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-        //printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-        //printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-        //printk(KERN_INFO "[nvdebug] Mem base phys: %p\n", (void*)virt_to_phys((void*)0xffffffc000000000ULL));
-        //printk(KERN_INFO "[nvdebug] Mem end phys: %p\n", (void*)virt_to_phys((void*)0xffffffc400000000ULL));
-        //printk(KERN_INFO "[nvdebug] Runlist *virt_addr: %x\n", readl(virt_rt_addr)); // This crashes
-        //read_bytes(&head, virt_rt_addr, sizeof(struct entry_tsg));
-        /*printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
-        printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
-        printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
-        printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
-        printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
-        */return 0;
-}
-static void __exit nvdebug_exit(void) {
-        printk(KERN_INFO "[nvdebug] Exiting...\n");
-}
-module_init(nvdebug_init);
-module_exit(nvdebug_exit);
diff --git a/nvdebug.h b/nvdebug.h
index aa5d0cf..b4ff0a4 100644
--- a/nvdebug.h
+++ b/nvdebug.h
@@ -2,6 +2,10 @@
 * SPDX-License-Identifier: MIT
 */
+// TODO(jbakita): Don't depend on these.
+#include <nvgpu/gk20a.h>  // For struct gk20a
+#include <os/linux/os_linux.h>  // For struct nvgpu_os_linux
 /* Runlist Channel
  A timeslice group (TSG) is composed of channels. Each channel is a FIFO queue
  of GPU commands. These commands are typically queued from userspace.
@@ -125,3 +129,48 @@ typedef union {
        } __attribute__((packed));
        uint32_t raw;
 } runlist_info_t;
+// TODO(jbakita): Maybe put the above GPU types in a different file.
+#define for_chan_in_tsg(chan, tsg) \
+        for (chan = (struct runlist_chan*)(tsg + 1); \
+             (void*)chan < (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length; \
+             chan++)
+#define next_tsg(tsg) \
+        (void*)(tsg + 1) + sizeof(struct runlist_chan) * tsg->tsg_length
+struct runlist_iter {
+        struct entry_tsg *curr_tsg;
+        runlist_info_t rl_info;
+};
+// Defined in runlist.c
+int get_runlist_iter(struct runlist_iter *rl_iter);
+static inline struct gk20a *get_gk20a(struct device *dev) {
+        // XXX: Only works because gk20a* is the first member of gk20a_platform
+        return *((struct gk20a**)dev_get_drvdata(dev));
+}
+// Functionally identical to nvgpu_readl()
+// (except we don't try to resolve situations where regs is NULL)
+static inline u32 nvdebug_readl(struct gk20a* g, u32 r) {
+        struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
+        if (unlikely(!g_os->regs)) {
+                printk(KERN_ERR "[nvdebug] Attempted nvgpu_readl on non-existent registers!\n");
+                return -1;
+        }
+        return readl(g_os->regs + r);
+}
+// Functionally identical to nvgpu_writel()
+static inline void nvdebug_writel(struct gk20a* g, u32 r, u32 v) {
+        struct nvgpu_os_linux* g_os = container_of(g, struct nvgpu_os_linux, g);
+        if (unlikely(!g_os->regs)) {
+                printk(KERN_ERR "[nvdebug] Attempted nvgpu_writel on non-existent registers!\n");
+                return;
+        }
+        writel_relaxed(v, g_os->regs + r);
+        wmb();
+}
diff --git a/nvdebug_entry.c b/nvdebug_entry.c
new file mode 100644
index 0000000..148bd3f
--- /dev/null
+++ b/nvdebug_entry.c
@@ -0,0 +1,40 @@
+/* Copyright 2021 Joshua Bakita
+ * SPDX-License-Identifier: MIT
+ */
+/* TODO
+ * - Add sysfs trigger for a preemption
+ */
+#include <linux/kernel.h>
+#include <linux/module.h>
+#include <linux/proc_fs.h> // So we can set up entries in /proc
+#include "nvdebug.h"
+// LIAR. But without this we can't use GPL-only exported symbols like
+// platform_bus_type or bus_find_device_by_name...
+MODULE_LICENSE("GPL");
+MODULE_AUTHOR("Joshua Bakita");
+MODULE_DESCRIPTION("A scheduling debugging module for NVIDIA GPUs");
+MODULE_SOFTDEP("pre: nvgpu"); // We only support the Jetson boards for now
+extern const struct file_operations runlist_file_ops;
+int __init nvdebug_init(void) {
+        struct proc_dir_entry *entry = proc_create("runlist", 0444, NULL, &runlist_file_ops);
+        if (!entry) {
+                remove_proc_entry("runlist", NULL);
+                printk(KERN_ERR "[nvdebug] Unable to initialize procfs entries!\n");
+                return -ENOMEM;
+        }
+        return 0;
+}
+static void __exit nvdebug_exit(void) {
+        remove_proc_entry("runlist", NULL);
+        printk(KERN_INFO "[nvdebug] Exiting...\n");
+}
+module_init(nvdebug_init);
+module_exit(nvdebug_exit);
diff --git a/runlist.c b/runlist.c
new file mode 100644
index 0000000..8691b51
--- /dev/null
+++ b/runlist.c
@@ -0,0 +1,106 @@
+#include <linux/device.h>  // For struct device, bus_find_device*()
+//#include <linux/iommu.h>  // For struct iommu_domain
+#include <linux/kernel.h>  // Kernel types
+#include <asm/io.h>
+#include "nvdebug.h"
+// Bus types are global symbols in the kernel
+extern struct bus_type platform_bus_type;
+int get_runlist_iter(struct runlist_iter *rl_iter) {
+        struct device *dev = NULL;
+        struct device *temp_dev;
+        struct gk20a *g;
+        struct entry_tsg head;
+        runlist_base_t rl_base;
+        runlist_info_t rl_info;
+        u64 runlist_iova;
+        // Get the last device that matches our name
+        while ((temp_dev = bus_find_device_by_name(&platform_bus_type, dev, "17000000.gv11b"))) {
+                dev = temp_dev;
+                printk(KERN_INFO "[nvdebug] Found a matching device %s\n", dev_name(dev));
+        }
+        if (!dev)
+                return -EIO;
+        g = get_gk20a(dev);
+        // This address seems to not be:
+        // - A GPU address (type is sysmem_coherent)
+        // - A physical address (dereferencing after ioremap crashes)
+        // - A kernel virtual address (dereferencing segfaults)
+        // So maybe it's some sort of custom thing? This is an address that the GPU
+        // can use, so it would make most sense for it to be a physical address.
+        //
+        // BUT, it can't possibly be a physical address, as it would refer to an
+        // address greater than the maximum one on our system (by a lot!).
+        // Maybe I'm reading the runlist base wrong?
+        // Aha, the driver calls it runlist_iova. Sounds like runlist I/O virtual
+        // address! So, what's this I/O address space? All I know is that it's what
+        // nvgpu_mem_get_addr() returns. That function returns the result of either:
+        // - gpu_phys_addr which is  __nvgpu_sgl_phys on our platform which (?)
+        //   converts an IPA to a PA?
+        // - nvgpu_mem_iommu_translate
+        //
+        // The original memory is allocated with nvgpu_dma_alloc_flags_sys(), which
+        // returns SYSMEM.
+        //
+        // To convert a physical address to a IOMMU address, we add a bit
+        //
+        // BUT, it turns out that it IS JUST A PHYSICAL ADDRESS! It wasn't working
+        // before because the GPU had simply gone to sleep and invalidated its
+        // register state, so nvgpu_readl() was simply returning garbage.
+        printk(KERN_INFO "[nvdebug] Pulling runlist base address from %x\n", NV_PFIFO_RUNLIST_BASE);
+        printk(KERN_INFO "[nvdebug] Using struct gk20a* of %px\n", g);
+        printk(KERN_INFO "[nvdebug] g->name: %s, g->power_on: %d, g->sw_ready: %d, g->is_virtual %d\n",
+                g->name, g->power_on, g->sw_ready, g->is_virtual);
+        struct nvgpu_os_linux *l = container_of(g, struct nvgpu_os_linux, g);
+        printk(KERN_INFO "[nvdebug] l->regs %px, l->regs_saved %px\n", l->regs, l->regs_saved);
+        if (!l->regs)
+                return -EIO;
+        rl_base.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST_BASE);
+        rl_info.raw = nvdebug_readl(g, NV_PFIFO_RUNLIST);
+        runlist_iova = ((u64)rl_base.ptr) << 12;
+        printk(KERN_INFO "[nvdebug] Runlist ptr: %x, type: %d, raw: %x, IOVA: %px\n",
+                rl_base.ptr, rl_base.type, rl_base.raw, (void*)runlist_iova);
+        // Segfaults
+        //u32 attempted_read = ioread32(runlist_iova);
+        //printk(KERN_INFO "[nvdebug] first word of runlist: %0x\n", attempted_read);
+        // Errors out
+        //u32* virt_rt_addr = ioremap(phys_rl_addr, sizeof(struct entry_tsg));
+        //printk(KERN_INFO "[nvdebug] Runlist virt_addr: %px\n", virt_rt_addr);
+        /* Overcomplicated?
+        struct iommu_domain *domain = iommu_get_domain_for_dev(dev);
+        if (!domain) {
+                printk(KERN_INFO "[nvdebug] No IOMMU domain!\n");
+                return -EIO;
+        }
+        u64 phys_addr = platform_bus_type.iommu_ops->iova_to_phys(domain, runlist_iova);
+        printk(KERN_INFO "[nvdebug] Runlist PA: %px\n", phys_addr);
+        */
+        printk(KERN_INFO "[nvdebug] Runlist phys_to_virt:   %px\n", (void*)phys_to_virt(runlist_iova));
+        printk(KERN_INFO "[nvdebug] Runlist *phys_to_virt:  %x\n", *(u32*)phys_to_virt(runlist_iova));
+        head = *(struct entry_tsg*)phys_to_virt(runlist_iova);
+        rl_iter->curr_tsg = (struct entry_tsg*)phys_to_virt(runlist_iova);
+        rl_iter->rl_info = rl_info;
+        return 0;
+        //printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
+        //printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
+        //printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
+        //printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
+        //printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid);
+        //printk(KERN_INFO "[nvdebug] Mem base phys: %p\n", (void*)virt_to_phys((void*)0xffffffc000000000ULL));
+        //printk(KERN_INFO "[nvdebug] Mem end phys: %p\n", (void*)virt_to_phys((void*)0xffffffc400000000ULL));
+        //printk(KERN_INFO "[nvdebug] Runlist *virt_addr: %x\n", readl(virt_rt_addr)); // This crashes
+        //read_bytes(&head, virt_rt_addr, sizeof(struct entry_tsg));
+        /*printk(KERN_INFO "[nvdebug] entry_type: %d\n", head.entry_type);
+        printk(KERN_INFO "[nvdebug] timeslice_scale: %d\n", head.timeslice_scale);
+        printk(KERN_INFO "[nvdebug] timeslice_timeout: %d\n", head.timeslice_timeout);
+        printk(KERN_INFO "[nvdebug] tsg_length: %d\n", head.tsg_length);
+        printk(KERN_INFO "[nvdebug] tsgid: %d\n", head.tsgid); */
+}
diff --git a/runlist_procfs.c b/runlist_procfs.c
new file mode 100644
index 0000000..2107bd4
--- /dev/null
+++ b/runlist_procfs.c
@@ -0,0 +1,102 @@
+#include <linux/seq_file.h> // For seq_* functions and types
+#include "nvdebug.h"
+#define RUNLIST_PROCFS_NAME "runlist"
+static void *runlist_file_seq_start(struct seq_file *s, loff_t *pos) {
+        static struct runlist_iter rl_iter;
+        // *pos == 0 for first call after read of file
+        if (*pos == 0) {
+                int err = get_runlist_iter(&rl_iter);
+                if (err)
+                        return NULL;
+                return &rl_iter;
+        }
+        // When called with *pos != 0, we already traversed the runlist
+        return NULL;
+}
+static void* runlist_file_seq_next(struct seq_file *s, void *raw_rl_iter,
+                                   loff_t *pos) {
+        struct runlist_iter* rl_iter = raw_rl_iter;
+        // Advance by one TSG + channels under last TSG
+        *pos += 1 + rl_iter->curr_tsg->tsg_length;
+        // Verify we haven't reached the end of the runlist
+        // rl_info.len is the num of tsg entries + total num of channel entries
+        if (*pos < rl_iter->rl_info.len) {
+                rl_iter->curr_tsg = next_tsg(rl_iter->curr_tsg);
+                return rl_iter;
+        }
+        return NULL;
+}
+static void runlist_file_seq_stop(struct seq_file *s, void *raw_rl_iter) {
+        // No cleanup needed
+}
+static int runlist_file_seq_show(struct seq_file *s, void *raw_rl_iter) {
+        struct entry_tsg* tsg = ((struct runlist_iter*)raw_rl_iter)->curr_tsg;
+        struct runlist_chan* chan;
+        if (tsg->entry_type != ENTRY_TYPE_TSG) {
+                printk(KERN_WARNING "[nvdebug] Attempted to print non-TSG in nvdebug_print_tsg()!\n");
+                return -EIO;
+        }
+        seq_printf(s, "+---- TSG Entry %-2d----+\n", tsg->tsgid);
+        seq_printf(s, "| Scale: %-13d|\n", tsg->timeslice_scale);
+        seq_printf(s, "| Timeout: %-11d|\n", tsg->timeslice_timeout);
+        seq_printf(s, "+---------------------+\n");
+        for_chan_in_tsg(chan, tsg) {
+                char* loc_txt;
+                u64 instance_ptr;
+                if (chan->entry_type != ENTRY_TYPE_CHAN) {
+                        printk(KERN_WARNING "[nvdebug] Attempted to print non-channel in nvdebug_print_channel()!\n");
+                        return -EIO;
+                }
+                switch (chan->inst_target) {
+                        case TARGET_VID_MEM:
+                                loc_txt = "VID_MEM";
+                                break;
+                        case TARGET_SYS_MEM_COHERENT:
+                                loc_txt = "SYS_MEM_COHERENT";
+                                break;
+                        case TARGET_SYS_MEM_NONCOHERENT:
+                                loc_txt = "SYS_MEM_NONCOHERENT";
+                                break;
+                        default:
+                                printk(KERN_WARNING "[nvdebug] Invalid aperture in runlist channel!\n");
+                                return -EIO;
+                }
+                // Reconstruct pointer to channel instance block
+                instance_ptr = chan->inst_ptr_hi;
+                instance_ptr <<= 32;
+                instance_ptr |= chan->inst_ptr_lo << 12;
+                seq_printf(s, "  +- Channel Entry %-4d-+\n", chan->chid);
+                seq_printf(s, "  | Runqueue Selector: %d|\n", chan->runqueue_selector);
+                seq_printf(s, "  | Instance PTR:       |\n");
+                seq_printf(s, "  | %#018llx  |\n", instance_ptr);
+                seq_printf(s, "  | %-20s|\n", loc_txt);
+                seq_printf(s, "  +---------------------+\n");
+        }
+        return 0;
+}
+static const struct seq_operations runlist_file_seq_ops = {
+        .start = runlist_file_seq_start,
+        .next = runlist_file_seq_next,
+        .stop = runlist_file_seq_stop,
+        .show = runlist_file_seq_show,
+};
+static int runlist_file_open(struct inode *inode, struct file *f) {
+        return seq_open(f, &runlist_file_seq_ops);
+}
+const struct file_operations runlist_file_ops = {
+        .open = runlist_file_open,
+        .read = seq_read,
+        .llseek = seq_lseek,
+        .release = seq_release,
+};