/*
 * GK20A Address Spaces
 *
 * Copyright (c) 2011-2018, NVIDIA CORPORATION.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 */

#include <linux/cdev.h>
#include <linux/uaccess.h>
#include <linux/fs.h>
#include <linux/dma-buf.h>

#include <trace/events/gk20a.h>

#include <uapi/linux/nvgpu.h>

#include <nvgpu/gmmu.h>
#include <nvgpu/vm_area.h>
#include <nvgpu/log2.h>
#include <nvgpu/gk20a.h>
#include <nvgpu/channel.h>

#include <nvgpu/linux/vm.h>

#include "platform_gk20a.h"
#include "ioctl_as.h"
#include "os_linux.h"

#include <linux/nvmap.h> // For nvmap_dmabuf_{d/r}ealloc()
#include "dmabuf.h" // struct dma_buf things for swapping
#include "swap.h"

static u32 gk20a_as_translate_as_alloc_space_flags(struct gk20a *g, u32 flags)
{
	u32 core_flags = 0;

	if (flags & NVGPU_AS_ALLOC_SPACE_FLAGS_FIXED_OFFSET)
		core_flags |= NVGPU_VM_AREA_ALLOC_FIXED_OFFSET;
	if (flags & NVGPU_AS_ALLOC_SPACE_FLAGS_SPARSE)
		core_flags |= NVGPU_VM_AREA_ALLOC_SPARSE;

	return core_flags;
}

static int gk20a_as_ioctl_bind_channel(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_bind_channel_args *args)
{
	int err = 0;
	struct channel_gk20a *ch;
	struct gk20a *g = gk20a_from_vm(as_share->vm);

	nvgpu_log_fn(g, " ");

	ch = gk20a_get_channel_from_file(args->channel_fd);
	if (!ch)
		return -EINVAL;

	if (gk20a_channel_as_bound(ch)) {
		err = -EINVAL;
		goto out;
	}

	/* this will set channel_gk20a->vm */
	err = ch->g->ops.mm.vm_bind_channel(as_share->vm, ch);

out:
	gk20a_channel_put(ch);
	return err;
}

static int gk20a_as_ioctl_alloc_space(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_alloc_space_args *args)
{
	struct gk20a *g = gk20a_from_vm(as_share->vm);

	nvgpu_log_fn(g, " ");
	return nvgpu_vm_area_alloc(as_share->vm, args->pages, args->page_size,
			&args->o_a.offset,
			gk20a_as_translate_as_alloc_space_flags(g,
							args->flags));
}

static int gk20a_as_ioctl_free_space(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_free_space_args *args)
{
	struct gk20a *g = gk20a_from_vm(as_share->vm);

	nvgpu_log_fn(g, " ");
	return nvgpu_vm_area_free(as_share->vm, args->offset);
}

static int gk20a_as_ioctl_map_buffer_ex(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_map_buffer_ex_args *args)
{
	struct gk20a *g = gk20a_from_vm(as_share->vm);

	nvgpu_log_fn(g, " ");

	/* unsupported, direct kind control must be used */
	if (!(args->flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL)) {
		struct gk20a *g = as_share->vm->mm->g;
		nvgpu_log_info(g, "Direct kind control must be requested");
		return -EINVAL;
	}

	return nvgpu_vm_map_buffer(as_share->vm, args->dmabuf_fd,
			&args->offset, args->flags,
			args->page_size,
			args->compr_kind,
			args->incompr_kind,
			args->buffer_offset,
			args->mapping_size,
			NULL);
}

static int gk20a_as_ioctl_unmap_buffer(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_unmap_buffer_args *args)
{
	struct gk20a *g = gk20a_from_vm(as_share->vm);

	nvgpu_log_fn(g, " ");

	nvgpu_vm_unmap(as_share->vm, args->offset, NULL);

	return 0;
}
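/*
 * Example (userspace sketch, not part of this driver): the map handler above
 * rejects any request that does not set
 * NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL, so a caller has to fill in the
 * kind fields explicitly. as_fd and buf_fd are assumed to be an open AS
 * device fd and a dmabuf fd obtained elsewhere; the kind values and the
 * "0 = whole buffer / best fit" conventions follow the uapi comments and are
 * illustrative only.
 *
 *	#include <sys/ioctl.h>
 *	#include <linux/nvgpu.h>
 *
 *	static int map_then_unmap(int as_fd, int buf_fd)
 *	{
 *		struct nvgpu_as_map_buffer_ex_args map = {
 *			.flags = NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL,
 *			.compr_kind = -1,	// assumed: no compressed kind
 *			.incompr_kind = 0,	// assumed: generic pitch kind
 *			.dmabuf_fd = buf_fd,
 *			.page_size = 0,		// let the driver pick
 *			.buffer_offset = 0,
 *			.mapping_size = 0,	// map the whole buffer
 *		};
 *		struct nvgpu_as_unmap_buffer_args unmap;
 *
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_MAP_BUFFER_EX, &map) < 0)
 *			return -1;
 *		// map.offset now holds the GPU virtual address of the mapping
 *		unmap.offset = map.offset;
 *		return ioctl(as_fd, NVGPU_AS_IOCTL_UNMAP_BUFFER, &unmap);
 *	}
 */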
static int gk20a_as_ioctl_map_buffer_batch(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_map_buffer_batch_args *args)
{
	struct gk20a *g = gk20a_from_vm(as_share->vm);
	u32 i;
	int err = 0;

	struct nvgpu_as_unmap_buffer_args __user *user_unmap_args =
		(struct nvgpu_as_unmap_buffer_args __user *)(uintptr_t)
		args->unmaps;
	struct nvgpu_as_map_buffer_ex_args __user *user_map_args =
		(struct nvgpu_as_map_buffer_ex_args __user *)(uintptr_t)
		args->maps;

	struct vm_gk20a_mapping_batch batch;

	nvgpu_log_fn(g, " ");

	if (args->num_unmaps > NVGPU_IOCTL_AS_MAP_BUFFER_BATCH_LIMIT ||
	    args->num_maps > NVGPU_IOCTL_AS_MAP_BUFFER_BATCH_LIMIT)
		return -EINVAL;

	nvgpu_vm_mapping_batch_start(&batch);

	for (i = 0; i < args->num_unmaps; ++i) {
		struct nvgpu_as_unmap_buffer_args unmap_args;

		if (copy_from_user(&unmap_args, &user_unmap_args[i],
				sizeof(unmap_args))) {
			err = -EFAULT;
			break;
		}

		nvgpu_vm_unmap(as_share->vm, unmap_args.offset, &batch);
	}

	nvgpu_speculation_barrier();
	if (err) {
		nvgpu_vm_mapping_batch_finish(as_share->vm, &batch);

		args->num_unmaps = i;
		args->num_maps = 0;
		return err;
	}

	for (i = 0; i < args->num_maps; ++i) {
		s16 compressible_kind;
		s16 incompressible_kind;

		struct nvgpu_as_map_buffer_ex_args map_args;
		memset(&map_args, 0, sizeof(map_args));

		if (copy_from_user(&map_args, &user_map_args[i],
				sizeof(map_args))) {
			err = -EFAULT;
			break;
		}

		if (map_args.flags & NVGPU_AS_MAP_BUFFER_FLAGS_DIRECT_KIND_CTRL) {
			compressible_kind = map_args.compr_kind;
			incompressible_kind = map_args.incompr_kind;
		} else {
			/* direct kind control must be used */
			err = -EINVAL;
			break;
		}

		err = nvgpu_vm_map_buffer(
			as_share->vm, map_args.dmabuf_fd,
			&map_args.offset, map_args.flags, map_args.page_size,
			compressible_kind, incompressible_kind,
			map_args.buffer_offset,
			map_args.mapping_size,
			&batch);
		if (err)
			break;
	}

	nvgpu_vm_mapping_batch_finish(as_share->vm, &batch);

	if (err)
		args->num_maps = i;
	/* note: args->num_unmaps will be unmodified, which is ok
	 * since all unmaps are done */

	return err;
}

static int gk20a_as_ioctl_get_va_regions(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_get_va_regions_args *args)
{
	unsigned int i;
	unsigned int write_entries;
	struct nvgpu_as_va_region __user *user_region_ptr;
	struct vm_gk20a *vm = as_share->vm;
	struct gk20a *g = gk20a_from_vm(vm);
	unsigned int page_sizes = GMMU_PAGE_SIZE_KERNEL;

	nvgpu_log_fn(g, " ");

	if (!vm->big_pages)
		page_sizes--;

	write_entries = args->buf_size / sizeof(struct nvgpu_as_va_region);
	if (write_entries > page_sizes)
		write_entries = page_sizes;

	user_region_ptr =
		(struct nvgpu_as_va_region __user *)(uintptr_t)args->buf_addr;

	for (i = 0; i < write_entries; ++i) {
		struct nvgpu_as_va_region region;
		struct nvgpu_allocator *vma = vm->vma[i];

		memset(&region, 0, sizeof(struct nvgpu_as_va_region));

		region.page_size = vm->gmmu_page_sizes[i];
		region.offset = nvgpu_alloc_base(vma);
		/* No __aeabi_uldivmod() on some platforms... */
		region.pages = (nvgpu_alloc_end(vma) -
			nvgpu_alloc_base(vma)) >> ilog2(region.page_size);

		if (copy_to_user(user_region_ptr + i, &region, sizeof(region)))
			return -EFAULT;
	}

	args->buf_size =
		page_sizes * sizeof(struct nvgpu_as_va_region);

	return 0;
}
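/*
 * Example (userspace sketch, not part of this driver): the handler above
 * always rewrites args->buf_size to the size needed for every VA region, so
 * a caller can probe with buf_size = 0 and then repeat the ioctl with a
 * buffer of the reported size. as_fd is assumed to be an open AS device fd;
 * the helper name is illustrative.
 *
 *	#include <stdint.h>
 *	#include <stdlib.h>
 *	#include <sys/ioctl.h>
 *	#include <linux/nvgpu.h>
 *
 *	static struct nvgpu_as_va_region *query_va_regions(int as_fd,
 *							   unsigned int *count)
 *	{
 *		struct nvgpu_as_get_va_regions_args args = { 0 };
 *		struct nvgpu_as_va_region *regions;
 *
 *		// First call: learn how much space the kernel wants to fill
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_GET_VA_REGIONS, &args) < 0)
 *			return NULL;
 *		regions = malloc(args.buf_size);
 *		if (!regions)
 *			return NULL;
 *		args.buf_addr = (__u64)(uintptr_t)regions;
 *		// Second call: actually copy the regions out
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_GET_VA_REGIONS, &args) < 0) {
 *			free(regions);
 *			return NULL;
 *		}
 *		*count = args.buf_size / sizeof(*regions);
 *		return regions;
 *	}
 */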
static int nvgpu_as_ioctl_get_sync_ro_map(
		struct gk20a_as_share *as_share,
		struct nvgpu_as_get_sync_ro_map_args *args)
{
#ifdef CONFIG_TEGRA_GK20A_NVHOST
	struct vm_gk20a *vm = as_share->vm;
	struct gk20a *g = gk20a_from_vm(vm);
	u64 base_gpuva;
	u32 sync_size;
	int err = 0;

	if (!g->ops.fifo.get_sync_ro_map)
		return -EINVAL;

	if (!nvgpu_has_syncpoints(g))
		return -EINVAL;

	err = g->ops.fifo.get_sync_ro_map(vm, &base_gpuva, &sync_size);
	if (err)
		return err;

	args->base_gpuva = base_gpuva;
	args->sync_size = sync_size;

	return err;
#else
	return -EINVAL;
#endif
}

int gk20a_as_dev_open(struct inode *inode, struct file *filp)
{
	struct nvgpu_os_linux *l;
	struct gk20a_as_share *as_share;
	struct gk20a *g;
	int err;

	l = container_of(inode->i_cdev, struct nvgpu_os_linux, as_dev.cdev);
	g = &l->g;

	nvgpu_log_fn(g, " ");

	err = gk20a_as_alloc_share(g, 0, 0, &as_share);
	if (err) {
		nvgpu_log_fn(g, "failed to alloc share");
		return err;
	}

	filp->private_data = as_share;
	return 0;
}

int gk20a_as_dev_release(struct inode *inode, struct file *filp)
{
	struct gk20a_as_share *as_share = filp->private_data;

	if (!as_share)
		return 0;

	return gk20a_as_release_share(as_share);
}
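/*
 * Example (userspace sketch, not part of this driver): an address-space
 * share is created by opening the AS character device registered behind
 * gk20a_as_dev_open() above, used through the ioctls in this file, and
 * released when the fd is closed. The device node path is platform-dependent;
 * "/dev/nvhost-as-gpu" is assumed here purely for illustration.
 *
 *	#include <fcntl.h>
 *	#include <unistd.h>
 *	#include <sys/ioctl.h>
 *	#include <linux/nvgpu.h>
 *
 *	static int bind_channel_to_new_as(int channel_fd)
 *	{
 *		struct nvgpu_as_bind_channel_args bind = {
 *			.channel_fd = channel_fd,
 *		};
 *		int as_fd = open("/dev/nvhost-as-gpu", O_RDWR);
 *
 *		if (as_fd < 0)
 *			return -1;
 *		// Attach the channel to this address space
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_BIND_CHANNEL, &bind) < 0) {
 *			close(as_fd);
 *			return -1;
 *		}
 *		return as_fd;
 *	}
 */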
/* Access the dmabuf associated with the passed file descriptor, copy the
 * associated pages to an NVMe drive, unpin the associated pages from
 * DMA'able space, and free said pages for use by others.
 * The dmabuf is put in a deallocated state, and any GPU mappings will be
 * invalidated. To restore the dmabuf, see nvgpu_as_ioctl_read_swap_buffer().
 * ...
 * Starts a swap-out operation by flushing the GPU L2 and starting I/O.
 * vm->update_gmmu_lock /must/ already be held.
 */
static int nvgpu_as_ioctl_write_swap_buffer(
		struct dma_buf *dmabuf,
		struct nvgpu_mapped_buf *m,
		struct vm_gk20a *vm,
		struct gk20a *g)
{
	int err = 0;

	nvgpu_log_fn(g, " ");

	// Disable an annoying custom out-of-tree "feature" of dma_buf which
	// defers unmapping
	if (dma_buf_disable_lazy_unmapping(dev_from_vm(vm))) {
		err = -ENOTRECOVERABLE;
		goto out;
	}

	// TODO: Verify that we'll likely be able to free the pages later,
	// before we start the copy.

	// Flush dirty GPU L2 cache lines to DRAM
	// (assuming NVMe accesses to DRAM are uncached)
	gk20a_mm_l2_flush(g, false);

	// Copy out (non-blocking)
	// Could fail on an inaccessible swap device, etc.
	err = copy_out(m->os_priv.sgt, m);

out:
	return err;
}

/* Finish a swap-out operation by waiting on I/O to complete, then unpinning
 * and freeing the pages.
 *
 * Note that this may fail even if nvgpu_as_ioctl_write_swap_buffer()
 * succeeded if the user mmaps the buffer before finishing the swap-out.
 *
 * vm->update_gmmu_lock /must/ already be held.
 */
static int nvgpu_as_ioctl_write_swap_buffer_finish(
		struct dma_buf *dmabuf,
		struct nvgpu_mapped_buf *m,
		struct vm_gk20a *vm,
		struct gk20a *g)
{
	struct sg_table *sgt;
	int err = 0;

	nvgpu_log_fn(g, " ");

	// Wait for the pages to get written out
	wait_for_completion_io(&m->os_priv.swap_io_done);

	// Unpin needs to happen after copy out is done
	// (No return value check as it's a void function)
	gk20a_mm_unpin(dev_from_vm(vm), m->os_priv.dmabuf,
		m->os_priv.attachment, m->os_priv.sgt);

	// Deallocate dmabuf's backing pages
	// TODO: Fail early for these cases (where the dmabuf is mmapped, etc),
	// before we do all the above (expensive) steps
	err = nvmap_dealloc_dmabuf(dmabuf);
	if (err) {
		// Repin
		sgt = gk20a_mm_pin(dev_from_vm(vm), m->os_priv.dmabuf,
			&m->os_priv.attachment);
		m->os_priv.sgt = sgt;
	}

	return err;
}

/* Starts a swap-in operation by allocating and pinning backing pages, and
 * starting I/O.
 * vm->update_gmmu_lock /must/ already be held.
 */
static int nvgpu_as_ioctl_read_swap_buffer(
		struct dma_buf *dmabuf,
		struct nvgpu_mapped_buf *m,
		struct vm_gk20a *vm,
		struct gk20a *g)
{
	struct sg_table *sgt;
	int err = 0;

	nvgpu_log_fn(g, " ");

	// Reallocate space for this buffer
	err = nvmap_realloc_dmabuf(dmabuf);
	if (err)
		goto out; // Out of memory (?)

	// Repin the buffer to DMA'able memory
	sgt = gk20a_mm_pin(dev_from_vm(vm), m->os_priv.dmabuf,
		&m->os_priv.attachment);
	if (IS_ERR(sgt)) {
		// Rollback allocation
		err = nvmap_dealloc_dmabuf(dmabuf);
		if (err)
			printk(KERN_ERR "nvgpu: Error %d while rolling back dmabuf allocation state on error in gk20a_mm_pin()! Consider dmabuf '%s' to be in an inconsistent state!\n", err, dmabuf->exp_name);
		err = PTR_ERR(sgt);
		goto out;
	}

	// Do any bookkeeping not done by gk20a_mm_pin()
	m->os_priv.sgt = sgt;

	// Reload page contents from disk (non-blocking)
	err = copy_in(sgt, m);
	if (err) {
		int err2;
		// Rollback pinning and allocation
		gk20a_mm_unpin(dev_from_vm(vm), m->os_priv.dmabuf,
			m->os_priv.attachment, m->os_priv.sgt);
		err2 = nvmap_dealloc_dmabuf(dmabuf);
		if (err2)
			printk(KERN_ERR "nvgpu: Error %d while rolling back dmabuf allocation state on error in copy_in()! Consider dmabuf '%s' to be in an inconsistent state!\n", err2, dmabuf->exp_name);
		// Inaccessible swap device, etc.
		goto out;
	}

out:
	return err;
}

/* Finish a swap-in operation by mapping the pages and waiting on I/O to
 * complete.
 */
static int nvgpu_as_ioctl_read_swap_buffer_finish(
		struct dma_buf *dmabuf,
		struct nvgpu_mapped_buf *m,
		struct vm_gk20a *vm,
		struct gk20a *g)
{
	int err = 0;

	nvgpu_log_fn(g, " ");

	// Update GPU page tables (PT) to point to the new allocation
	nvgpu_vm_remap(m);
	// Due to the PT update, the translation lookaside buffer needs clearing
	g->ops.fb.tlb_invalidate(g, vm->pdb.mem);
	// Invalidate L2 so that a TLB refill does not load stale PT entries
	gk20a_mm_l2_flush(g, true);

	// Wait for the read to complete if it hasn't yet
	wait_for_completion_io(&m->os_priv.swap_io_done);

	return err;
}
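/*
 * Example (userspace sketch, not part of this driver): the four helpers
 * above form a start/finish protocol so the NVMe I/O can overlap other work.
 * One plausible way to drive them through the _ASYNC ioctls dispatched below
 * is shown here; as_fd and buf_fd are assumed to be an open AS device fd and
 * the dmabuf fd of an already-mapped buffer that the GPU is not currently
 * using, and the helper name is illustrative.
 *
 *	#include <sys/ioctl.h>
 *	#include <linux/nvgpu.h>
 *
 *	static int swap_out_then_in(int as_fd, int buf_fd)
 *	{
 *		struct nvgpu_as_swap_buffer_args args = { .dmabuf_fd = buf_fd };
 *
 *		// Start writing the buffer out (flushes L2, queues NVMe I/O)
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC, &args))
 *			return -1;
 *		// ... do unrelated work while the I/O is in flight ...
 *		// Wait for the I/O, then unpin and free the backing pages
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC_FINISH, &args))
 *			return -1;
 *
 *		// Later: bring the buffer back before the GPU touches it again
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC, &args))
 *			return -1;
 *		return ioctl(as_fd, NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC_FINISH, &args);
 *	}
 */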
#define NVGPU_SWAP_ALL -1

/* All swap functions require some common boilerplate. This function serves as
 * a common entrypoint for all swap functions by handling that boilerplate,
 * which includes input validation and locking for all of them.
 *
 * @param cmd IOCTL command code
 */
static int nvgpu_as_dev_ioctl_swap(
		unsigned int cmd,
		struct gk20a_as_share *as_share,
		struct nvgpu_as_swap_buffer_args *args)
{
	struct vm_gk20a *vm = as_share->vm;
	struct gk20a *g = gk20a_from_vm(vm);
	struct nvgpu_mapped_buf *m;
	struct dma_buf *dmabuf;
	int err;

	// Other code walking vm->mapped_buffers grabs this lock
	// Note that we don't really need to do this before getting the dmabuf,
	// but we do for now to limit code complexity.
	nvgpu_mutex_acquire(&vm->update_gmmu_lock);

	// Grab dmabuf and mapped_buf (if necessary) depending on op type
	if (args->dmabuf_fd != NVGPU_SWAP_ALL) {
		// If not swapping out everything, get dmabuf, then mapped_buf
		dmabuf = dma_buf_get(args->dmabuf_fd);
		if (IS_ERR(dmabuf)) {
			err = PTR_ERR(dmabuf);
			goto out_unlock;
		}
		// Get mapped buffer corresponding to this dmabuf
		m = dmabuf_to_mapped_buf(dmabuf);
		// If failed search
		if (IS_ERR(m)) {
			// No mapped dmabuf associated with FD
			err = -EBADFD;
			goto out_put_unlock;
		}
	} else {
		// When swapping everything, we get buffers by walking the
		// mapped_buf rbtree and then use those to get the dmabuf.
		// TODO
		//dmabuf = mapped_buf_to_dmabuf(m);
		err = -EBADFD; // Not yet supported
		goto out_unlock;
	}

	// Run appropriate command
	// XXX: Validate that buffer state is valid for the requested command.
	switch (cmd) {
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER:
		// Just a combo of the _ASYNC versions. Saves the caller a lock,
		// some lookups, and an extra syscall. Partially kept for
		// legacy reasons.
		err = nvgpu_as_ioctl_read_swap_buffer(dmabuf, m, vm, g);
		if (err)
			goto out_put_unlock;
		err = nvgpu_as_ioctl_read_swap_buffer_finish(dmabuf, m, vm, g);
		break;
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC:
		err = nvgpu_as_ioctl_read_swap_buffer(dmabuf, m, vm, g);
		break;
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC_FINISH:
		err = nvgpu_as_ioctl_read_swap_buffer_finish(dmabuf, m, vm, g);
		break;
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER:
		// See comment on NVGPU_AS_IOCTL_READ_SWAP_BUFFER above
		err = nvgpu_as_ioctl_write_swap_buffer(dmabuf, m, vm, g);
		if (err)
			goto out_put_unlock;
		err = nvgpu_as_ioctl_write_swap_buffer_finish(dmabuf, m, vm, g);
		break;
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC:
		err = nvgpu_as_ioctl_write_swap_buffer(dmabuf, m, vm, g);
		break;
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC_FINISH:
		err = nvgpu_as_ioctl_write_swap_buffer_finish(dmabuf, m, vm, g);
		break;
	default:
		err = -ENOTTY;
		break;
	}

out_put_unlock:
	// Done with the dmabuf, so release our reference to it
	dma_buf_put(dmabuf);
out_unlock:
	nvgpu_mutex_release(&vm->update_gmmu_lock);
	return err;
}
long gk20a_as_dev_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
{
	int err = 0;
	struct gk20a_as_share *as_share = filp->private_data;
	struct gk20a *g = gk20a_from_as(as_share->as);

	u8 buf[NVGPU_AS_IOCTL_MAX_ARG_SIZE];

	nvgpu_log_fn(g, "start %d", _IOC_NR(cmd));

	if ((_IOC_TYPE(cmd) != NVGPU_AS_IOCTL_MAGIC) ||
	    (_IOC_NR(cmd) == 0) ||
	    (_IOC_NR(cmd) > NVGPU_AS_IOCTL_LAST) ||
	    (_IOC_SIZE(cmd) > NVGPU_AS_IOCTL_MAX_ARG_SIZE))
		return -EINVAL;

	memset(buf, 0, sizeof(buf));
	if (_IOC_DIR(cmd) & _IOC_WRITE) {
		if (copy_from_user(buf, (void __user *)arg, _IOC_SIZE(cmd)))
			return -EFAULT;
	}

	err = gk20a_busy(g);
	if (err)
		return err;

	nvgpu_speculation_barrier();
	switch (cmd) {
	case NVGPU_AS_IOCTL_BIND_CHANNEL:
		trace_gk20a_as_ioctl_bind_channel(g->name);
		err = gk20a_as_ioctl_bind_channel(as_share,
				(struct nvgpu_as_bind_channel_args *)buf);
		break;
	case NVGPU32_AS_IOCTL_ALLOC_SPACE:
	{
		struct nvgpu32_as_alloc_space_args *args32 =
			(struct nvgpu32_as_alloc_space_args *)buf;
		struct nvgpu_as_alloc_space_args args;

		args.pages = args32->pages;
		args.page_size = args32->page_size;
		args.flags = args32->flags;
		args.o_a.offset = args32->o_a.offset;

		trace_gk20a_as_ioctl_alloc_space(g->name);
		err = gk20a_as_ioctl_alloc_space(as_share, &args);
		args32->o_a.offset = args.o_a.offset;
		break;
	}
	case NVGPU_AS_IOCTL_ALLOC_SPACE:
		trace_gk20a_as_ioctl_alloc_space(g->name);
		err = gk20a_as_ioctl_alloc_space(as_share,
				(struct nvgpu_as_alloc_space_args *)buf);
		break;
	case NVGPU_AS_IOCTL_FREE_SPACE:
		trace_gk20a_as_ioctl_free_space(g->name);
		err = gk20a_as_ioctl_free_space(as_share,
				(struct nvgpu_as_free_space_args *)buf);
		break;
	case NVGPU_AS_IOCTL_MAP_BUFFER_EX:
		trace_gk20a_as_ioctl_map_buffer(g->name);
		err = gk20a_as_ioctl_map_buffer_ex(as_share,
				(struct nvgpu_as_map_buffer_ex_args *)buf);
		break;
	case NVGPU_AS_IOCTL_UNMAP_BUFFER:
		trace_gk20a_as_ioctl_unmap_buffer(g->name);
		err = gk20a_as_ioctl_unmap_buffer(as_share,
				(struct nvgpu_as_unmap_buffer_args *)buf);
		break;
	case NVGPU_AS_IOCTL_GET_VA_REGIONS:
		trace_gk20a_as_ioctl_get_va_regions(g->name);
		err = gk20a_as_ioctl_get_va_regions(as_share,
				(struct nvgpu_as_get_va_regions_args *)buf);
		break;
	case NVGPU_AS_IOCTL_MAP_BUFFER_BATCH:
		err = gk20a_as_ioctl_map_buffer_batch(as_share,
				(struct nvgpu_as_map_buffer_batch_args *)buf);
		break;
	case NVGPU_AS_IOCTL_GET_SYNC_RO_MAP:
		err = nvgpu_as_ioctl_get_sync_ro_map(as_share,
				(struct nvgpu_as_get_sync_ro_map_args *)buf);
		break;
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER:
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC:
	case NVGPU_AS_IOCTL_READ_SWAP_BUFFER_ASYNC_FINISH:
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER:
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC:
	case NVGPU_AS_IOCTL_WRITE_SWAP_BUFFER_ASYNC_FINISH:
		err = nvgpu_as_dev_ioctl_swap(cmd, as_share,
				(struct nvgpu_as_swap_buffer_args *)buf);
		break;
	default:
		err = -ENOTTY;
		break;
	}

	gk20a_idle(g);

	if ((err == 0) && (_IOC_DIR(cmd) & _IOC_READ))
		if (copy_to_user((void __user *)arg, buf, _IOC_SIZE(cmd)))
			err = -EFAULT;

	return err;
}
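/*
 * Example (userspace sketch, not part of this driver): gk20a_as_dev_ioctl()
 * copies the argument struct in when the command has the _IOC_WRITE direction
 * and copies it back out on success when it has _IOC_READ, so in/out fields
 * such as the allocated offset come back in the struct the caller passed.
 * as_fd is assumed to be an open AS device fd; the helper name is
 * illustrative.
 *
 *	#include <sys/ioctl.h>
 *	#include <linux/nvgpu.h>
 *
 *	static int alloc_gpu_va(int as_fd, __u32 pages, __u32 page_size,
 *				__u64 *gpu_va)
 *	{
 *		struct nvgpu_as_alloc_space_args args = {
 *			.pages = pages,
 *			.page_size = page_size,
 *			.flags = 0,	// not fixed-offset, not sparse
 *		};
 *
 *		if (ioctl(as_fd, NVGPU_AS_IOCTL_ALLOC_SPACE, &args) < 0)
 *			return -1;
 *		*gpu_va = args.o_a.offset;	// filled in by the kernel
 *		return 0;
 *	}
 */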