/*
 * Copyright (c) 2016-2017, NVIDIA CORPORATION.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

/* Headers assumed from the symbols used below. */
#include <nvgpu/atomic.h>
#include <nvgpu/allocator.h>
#include <nvgpu/kmem.h>
#include <nvgpu/barrier.h>

#include "lockless_allocator_priv.h"

static u64 nvgpu_lockless_alloc_length(struct nvgpu_allocator *a)
{
	struct nvgpu_lockless_allocator *pa = a->priv;

	return pa->length;
}

static u64 nvgpu_lockless_alloc_base(struct nvgpu_allocator *a)
{
	struct nvgpu_lockless_allocator *pa = a->priv;

	return pa->base;
}

static int nvgpu_lockless_alloc_inited(struct nvgpu_allocator *a)
{
	struct nvgpu_lockless_allocator *pa = a->priv;
	int inited = pa->inited;

	nvgpu_smp_rmb();
	return inited;
}

static u64 nvgpu_lockless_alloc_end(struct nvgpu_allocator *a)
{
	struct nvgpu_lockless_allocator *pa = a->priv;

	return pa->base + pa->length;
}

static u64 nvgpu_lockless_alloc(struct nvgpu_allocator *a, u64 len)
{
	struct nvgpu_lockless_allocator *pa = a->priv;
	int head, new_head, ret;
	u64 addr = 0;

	/* Only fixed-size blocks can be handed out. */
	if (len != pa->blk_size)
		return 0;

	/*
	 * Pop the head of the free list with cmpxchg(); retry if another
	 * thread changed the head underneath us.
	 */
	head = NV_ACCESS_ONCE(pa->head);
	while (head >= 0) {
		new_head = NV_ACCESS_ONCE(pa->next[head]);
		ret = cmpxchg(&pa->head, head, new_head);
		if (ret == head) {
			addr = pa->base + head * pa->blk_size;
			nvgpu_atomic_inc(&pa->nr_allocs);
			break;
		}
		head = NV_ACCESS_ONCE(pa->head);
	}

	if (addr)
		alloc_dbg(a, "Alloc node # %d @ addr 0x%llx\n", head, addr);
	else
		alloc_dbg(a, "Alloc failed!\n");

	return addr;
}

static void nvgpu_lockless_free(struct nvgpu_allocator *a, u64 addr)
{
	struct nvgpu_lockless_allocator *pa = a->priv;
	int head, ret;
	u64 cur_idx;

	cur_idx = (addr - pa->base) / pa->blk_size;

	alloc_dbg(a, "Free node # %llu @ addr 0x%llx\n", cur_idx, addr);

	/* Push the node back onto the free list with cmpxchg(); retry on races. */
	while (1) {
		head = NV_ACCESS_ONCE(pa->head);
		NV_ACCESS_ONCE(pa->next[cur_idx]) = head;
		ret = cmpxchg(&pa->head, head, cur_idx);
		if (ret == head) {
			nvgpu_atomic_dec(&pa->nr_allocs);
			alloc_dbg(a, "Free node # %llu\n", cur_idx);
			break;
		}
	}
}

static void nvgpu_lockless_alloc_destroy(struct nvgpu_allocator *a)
{
	struct nvgpu_lockless_allocator *pa = a->priv;

#ifdef CONFIG_DEBUG_FS
	nvgpu_fini_alloc_debug(a);
#endif

	nvgpu_vfree(a->g, pa->next);
	nvgpu_kfree(nvgpu_alloc_to_gpu(a), pa);
}

#ifdef __KERNEL__
static void nvgpu_lockless_print_stats(struct nvgpu_allocator *a,
				       struct seq_file *s, int lock)
{
	struct nvgpu_lockless_allocator *pa = a->priv;

	__alloc_pstat(s, a, "Lockless allocator params:\n");
	__alloc_pstat(s, a, "  start = 0x%llx\n", pa->base);
	__alloc_pstat(s, a, "  end   = 0x%llx\n", pa->base + pa->length);

	/* Actual stats. */
	__alloc_pstat(s, a, "Stats:\n");
	__alloc_pstat(s, a, "  Number allocs = %d\n",
		      nvgpu_atomic_read(&pa->nr_allocs));
	__alloc_pstat(s, a, "  Number free   = %d\n",
		      pa->nr_nodes - nvgpu_atomic_read(&pa->nr_allocs));
}
#endif

static const struct nvgpu_allocator_ops pool_ops = {
	.alloc		= nvgpu_lockless_alloc,
	.free		= nvgpu_lockless_free,

	.base		= nvgpu_lockless_alloc_base,
	.length		= nvgpu_lockless_alloc_length,
	.end		= nvgpu_lockless_alloc_end,
	.inited		= nvgpu_lockless_alloc_inited,

	.fini		= nvgpu_lockless_alloc_destroy,

#ifdef __KERNEL__
	.print_stats	= nvgpu_lockless_print_stats,
#endif
};

int nvgpu_lockless_allocator_init(struct gk20a *g, struct nvgpu_allocator *__a,
				  const char *name, u64 base, u64 length,
				  u64 blk_size, u64 flags)
{
	int i;
	int err;
	int nr_nodes;
	u64 count;
	struct nvgpu_lockless_allocator *a;

	if (!blk_size)
		return -EINVAL;

	/*
	 * Ensure we have space for at least one node & there's no overflow.
	 * In order to control memory footprint, we require count < INT_MAX.
	 */
	count = length / blk_size;
	if (!base || !count || count > INT_MAX)
		return -EINVAL;

	a = nvgpu_kzalloc(g, sizeof(struct nvgpu_lockless_allocator));
	if (!a)
		return -ENOMEM;

	err = __nvgpu_alloc_common_init(__a, g, name, a, false, &pool_ops);
	if (err)
		goto fail;

	a->next = nvgpu_vzalloc(g, sizeof(*a->next) * count);
	if (!a->next) {
		err = -ENOMEM;
		goto fail;
	}

	/* Chain the elements together to form the initial free list. */
	nr_nodes = (int)count;
	for (i = 0; i < nr_nodes; i++)
		a->next[i] = i + 1;
	a->next[nr_nodes - 1] = -1;

	a->base = base;
	a->length = length;
	a->blk_size = blk_size;
	a->nr_nodes = nr_nodes;
	a->flags = flags;
	nvgpu_atomic_set(&a->nr_allocs, 0);

	/* Publish the free list before marking the allocator initialized. */
	nvgpu_smp_wmb();
	a->inited = true;

#ifdef CONFIG_DEBUG_FS
	nvgpu_init_alloc_debug(g, __a);
#endif
	alloc_dbg(__a, "New allocator: type      lockless\n");
	alloc_dbg(__a, "               base      0x%llx\n", a->base);
	alloc_dbg(__a, "               nodes     %d\n", a->nr_nodes);
	alloc_dbg(__a, "               blk_size  0x%llx\n", a->blk_size);
	alloc_dbg(__a, "               flags     0x%llx\n", a->flags);

	return 0;

fail:
	nvgpu_kfree(g, a);
	return err;
}
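
/*
 * Example usage (illustrative sketch, not part of this file's build): carve
 * a pool of 256 fixed-size 4 KiB blocks out of a caller-provided address
 * range.  The nvgpu_alloc()/nvgpu_free()/nvgpu_alloc_destroy() wrappers are
 * assumed to dispatch through pool_ops above; "g" and "base" are assumed to
 * be supplied by the caller.
 *
 *	struct nvgpu_allocator va_pool;
 *	u64 blk;
 *	int err;
 *
 *	err = nvgpu_lockless_allocator_init(g, &va_pool, "va_pool",
 *					    base, 256 * SZ_4K, SZ_4K, 0);
 *	if (err)
 *		return err;
 *
 *	blk = nvgpu_alloc(&va_pool, SZ_4K);	<- len must equal blk_size
 *	if (!blk) {
 *		nvgpu_alloc_destroy(&va_pool);
 *		return -ENOMEM;
 *	}
 *
 *	... use the block, then return it and tear the pool down ...
 *
 *	nvgpu_free(&va_pool, blk);
 *	nvgpu_alloc_destroy(&va_pool);
 */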