/*
* Copyright (c) 2016 - 2017, NVIDIA CORPORATION. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person obtaining a
* copy of this software and associated documentation files (the "Software"),
* to deal in the Software without restriction, including without limitation
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
* and/or sell copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
* DEALINGS IN THE SOFTWARE.
*/
/*
* Basics:
*
* - Lockless memory allocator for fixed-size structures, whose
* size is defined up front at init time.
* - Memory footprint scales linearly w/ the number of structures in
* the pool. It is ~= sizeof(int) * N.
* - Memory is pre-allocated by the client. The allocator itself
* only computes the addresses for allocations.
* - Limit of MAX_INT nodes that the allocator can be responsible for.
*
* Implementation details:
*
* The allocator maintains a single list of free nodes. We allocate &
* free nodes from the head of the list. We rely on the cmpxchg() operator
* to maintain atomicity on the head.
*
* So, both allocs & frees are O(1)!!
*
* -- Definitions --
* Block Size - size of a single structure that this allocator will
* allocate.
* Node - one of the elements of size blk_size in the
* client-allocated buffer.
* Node Index - zero-based index of a node in the client-allocated
* contiguous buffer.
*
* -- Initial State --
* We maintain the following to track the state of the free list:
*
* 1) A "head" index to track the index of the first free node in the list
* 2) A "next" array to track the index of the next free node in the list
* for every node. So next[head], will give the index to the 2nd free
* element in the list.
*
* So, to begin with, the free list consists of all node indices, and each
* position in the next array contains index N + 1:
*
* head = 0
* next = [1, 2, 3, 4, -1] : Example for a user-allocated buffer of 5 nodes
* free_list = 0->1->2->3->4->-1
*
* -- Allocations --
* 1) Read the current head (aka acq_head)
* 2) Read next[acq_head], to get the 2nd free element (aka new_head)
* 3) cmp_xchg(&head, acq_head, new_head)
* 4) If it succeeds, compute the address of the node, based on
* base address, blk_size, & acq_head.
*
* head = 1;
* next = [1, 2, 3, 4, -1] : Example after allocating Node #0
* free_list = 1->2->3->4->-1
*
* head = 2;
* next = [1, 2, 3, 4, -1] : Example after allocating Node #1
* free_list = 2->3->4->-1
*
* -- Frees --
* 1) Based on the address to be freed, calculate the index of the node
* being freed (cur_idx)
* 2) Read the current head (old_head)
* 3) So the freed node is going to go at the head of the list, and we
* want to put the old_head after it. So next[cur_idx] = old_head
* 4) cmpxchg(head, old_head, cur_idx)
*
* head = 0
* next = [2, 2, 3, 4, -1]
* free_list = 0->2->3->4->-1 : Example after freeing Node #0
*
* head = 1
* next = [2, 0, 3, 4, -1]
* free_list = 1->0->2->3->4->-1 : Example after freeing Node #1
*/
#ifndef LOCKLESS_ALLOCATOR_PRIV_H
#define LOCKLESS_ALLOCATOR_PRIV_H
struct nvgpu_allocator;
struct nvgpu_lockless_allocator {
struct nvgpu_allocator *owner;
u64 base; /* Base address of the space. */
u64 length; /* Length of the space. */
u64 blk_size; /* Size of the structure being allocated */
int nr_nodes; /* Number of nodes available for allocation */
int *next; /* An array holding the next indices per node */
int head; /* Current node at the top of the stack */
u64 flags;
bool inited;
/* Statistics */
nvgpu_atomic_t nr_allocs;
};
static inline struct nvgpu_lockless_allocator *lockless_allocator(
struct nvgpu_allocator *a)
{
return (struct nvgpu_lockless_allocator *)(a)->priv;
}
#endif