gpu: nvgpu: Move allocators to common/mm/

Move the GPU allocators to common/mm/ since the allocators are common code across all GPUs. Also rename the allocator code to move away from gk20a_ prefixed structs and functions. This caused one issue with the nvgpu_alloc() and nvgpu_free() functions. There was a function for allocating either with kmalloc() or vmalloc() depending on the size of the allocation. Those have now been renamed to nvgpu_kalloc() and nvgpu_kfree(). Bug 1799159 Change-Id: Iddda92c013612bcb209847084ec85b8953002fa5 Signed-off-by: Alex Waterman <alexw@nvidia.com> Reviewed-on: http://git-master/r/1274400 Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com> Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
author: Alex Waterman <alexw@nvidia.com> 2016-12-20 16:55:48 -0500
committer: mobile promotions <svcmobile_promotions@nvidia.com> 2017-01-09 15:33:16 -0500
commit: 6df3992b60959d32c7113cb77e131a2547174f3a (patch)
tree: efbdc9e6ccd2330d5c469ca0783ecb0137da8fc4 /drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h
parent: e229514bece5a109cdbfe263f6329efe987e5939 (diff)
1 files changed, 121 insertions, 0 deletions
diff --git a/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h b/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h
new file mode 100644
index 00000000..32421ac1
--- /dev/null
+++ b/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h
@@ -0,0 +1,121 @@
+/*
+ * Copyright (c) 2016, NVIDIA CORPORATION.  All rights reserved.
+ *
+ * This program is free software; you can redistribute it and/or modify it
+ * under the terms and conditions of the GNU General Public License,
+ * version 2, as published by the Free Software Foundation.
+ *
+ * This program is distributed in the hope it will be useful, but WITHOUT
+ * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
+ * more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+/*
+ * Basics:
+ *
+ *    - Lockless memory allocator for fixed-size structures, whose
+ *      size is defined up front at init time.
+ *    - Memory footprint scales linearly w/ the number of structures in
+ *      the pool. It is ~= sizeof(int) * N.
+ *    - Memory is pre-allocated by the client. The allocator itself
+ *      only computes the addresses for allocations.
+ *    - Limit of MAX_INT nodes that the allocator can be responsible for.
+ *
+ * Implementation details:
+ *
+ *    The allocator maintains a single list of free nodes. We allocate &
+ *    free nodes from the head of the list. We rely on the cmpxchg() operator
+ *    to maintain atomicity on the head.
+ *
+ *    So, both allocs & frees are O(1)!!
+ *
+ *    -- Definitions --
+ *    Block Size - size of a single structure that this allocator will
+ *                 allocate.
+ *    Node       - one of the elements of size blk_size in the
+ *                 client-allocated buffer.
+ *    Node Index - zero-based index of a node in the client-allocated
+ *                 contiguous buffer.
+ *
+ *    -- Initial State --
+ *    We maintain the following to track the state of the free list:
+ *
+ *    1) A "head" index to track the index of the first free node in the list
+ *    2) A "next" array to track the index of the next free node in the list
+ *       for every node. So next[head], will give the index to the 2nd free
+ *       element in the list.
+ *
+ *    So, to begin with, the free list consists of all node indices, and each
+ *    position in the next array contains index N + 1:
+ *
+ *    head = 0
+ *    next = [1, 2, 3, 4, -1] : Example for a user-allocated buffer of 5 nodes
+ *    free_list = 0->1->2->3->4->-1
+ *
+ *    -- Allocations --
+ *    1) Read the current head (aka acq_head)
+ *    2) Read next[acq_head], to get the 2nd free element (aka new_head)
+ *    3) cmp_xchg(&head, acq_head, new_head)
+ *    4) If it succeeds, compute the address of the node, based on
+ *       base address, blk_size, & acq_head.
+ *
+ *    head = 1;
+ *    next = [1, 2, 3, 4, -1] : Example after allocating Node #0
+ *    free_list = 1->2->3->4->-1
+ *
+ *    head = 2;
+ *    next = [1, 2, 3, 4, -1] : Example after allocating Node #1
+ *    free_list = 2->3->4->-1
+ *
+ *    -- Frees --
+ *    1) Based on the address to be freed, calculate the index of the node
+ *       being freed (cur_idx)
+ *    2) Read the current head (old_head)
+ *    3) So the freed node is going to go at the head of the list, and we
+ *       want to put the old_head after it. So next[cur_idx] = old_head
+ *    4) cmpxchg(head, old_head, cur_idx)
+ *
+ *    head = 0
+ *    next = [2, 2, 3, 4, -1]
+ *    free_list = 0->2->3->4->-1 : Example after freeing Node #0
+ *
+ *    head = 1
+ *    next = [2, 0, 3, 4, -1]
+ *    free_list = 1->0->2->3->4->-1 : Example after freeing Node #1
+ */
+#ifndef LOCKLESS_ALLOCATOR_PRIV_H
+#define LOCKLESS_ALLOCATOR_PRIV_H
+struct nvgpu_allocator;
+struct nvgpu_lockless_allocator {
+        struct nvgpu_allocator *owner;
+        u64 base;               /* Base address of the space. */
+        u64 length;             /* Length of the space. */
+        u64 blk_size;           /* Size of the structure being allocated */
+        int nr_nodes;           /* Number of nodes available for allocation */
+        int *next;              /* An array holding the next indices per node */
+        int head;               /* Current node at the top of the stack */
+        u64 flags;
+        bool inited;
+        /* Statistics */
+        atomic_t nr_allocs;
+};
+static inline struct nvgpu_lockless_allocator *lockless_allocator(
+        struct nvgpu_allocator *a)
+{
+        return (struct nvgpu_lockless_allocator *)(a)->priv;
+}
+#endif
author	Alex Waterman <alexw@nvidia.com>	2016-12-20 16:55:48 -0500
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2017-01-09 15:33:16 -0500
commit	6df3992b60959d32c7113cb77e131a2547174f3a (patch)
tree	efbdc9e6ccd2330d5c469ca0783ecb0137da8fc4 /drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h
parent	e229514bece5a109cdbfe263f6329efe987e5939 (diff)

diff --git a/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h b/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h new file mode 100644 index 00000000..32421ac1 --- /dev/null +++ b/drivers/gpu/nvgpu/common/mm/lockless_allocator_priv.h
@@ -0,0 +1,121 @@
	1	/*
	2	* Copyright (c) 2016, NVIDIA CORPORATION. All rights reserved.
	3	*
	4	* This program is free software; you can redistribute it and/or modify it
	5	* under the terms and conditions of the GNU General Public License,
	6	* version 2, as published by the Free Software Foundation.
	7	*
	8	* This program is distributed in the hope it will be useful, but WITHOUT
	9	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	10	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
	11	* more details.
	12	*
	13	* You should have received a copy of the GNU General Public License
	14	* along with this program. If not, see <http://www.gnu.org/licenses/>.
	15	*/
	16
	17	/*
	18	* Basics:
	19	*
	20	* - Lockless memory allocator for fixed-size structures, whose
	21	* size is defined up front at init time.
	22	* - Memory footprint scales linearly w/ the number of structures in
	23	* the pool. It is ~= sizeof(int) * N.
	24	* - Memory is pre-allocated by the client. The allocator itself
	25	* only computes the addresses for allocations.
	26	* - Limit of MAX_INT nodes that the allocator can be responsible for.
	27	*
	28	* Implementation details:
	29	*
	30	* The allocator maintains a single list of free nodes. We allocate &
	31	* free nodes from the head of the list. We rely on the cmpxchg() operator
	32	* to maintain atomicity on the head.
	33	*
	34	* So, both allocs & frees are O(1)!!
	35	*
	36	* -- Definitions --
	37	* Block Size - size of a single structure that this allocator will
	38	* allocate.
	39	* Node - one of the elements of size blk_size in the
	40	* client-allocated buffer.
	41	* Node Index - zero-based index of a node in the client-allocated
	42	* contiguous buffer.
	43	*
	44	* -- Initial State --
	45	* We maintain the following to track the state of the free list:
	46	*
	47	* 1) A "head" index to track the index of the first free node in the list
	48	* 2) A "next" array to track the index of the next free node in the list
	49	* for every node. So next[head], will give the index to the 2nd free
	50	* element in the list.
	51	*
	52	* So, to begin with, the free list consists of all node indices, and each
	53	* position in the next array contains index N + 1:
	54	*
	55	* head = 0
	56	* next = [1, 2, 3, 4, -1] : Example for a user-allocated buffer of 5 nodes
	57	* free_list = 0->1->2->3->4->-1
	58	*
	59	* -- Allocations --
	60	* 1) Read the current head (aka acq_head)
	61	* 2) Read next[acq_head], to get the 2nd free element (aka new_head)
	62	* 3) cmp_xchg(&head, acq_head, new_head)
	63	* 4) If it succeeds, compute the address of the node, based on
	64	* base address, blk_size, & acq_head.
	65	*
	66	* head = 1;
	67	* next = [1, 2, 3, 4, -1] : Example after allocating Node #0
	68	* free_list = 1->2->3->4->-1
	69	*
	70	* head = 2;
	71	* next = [1, 2, 3, 4, -1] : Example after allocating Node #1
	72	* free_list = 2->3->4->-1
	73	*
	74	* -- Frees --
	75	* 1) Based on the address to be freed, calculate the index of the node
	76	* being freed (cur_idx)
	77	* 2) Read the current head (old_head)
	78	* 3) So the freed node is going to go at the head of the list, and we
	79	* want to put the old_head after it. So next[cur_idx] = old_head
	80	* 4) cmpxchg(head, old_head, cur_idx)
	81	*
	82	* head = 0
	83	* next = [2, 2, 3, 4, -1]
	84	* free_list = 0->2->3->4->-1 : Example after freeing Node #0
	85	*
	86	* head = 1
	87	* next = [2, 0, 3, 4, -1]
	88	* free_list = 1->0->2->3->4->-1 : Example after freeing Node #1
	89	*/
	90
	91	#ifndef LOCKLESS_ALLOCATOR_PRIV_H
	92	#define LOCKLESS_ALLOCATOR_PRIV_H
	93
	94	struct nvgpu_allocator;
	95
	96	struct nvgpu_lockless_allocator {
	97	struct nvgpu_allocator *owner;
	98
	99	u64 base; /* Base address of the space. */
	100	u64 length; /* Length of the space. */
	101	u64 blk_size; /* Size of the structure being allocated */
	102	int nr_nodes; /* Number of nodes available for allocation */
	103
	104	int next; / An array holding the next indices per node */
	105	int head; /* Current node at the top of the stack */
	106
	107	u64 flags;
	108
	109	bool inited;
	110
	111	/* Statistics */
	112	atomic_t nr_allocs;
	113	};
	114
	115	static inline struct nvgpu_lockless_allocator *lockless_allocator(
	116	struct nvgpu_allocator *a)
	117	{
	118	return (struct nvgpu_lockless_allocator *)(a)->priv;
	119	}
	120
	121	#endif