/* * Copyright (c) 2011-2015, NVIDIA CORPORATION. All rights reserved. * * This program is free software; you can redistribute it and/or modify it * under the terms and conditions of the GNU General Public License, * version 2, as published by the Free Software Foundation. * * This program is distributed in the hope it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for * more details. * * You should have received a copy of the GNU General Public License * along with this program. If not, see . */ #ifndef GK20A_ALLOCATOR_H #define GK20A_ALLOCATOR_H #include #include #include #include /* #define ALLOCATOR_DEBUG */ /* * Each buddy is an element in a binary tree. */ struct gk20a_buddy { struct gk20a_buddy *parent; /* Parent node. */ struct gk20a_buddy *buddy; /* This node's buddy. */ struct gk20a_buddy *left; /* Lower address sub-node. */ struct gk20a_buddy *right; /* Higher address sub-node. */ struct list_head buddy_entry; /* List entry for various lists. */ struct rb_node alloced_entry; /* RB tree of allocations. */ u64 start; /* Start address of this buddy. */ u64 end; /* End address of this buddy. */ u64 order; /* Buddy order. */ #define BALLOC_BUDDY_ALLOCED 0x1 #define BALLOC_BUDDY_SPLIT 0x2 #define BALLOC_BUDDY_IN_LIST 0x4 int flags; /* List of associated flags. */ /* * Size of the PDE this buddy is using. This allows for grouping like * sized allocations into the same PDE. */ #define BALLOC_PTE_SIZE_ANY 0x0 #define BALLOC_PTE_SIZE_SMALL 0x1 #define BALLOC_PTE_SIZE_BIG 0x2 int pte_size; }; #define __buddy_flag_ops(flag, flag_up) \ static inline int buddy_is_ ## flag(struct gk20a_buddy *b) \ { \ return b->flags & BALLOC_BUDDY_ ## flag_up; \ } \ static inline void buddy_set_ ## flag(struct gk20a_buddy *b) \ { \ b->flags |= BALLOC_BUDDY_ ## flag_up; \ } \ static inline void buddy_clr_ ## flag(struct gk20a_buddy *b) \ { \ b->flags &= ~BALLOC_BUDDY_ ## flag_up; \ } /* * int buddy_is_alloced(struct gk20a_buddy *b); * void buddy_set_alloced(struct gk20a_buddy *b); * void buddy_clr_alloced(struct gk20a_buddy *b); * * int buddy_is_split(struct gk20a_buddy *b); * void buddy_set_split(struct gk20a_buddy *b); * void buddy_clr_split(struct gk20a_buddy *b); * * int buddy_is_in_list(struct gk20a_buddy *b); * void buddy_set_in_list(struct gk20a_buddy *b); * void buddy_clr_in_list(struct gk20a_buddy *b); */ __buddy_flag_ops(alloced, ALLOCED); __buddy_flag_ops(split, SPLIT); __buddy_flag_ops(in_list, IN_LIST); /* * Keeps info for a fixed allocation. */ struct gk20a_fixed_alloc { struct list_head buddies; /* List of buddies. */ struct rb_node alloced_entry; /* RB tree of fixed allocations. */ u64 start; /* Start of fixed block. */ u64 end; /* End address. */ }; struct vm_gk20a; /* * GPU buddy allocator for the various GPU address spaces. Each addressable unit * doesn't have to correspond to a byte. In some cases each unit is a more * complex object such as a comp_tag line or the like. * * The max order is computed based on the size of the minimum order and the size * of the address space. * * order_size is the size of an order 0 buddy. */ struct gk20a_allocator { struct vm_gk20a *vm; /* Parent VM - can be NULL. */ char name[32]; /* Name of allocator. */ u64 base; /* Base address of the space. */ u64 length; /* Length of the space. */ u64 blk_size; /* Size of order 0 allocation. */ u64 blk_shift; /* Shift to divide by blk_size. */ int init; /* Non-zero if initialized. */ /* Internal stuff. */ u64 start; /* Real start (aligned to blk_size). */ u64 end; /* Real end, trimmed if needed. */ u64 count; /* Count of objects in space. */ u64 blks; /* Count of blks in the space. */ u64 max_order; /* Specific maximum order. */ struct rb_root alloced_buddies; /* Outstanding allocations. */ struct rb_root fixed_allocs; /* Outstanding fixed allocations. */ struct mutex lock; /* Protects buddy access. */ #define GPU_BALLOC_GVA_SPACE 0x1 u64 flags; /* * Impose an upper bound on the maximum order. */ #define GPU_BALLOC_MAX_ORDER 31 #define GPU_BALLOC_ORDER_LIST_LEN (GPU_BALLOC_MAX_ORDER + 1) struct list_head buddy_list[GPU_BALLOC_ORDER_LIST_LEN]; u64 buddy_list_len[GPU_BALLOC_ORDER_LIST_LEN]; u64 buddy_list_split[GPU_BALLOC_ORDER_LIST_LEN]; u64 buddy_list_alloced[GPU_BALLOC_ORDER_LIST_LEN]; /* * This is for when the allocator is managing a GVA space (the * GPU_BALLOC_GVA_SPACE bit is set in @flags). This requires * that we group like sized allocations into PDE blocks. */ u64 pte_blk_order; struct dentry *debugfs_entry; u64 bytes_alloced; u64 bytes_alloced_real; u64 bytes_freed; }; #define balloc_lock(a) mutex_lock(&(a)->lock) #define balloc_unlock(a) mutex_unlock(&(a)->lock) #define balloc_get_order_list(a, order) (&(a)->buddy_list[(order)]) #define balloc_order_to_len(a, order) ((1 << order) * (a)->blk_size) #define balloc_base_shift(a, base) ((base) - (a)->start) #define balloc_base_unshift(a, base) ((base) + (a)->start) int gk20a_allocator_init(struct gk20a_allocator *allocator, const char *name, u64 base, u64 size, u64 order0); int __gk20a_allocator_init(struct gk20a_allocator *allocator, struct vm_gk20a *vm, const char *name, u64 base, u64 size, u64 order0, u64 max_order, u64 flags); void gk20a_allocator_destroy(struct gk20a_allocator *allocator); /* * Normal alloc/free operations for the buddy allocator. */ u64 gk20a_balloc(struct gk20a_allocator *allocator, u64 len); void gk20a_bfree(struct gk20a_allocator *allocator, u64 addr); /* * Special interface to allocate a memory regions with a specific starting * address. Yikes. */ u64 gk20a_balloc_fixed(struct gk20a_allocator *allocator, u64 base, u64 len); /* * Debugfs init. */ void gk20a_alloc_debugfs_init(struct platform_device *pdev); #if defined(ALLOCATOR_DEBUG) #define balloc_dbg(alloctor, format, arg...) \ pr_info("%-25s %25s() " format, \ alloctor->name, __func__, ##arg) #else #define balloc_dbg(allocator, format, arg...) #endif #endif /* GK20A_ALLOCATOR_H */