diff options
author | Alex Waterman <alexw@nvidia.com> | 2017-10-05 20:22:41 -0400 |
---|---|---|
committer | mobile promotions <svcmobile_promotions@nvidia.com> | 2017-10-20 22:03:57 -0400 |
commit | e26ce10cc6b59314ccf5931a8c5b46a9e57b085a (patch) | |
tree | 2bcafc57fcb8679c09195ba08ccf7a6fdfc91fe1 /drivers/gpu/nvgpu/gk20a/mm_gk20a.h | |
parent | 8c5ea40ccaad022401e45e61d5b6ff3354ffa413 (diff) |
gpu: nvgpu: Convert VIDMEM work_struct to thread
Convert the work_struct used by the vidmem background clearing to
a thread to make it more cross-platform. The thread waits on a
condition variable to determine when work needs to be done. The
signal comes from the DMA API when it enqueues a new nvgpu_mem that
needs clearing.
Add logic for handling suspend: the CE cannot be accessed while
the GPU is suspended. As such the background thread must be paused
while the GPU is suspended and the CE is not available.
Several other changes were also made:
o Move the code that enqueues an nvgpu_mem from the DMA API
code to a function in the VIDMEM code.
o Move nvgpu_vidmem_get_pending_alloc() to the Linux specific
code as this function is only used there. It's a trivial
function that QNX can easily implement as well.
o Remove the was_empty logic from the enqueue. Now just always
signal the condition variable when a new nvgpu_mem comes in.
o Move CE suspend to after MM suspend.
JIRA NVGPU-30
JIRA NVGPU-138
Change-Id: Ie9286ae5a127c3fced86dfb9794e7d81eab0491c
Signed-off-by: Alex Waterman <alexw@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1574498
Reviewed-by: Automatic_Commit_Validation_User
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Diffstat (limited to 'drivers/gpu/nvgpu/gk20a/mm_gk20a.h')
-rw-r--r-- | drivers/gpu/nvgpu/gk20a/mm_gk20a.h | 8 |
1 files changed, 7 insertions, 1 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h index 556cb234..13698cd7 100644 --- a/drivers/gpu/nvgpu/gk20a/mm_gk20a.h +++ b/drivers/gpu/nvgpu/gk20a/mm_gk20a.h | |||
@@ -36,6 +36,8 @@ | |||
36 | #include <nvgpu/rbtree.h> | 36 | #include <nvgpu/rbtree.h> |
37 | #include <nvgpu/kref.h> | 37 | #include <nvgpu/kref.h> |
38 | #include <nvgpu/atomic.h> | 38 | #include <nvgpu/atomic.h> |
39 | #include <nvgpu/cond.h> | ||
40 | #include <nvgpu/thread.h> | ||
39 | 41 | ||
40 | struct nvgpu_pd_cache; | 42 | struct nvgpu_pd_cache; |
41 | 43 | ||
@@ -272,7 +274,11 @@ struct mm_gk20a { | |||
272 | struct nvgpu_list_node clear_list_head; | 274 | struct nvgpu_list_node clear_list_head; |
273 | struct nvgpu_mutex clear_list_mutex; | 275 | struct nvgpu_mutex clear_list_mutex; |
274 | 276 | ||
275 | struct work_struct clear_mem_worker; | 277 | struct nvgpu_cond clearing_thread_cond; |
278 | struct nvgpu_thread clearing_thread; | ||
279 | struct nvgpu_mutex clearing_thread_lock; | ||
280 | nvgpu_atomic_t pause_count; | ||
281 | |||
276 | nvgpu_atomic64_t bytes_pending; | 282 | nvgpu_atomic64_t bytes_pending; |
277 | } vidmem; | 283 | } vidmem; |
278 | }; | 284 | }; |