diff options
author | Konsta Holtta <kholtta@nvidia.com> | 2018-03-22 09:47:43 -0400 |
---|---|---|
committer | mobile promotions <svcmobile_promotions@nvidia.com> | 2018-03-28 15:13:07 -0400 |
commit | d20a501dcbf2e29d5d319670485f273afa3aefad (patch) | |
tree | 22d3443589f0cf3186ef2c4096d0f82569b5401b /drivers/gpu/nvgpu/gk20a | |
parent | 9b70ad24934988141c585d9fd85c59f5c9d58a38 (diff) |
gpu: nvgpu: simplify job semaphore release in abort
Instead of looping over all jobs and releasing their semaphores separately,
do just one semaphore release. All the jobs are using the same sema
index, and the final, maximum value of it is known.
Also move this resetting into ch->sync->set_min_eq_max() to be
consistent with syncpoints.
Change-Id: I03601aae67db0a65750c8df6b43387c042d383bd
Signed-off-by: Konsta Holtta <kholtta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1680362
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Alex Waterman <alexw@nvidia.com>
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
Diffstat (limited to 'drivers/gpu/nvgpu/gk20a')
-rw-r--r-- | drivers/gpu/nvgpu/gk20a/channel_gk20a.c | 44 | ||||
-rw-r--r-- | drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c | 13 |
2 files changed, 12 insertions, 45 deletions
diff --git a/drivers/gpu/nvgpu/gk20a/channel_gk20a.c b/drivers/gpu/nvgpu/gk20a/channel_gk20a.c index 5befe086..8b144864 100644 --- a/drivers/gpu/nvgpu/gk20a/channel_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/channel_gk20a.c | |||
@@ -185,10 +185,6 @@ int gk20a_disable_channel_tsg(struct gk20a *g, struct channel_gk20a *ch) | |||
185 | 185 | ||
186 | void gk20a_channel_abort_clean_up(struct channel_gk20a *ch) | 186 | void gk20a_channel_abort_clean_up(struct channel_gk20a *ch) |
187 | { | 187 | { |
188 | struct channel_gk20a_job *job, *n; | ||
189 | bool released_job_semaphore = false; | ||
190 | bool pre_alloc_enabled = channel_gk20a_is_prealloc_enabled(ch); | ||
191 | |||
192 | /* synchronize with actual job cleanup */ | 188 | /* synchronize with actual job cleanup */ |
193 | nvgpu_mutex_acquire(&ch->joblist.cleanup_lock); | 189 | nvgpu_mutex_acquire(&ch->joblist.cleanup_lock); |
194 | 190 | ||
@@ -200,48 +196,8 @@ void gk20a_channel_abort_clean_up(struct channel_gk20a *ch) | |||
200 | ch->user_sync->set_safe_state(ch->user_sync); | 196 | ch->user_sync->set_safe_state(ch->user_sync); |
201 | nvgpu_mutex_release(&ch->sync_lock); | 197 | nvgpu_mutex_release(&ch->sync_lock); |
202 | 198 | ||
203 | /* release all job semaphores (applies only to jobs that use | ||
204 | semaphore synchronization) */ | ||
205 | channel_gk20a_joblist_lock(ch); | ||
206 | if (pre_alloc_enabled) { | ||
207 | int tmp_get = ch->joblist.pre_alloc.get; | ||
208 | int put = ch->joblist.pre_alloc.put; | ||
209 | |||
210 | /* | ||
211 | * ensure put is read before any subsequent reads. | ||
212 | * see corresponding nvgpu_smp_wmb in gk20a_channel_add_job() | ||
213 | */ | ||
214 | nvgpu_smp_rmb(); | ||
215 | |||
216 | while (tmp_get != put) { | ||
217 | job = &ch->joblist.pre_alloc.jobs[tmp_get]; | ||
218 | if (job->post_fence->semaphore) { | ||
219 | nvgpu_semaphore_reset( | ||
220 | job->post_fence->semaphore, | ||
221 | ch->hw_sema); | ||
222 | released_job_semaphore = true; | ||
223 | } | ||
224 | tmp_get = (tmp_get + 1) % ch->joblist.pre_alloc.length; | ||
225 | } | ||
226 | } else { | ||
227 | nvgpu_list_for_each_entry_safe(job, n, | ||
228 | &ch->joblist.dynamic.jobs, | ||
229 | channel_gk20a_job, list) { | ||
230 | if (job->post_fence->semaphore) { | ||
231 | nvgpu_semaphore_reset( | ||
232 | job->post_fence->semaphore, | ||
233 | ch->hw_sema); | ||
234 | released_job_semaphore = true; | ||
235 | } | ||
236 | } | ||
237 | } | ||
238 | channel_gk20a_joblist_unlock(ch); | ||
239 | |||
240 | nvgpu_mutex_release(&ch->joblist.cleanup_lock); | 199 | nvgpu_mutex_release(&ch->joblist.cleanup_lock); |
241 | 200 | ||
242 | if (released_job_semaphore) | ||
243 | nvgpu_cond_broadcast_interruptible(&ch->semaphore_wq); | ||
244 | |||
245 | /* | 201 | /* |
246 | * When closing the channel, this scheduled update holds one ref which | 202 | * When closing the channel, this scheduled update holds one ref which |
247 | * is waited for before advancing with freeing. | 203 | * is waited for before advancing with freeing. |
diff --git a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c index d87b8661..bf467210 100644 --- a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c +++ b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c | |||
@@ -646,7 +646,18 @@ static int gk20a_channel_semaphore_incr_user( | |||
646 | 646 | ||
647 | static void gk20a_channel_semaphore_set_min_eq_max(struct gk20a_channel_sync *s) | 647 | static void gk20a_channel_semaphore_set_min_eq_max(struct gk20a_channel_sync *s) |
648 | { | 648 | { |
649 | /* Nothing to do. */ | 649 | struct gk20a_channel_semaphore *sp = |
650 | container_of(s, struct gk20a_channel_semaphore, ops); | ||
651 | struct channel_gk20a *c = sp->c; | ||
652 | bool updated; | ||
653 | |||
654 | if (!c->hw_sema) | ||
655 | return; | ||
656 | |||
657 | updated = nvgpu_semaphore_reset(c->hw_sema); | ||
658 | |||
659 | if (updated) | ||
660 | nvgpu_cond_broadcast_interruptible(&c->semaphore_wq); | ||
650 | } | 661 | } |
651 | 662 | ||
652 | static void gk20a_channel_semaphore_set_safe_state(struct gk20a_channel_sync *s) | 663 | static void gk20a_channel_semaphore_set_safe_state(struct gk20a_channel_sync *s) |