path: root/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
author    Konsta Holtta <kholtta@nvidia.com>    2018-03-16 12:10:33 -0400
committer mobile promotions <svcmobile_promotions@nvidia.com>    2018-03-16 20:11:03 -0400
commit    69252b3fb629d9534e7a9c4e3b75d3462653f00d (patch)
tree      3297d9f0a4c26b01dd018d2e132dc1c872e3c831 /drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
parent    703c1ea59638151846690e02d098cad83b7d6a78 (diff)
gpu: nvgpu: remove support for foreign sema syncfds
Delete the proxy waiter for non-semaphore-backed syncfds in the sema wait path. This simplifies the code, removes dependencies on the sync framework (and thus on Linux), and supports upcoming refactorings. The feature has never actually been used for foreign fences.

Jira NVGPU-43
Jira NVGPU-66

Change-Id: I2b539aefd2d096a7bf5f40e61d48de7a9b3dccae
Signed-off-by: Konsta Holtta <kholtta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1665119
Reviewed-by: svc-mobile-coverity <svc-mobile-coverity@nvidia.com>
Reviewed-by: Alex Waterman <alexw@nvidia.com>
GVS: Gerrit_Virtual_Submit
Reviewed-by: Terje Bergstrom <tbergstrom@nvidia.com>
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
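For orientation: after this change the sema wait path no longer falls back to a proxy waiter, and gk20a_channel_semaphore_wait_fd() simply forwards to the native semaphore-backed wait. A minimal sketch of the resulting function follows, reconstructed from the hunks below; the exact parameter list and the return value in the !CONFIG_SYNC branch are assumptions, since this diff does not show them in full.

/*
 * Sketch only (not verbatim driver source): the wait-fd path once the
 * proxy waiter is removed. The parameter types and the -ENODEV return
 * in the !CONFIG_SYNC branch are assumed; they are not visible in the
 * hunks below.
 */
static int gk20a_channel_semaphore_wait_fd(
                struct gk20a_channel_sync *s, int fd,
                struct priv_cmd_entry *entry, struct gk20a_fence *fence)
{
        struct gk20a_channel_semaphore *sema =
                container_of(s, struct gk20a_channel_semaphore, ops);
        struct channel_gk20a *c = sema->c;
#ifdef CONFIG_SYNC
        /* Only semaphore-backed syncfds are handled now; no proxy wait. */
        return semaphore_wait_fd_native(c, fd, entry);
#else
        nvgpu_err(c->g,
                "trying to use sync fds with CONFIG_SYNC disabled");
        return -ENODEV;
#endif
}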
Diffstat (limited to 'drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c')
-rw-r--r--  drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c  223
1 file changed, 1 insertion(+), 222 deletions(-)
diff --git a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
index e896eb88..20460c80 100644
--- a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
@@ -379,127 +379,6 @@ struct gk20a_channel_semaphore {
         struct sync_timeline *timeline;
 };
 
-#ifdef CONFIG_SYNC
-struct wait_fence_work {
-        struct sync_fence_waiter waiter;
-        struct sync_fence *fence;
-        struct channel_gk20a *ch;
-        struct nvgpu_semaphore *sema;
-        struct gk20a *g;
-        struct nvgpu_list_node entry;
-};
-
-static inline struct wait_fence_work *
-wait_fence_work_from_entry(struct nvgpu_list_node *node)
-{
-        return (struct wait_fence_work *)
-                ((uintptr_t)node - offsetof(struct wait_fence_work, entry));
-};
-
-/*
- * Keep track of all the pending waits on semaphores that exist for a GPU. This
- * has to be done because the waits on fences backed by semaphores are
- * asynchronous so it's impossible to otherwise know when they will fire. During
- * driver cleanup this list can be checked and all existing waits can be
- * canceled.
- */
-static void gk20a_add_pending_sema_wait(struct gk20a *g,
-                struct wait_fence_work *work)
-{
-        nvgpu_raw_spinlock_acquire(&g->pending_sema_waits_lock);
-        nvgpu_list_add(&work->entry, &g->pending_sema_waits);
-        nvgpu_raw_spinlock_release(&g->pending_sema_waits_lock);
-}
-
-/*
- * Copy the list head from the pending wait list to the passed list and
- * then delete the entire pending list.
- */
-static void gk20a_start_sema_wait_cancel(struct gk20a *g,
-                struct nvgpu_list_node *list)
-{
-        nvgpu_raw_spinlock_acquire(&g->pending_sema_waits_lock);
-        nvgpu_list_replace_init(&g->pending_sema_waits, list);
-        nvgpu_raw_spinlock_release(&g->pending_sema_waits_lock);
-}
-
-/*
- * During shutdown this should be called to make sure that any pending sema
- * waits are canceled. This is a fairly delicate and tricky bit of code. Here's
- * how it works.
- *
- * Every time a semaphore wait is initiated in SW the wait_fence_work struct is
- * added to the pending_sema_waits list. When the semaphore launcher code runs
- * it checks the pending_sema_waits list. If this list is non-empty that means
- * that the wait_fence_work struct must be present and can be removed.
- *
- * When the driver shuts down one of the steps is to cancel pending sema waits.
- * To do this the entire list of pending sema waits is removed (and stored in a
- * separate local list). So now, if the semaphore launcher code runs it will see
- * that the pending_sema_waits list is empty and knows that it no longer owns
- * the wait_fence_work struct.
- */
-void gk20a_channel_cancel_pending_sema_waits(struct gk20a *g)
-{
-        struct wait_fence_work *work;
-        struct nvgpu_list_node local_pending_sema_waits;
-
-        gk20a_start_sema_wait_cancel(g, &local_pending_sema_waits);
-
-        while (!nvgpu_list_empty(&local_pending_sema_waits)) {
-                int ret;
-
-                work = nvgpu_list_first_entry(&local_pending_sema_waits,
-                                              wait_fence_work,
-                                              entry);
-
-                nvgpu_list_del(&work->entry);
-
-                /*
-                 * Only nvgpu_kfree() work if the cancel is successful.
-                 * Otherwise it's in use by the
-                 * gk20a_channel_semaphore_launcher() code.
-                 */
-                ret = sync_fence_cancel_async(work->fence, &work->waiter);
-                if (ret == 0)
-                        nvgpu_kfree(g, work);
-        }
-}
-
-static void gk20a_channel_semaphore_launcher(
-                struct sync_fence *fence,
-                struct sync_fence_waiter *waiter)
-{
-        int err;
-        struct wait_fence_work *w =
-                container_of(waiter, struct wait_fence_work, waiter);
-        struct gk20a *g = w->g;
-
-        /*
-         * This spinlock must protect a _very_ small critical section -
-         * otherwise it's possible that the deterministic submit path suffers.
-         */
-        nvgpu_raw_spinlock_acquire(&g->pending_sema_waits_lock);
-        if (!nvgpu_list_empty(&g->pending_sema_waits))
-                nvgpu_list_del(&w->entry);
-        nvgpu_raw_spinlock_release(&g->pending_sema_waits_lock);
-
-        gk20a_dbg_info("waiting for pre fence %p '%s'",
-                        fence, fence->name);
-        err = sync_fence_wait(fence, -1);
-        if (err < 0)
-                nvgpu_err(g, "error waiting pre-fence: %d", err);
-
-        gk20a_dbg_info(
-                "wait completed (%d) for fence %p '%s', triggering gpu work",
-                err, fence, fence->name);
-        sync_fence_put(fence);
-        nvgpu_semaphore_release(w->sema, w->ch->hw_sema);
-        nvgpu_semaphore_put(w->sema);
-        nvgpu_kfree(g, w);
-}
-#endif
-
 static void add_sema_cmd(struct gk20a *g, struct channel_gk20a *c,
                 struct nvgpu_semaphore *s, struct priv_cmd_entry *cmd,
                 u32 offset, bool acquire, bool wfi)
@@ -638,102 +517,6 @@ put_fence:
         sync_fence_put(sync_fence);
         return err;
 }
-
-static int semaphore_wait_fd_proxy(struct channel_gk20a *c, int fd,
-                struct priv_cmd_entry *wait_cmd,
-                struct gk20a_fence *fence_out,
-                struct sync_timeline *timeline)
-{
-        const int wait_cmd_size = 8;
-        struct sync_fence *sync_fence;
-        struct wait_fence_work *w = NULL;
-        int err, status;
-
-        sync_fence = sync_fence_fdget(fd);
-        if (!sync_fence)
-                return -EINVAL;
-
-        /* If the fence has signaled there is no reason to wait on it. */
-        status = atomic_read(&sync_fence->status);
-        if (status == 0) {
-                sync_fence_put(sync_fence);
-                return 0;
-        }
-
-        err = gk20a_channel_alloc_priv_cmdbuf(c, wait_cmd_size, wait_cmd);
-        if (err) {
-                nvgpu_err(c->g,
-                                "not enough priv cmd buffer space");
-                goto clean_up_sync_fence;
-        }
-
-        w = nvgpu_kzalloc(c->g, sizeof(*w));
-        if (!w) {
-                err = -ENOMEM;
-                goto clean_up_priv_cmd;
-        }
-
-        sync_fence_waiter_init(&w->waiter, gk20a_channel_semaphore_launcher);
-        w->fence = sync_fence;
-        w->g = c->g;
-        w->ch = c;
-        w->sema = nvgpu_semaphore_alloc(c);
-        if (!w->sema) {
-                nvgpu_err(c->g, "ran out of semaphores");
-                err = -ENOMEM;
-                goto clean_up_worker;
-        }
-
-        /* worker takes one reference */
-        nvgpu_semaphore_get(w->sema);
-        nvgpu_semaphore_incr(w->sema, c->hw_sema);
-
-        /* GPU unblocked when the semaphore value increments. */
-        add_sema_cmd(c->g, c, w->sema, wait_cmd, 0, true, false);
-
-        /*
-         * We need to create the fence before adding the waiter to ensure
-         * that we properly clean up in the event the sync_fence has
-         * already signaled
-         */
-        err = gk20a_fence_from_semaphore(c->g, fence_out, timeline,
-                        w->sema, &c->semaphore_wq, false);
-        if (err)
-                goto clean_up_sema;
-
-        err = sync_fence_wait_async(sync_fence, &w->waiter);
-        gk20a_add_pending_sema_wait(c->g, w);
-
-        /*
-         * If the sync_fence has already signaled then the above wait_async
-         * will not get scheduled; the fence completed just after doing the
-         * status check above before allocs and waiter init, and won the race.
-         * This causes the waiter to be skipped, so let's release the semaphore
-         * here and put the refs taken for the worker.
-         */
-        if (err == 1) {
-                sync_fence_put(sync_fence);
-                nvgpu_semaphore_release(w->sema, c->hw_sema);
-                nvgpu_semaphore_put(w->sema);
-        }
-
-        return 0;
-
-clean_up_sema:
-        /*
-         * Release the refs to the semaphore, including
-         * the one for the worker since it will never run.
-         */
-        nvgpu_semaphore_put(w->sema);
-        nvgpu_semaphore_put(w->sema);
-clean_up_worker:
-        nvgpu_kfree(c->g, w);
-clean_up_priv_cmd:
-        gk20a_free_priv_cmdbuf(c, wait_cmd);
-clean_up_sync_fence:
-        sync_fence_put(sync_fence);
-        return err;
-}
 #endif
 
 static int gk20a_channel_semaphore_wait_fd(
@@ -745,12 +528,8 @@ static int gk20a_channel_semaphore_wait_fd(
                 container_of(s, struct gk20a_channel_semaphore, ops);
         struct channel_gk20a *c = sema->c;
 #ifdef CONFIG_SYNC
-        int err;
 
-        err = semaphore_wait_fd_native(c, fd, entry);
-        if (err)
-                err = semaphore_wait_fd_proxy(c, fd, entry, fence, sema->timeline);
-        return err;
+        return semaphore_wait_fd_native(c, fd, entry);
 #else
         nvgpu_err(c->g,
                 "trying to use sync fds with CONFIG_SYNC disabled");