path: root/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
author	Debarshi Dutta <ddutta@nvidia.com>	2018-04-23 07:56:51 -0400
committer	mobile promotions <svcmobile_promotions@nvidia.com>	2018-05-10 11:40:11 -0400
commit	70e69e2686527990865b221a60e0ec1e9a53d316 (patch)
tree	623d0c2612162227370f7b6eb5388fc5b0e11326 /drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
parent	4dfd6e43cfe303c8b23421ef32738db2ee52e291 (diff)
gpu: nvgpu: adapt gk20a_channel_syncpt to use os_fence
This patch adapts gk20a_channel_syncpt to use os_fence for the post-fence as well as the pre-fence (wait) use cases.

Jira NVGPU-66

Change-Id: I49627d1f88d52a53511a02f5de60fed6df8350de
Signed-off-by: Debarshi Dutta <ddutta@nvidia.com>
Reviewed-on: https://git-master.nvidia.com/r/1676631
Reviewed-by: mobile promotions <svcmobile_promotions@nvidia.com>
Tested-by: mobile promotions <svcmobile_promotions@nvidia.com>
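The os_fence layer adopted here hides the Linux sync-framework details behind an OS-agnostic vtable. A minimal sketch of that interface, inferred purely from the call sites in this diff (member names and signatures are assumptions, not the actual nvgpu os_fence header):

	/*
	 * Hedged sketch of the nvgpu_os_fence interface as this diff uses it.
	 * Fields and signatures are reconstructed from the call sites below.
	 */
	struct nvgpu_os_fence;

	struct nvgpu_os_fence_ops {
		/* Program one syncpoint wait per point backing the fence. */
		int (*program_waits)(struct nvgpu_os_fence *s,
				struct priv_cmd_entry *wait_cmd,
				struct channel_gk20a *c, int max_wait_cmds);
		/* Drop the reference taken by fdget()/create(). */
		void (*drop_ref)(struct nvgpu_os_fence *s);
	};

	struct nvgpu_os_fence {
		void *priv; /* underlying OS object, e.g. struct sync_fence */
		const struct nvgpu_os_fence_ops *ops; /* NULL until initialized */
	};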
Diffstat (limited to 'drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c')
-rw-r--r--	drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c	| 148
1 file changed, 53 insertions(+), 95 deletions(-)
diff --git a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
index a0b0ac1e..16898593 100644
--- a/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
+++ b/drivers/gpu/nvgpu/gk20a/channel_sync_gk20a.c
@@ -51,6 +51,39 @@ struct gk20a_channel_syncpt {
 	struct nvgpu_mem syncpt_buf;
 };
 
+int gk20a_channel_gen_syncpt_wait_cmd(struct channel_gk20a *c,
+	u32 id, u32 thresh, struct priv_cmd_entry *wait_cmd,
+	u32 wait_cmd_size, int pos, bool preallocated)
+{
+	int err = 0;
+	bool is_expired = nvgpu_nvhost_syncpt_is_expired_ext(
+		c->g->nvhost_dev, id, thresh);
+
+	if (is_expired) {
+		if (preallocated) {
+			nvgpu_memset(c->g, wait_cmd->mem,
+			(wait_cmd->off + pos * wait_cmd_size) * sizeof(u32),
+				0, wait_cmd_size * sizeof(u32));
+		}
+	} else {
+		if (!preallocated) {
+			err = gk20a_channel_alloc_priv_cmdbuf(c,
+				c->g->ops.fifo.get_syncpt_wait_cmd_size(), wait_cmd);
+			if (err) {
+				nvgpu_err(c->g, "not enough priv cmd buffer space");
+				return err;
+			}
+		}
+		nvgpu_log(c->g, gpu_dbg_info, "sp->id %d gpu va %llx",
+			id, c->vm->syncpt_ro_map_gpu_va);
+		c->g->ops.fifo.add_syncpt_wait_cmd(c->g, wait_cmd,
+			pos * wait_cmd_size, id, thresh,
+			c->vm->syncpt_ro_map_gpu_va);
+	}
+
+	return 0;
+}
+
 static int gk20a_channel_syncpt_wait_syncpt(struct gk20a_channel_sync *s,
 	u32 id, u32 thresh, struct priv_cmd_entry *wait_cmd)
 {
@@ -58,108 +91,36 @@ static int gk20a_channel_syncpt_wait_syncpt(struct gk20a_channel_sync *s,
 		container_of(s, struct gk20a_channel_syncpt, ops);
 	struct channel_gk20a *c = sp->c;
 	int err = 0;
+	u32 wait_cmd_size = c->g->ops.fifo.get_syncpt_wait_cmd_size();
 
 	if (!nvgpu_nvhost_syncpt_is_valid_pt_ext(sp->nvhost_dev, id))
 		return -EINVAL;
 
-	if (nvgpu_nvhost_syncpt_is_expired_ext(sp->nvhost_dev, id, thresh))
-		return 0;
-
-	err = gk20a_channel_alloc_priv_cmdbuf(c,
-			c->g->ops.fifo.get_syncpt_wait_cmd_size(), wait_cmd);
-	if (err) {
-		nvgpu_err(c->g,
-				"not enough priv cmd buffer space");
-		return err;
-	}
-
-	nvgpu_log(c->g, gpu_dbg_info, "sp->id %d gpu va %llx",
-			id, sp->c->vm->syncpt_ro_map_gpu_va);
-	c->g->ops.fifo.add_syncpt_wait_cmd(c->g, wait_cmd, 0, id,
-			thresh, c->vm->syncpt_ro_map_gpu_va);
-
-	return 0;
+	err = gk20a_channel_gen_syncpt_wait_cmd(c, id, thresh,
+			wait_cmd, wait_cmd_size, 0, false);
+
+	return err;
 }
 
 static int gk20a_channel_syncpt_wait_fd(struct gk20a_channel_sync *s, int fd,
 		struct priv_cmd_entry *wait_cmd, int max_wait_cmds)
 {
-#ifdef CONFIG_SYNC
-	int i;
-	int num_wait_cmds;
-	struct sync_fence *sync_fence;
-	struct sync_pt *pt;
+	struct nvgpu_os_fence os_fence = {0};
 	struct gk20a_channel_syncpt *sp =
 		container_of(s, struct gk20a_channel_syncpt, ops);
 	struct channel_gk20a *c = sp->c;
-	u32 wait_id;
 	int err = 0;
-	u32 wait_cmd_size = 0;
-
-	sync_fence = nvgpu_nvhost_sync_fdget(fd);
-	if (!sync_fence)
-		return -EINVAL;
 
-	if (max_wait_cmds && sync_fence->num_fences > max_wait_cmds) {
-		sync_fence_put(sync_fence);
-		return -EINVAL;
-	}
-
-	/* validate syncpt ids */
-	for (i = 0; i < sync_fence->num_fences; i++) {
-		pt = sync_pt_from_fence(sync_fence->cbs[i].sync_pt);
-		wait_id = nvgpu_nvhost_sync_pt_id(pt);
-		if (!wait_id || !nvgpu_nvhost_syncpt_is_valid_pt_ext(
-					sp->nvhost_dev, wait_id)) {
-			sync_fence_put(sync_fence);
-			return -EINVAL;
-		}
-	}
+	err = nvgpu_os_fence_fdget(&os_fence, c, fd);
+	if (err)
+		return -EINVAL;
 
-	num_wait_cmds = nvgpu_nvhost_sync_num_pts(sync_fence);
-	if (num_wait_cmds == 0) {
-		sync_fence_put(sync_fence);
-		return 0;
-	}
-	wait_cmd_size = c->g->ops.fifo.get_syncpt_wait_cmd_size();
-	err = gk20a_channel_alloc_priv_cmdbuf(c,
-		wait_cmd_size * num_wait_cmds,
-		wait_cmd);
-	if (err) {
-		nvgpu_err(c->g,
-				"not enough priv cmd buffer space");
-		sync_fence_put(sync_fence);
-		return err;
-	}
-
-	i = 0;
-	for (i = 0; i < sync_fence->num_fences; i++) {
-		struct fence *f = sync_fence->cbs[i].sync_pt;
-		struct sync_pt *pt = sync_pt_from_fence(f);
-		u32 wait_id = nvgpu_nvhost_sync_pt_id(pt);
-		u32 wait_value = nvgpu_nvhost_sync_pt_thresh(pt);
-
-		if (nvgpu_nvhost_syncpt_is_expired_ext(sp->nvhost_dev,
-				wait_id, wait_value)) {
-			nvgpu_memset(c->g, wait_cmd->mem,
-			(wait_cmd->off + i * wait_cmd_size) * sizeof(u32),
-				0, wait_cmd_size * sizeof(u32));
-		} else {
-			nvgpu_log(c->g, gpu_dbg_info, "sp->id %d gpu va %llx",
-					wait_id, sp->syncpt_buf.gpu_va);
-			c->g->ops.fifo.add_syncpt_wait_cmd(c->g, wait_cmd,
-				i * wait_cmd_size, wait_id, wait_value,
-				c->vm->syncpt_ro_map_gpu_va);
-		}
-	}
-
-	WARN_ON(i != num_wait_cmds);
-	sync_fence_put(sync_fence);
+	err = os_fence.ops->program_waits(&os_fence,
+		wait_cmd, c, max_wait_cmds);
 
-	return 0;
-#else
-	return -ENODEV;
-#endif
+	os_fence.ops->drop_ref(&os_fence);
+
+	return err;
 }
 
 static void gk20a_channel_syncpt_update(void *priv, int nr_completed)
@@ -185,6 +146,7 @@ static int __gk20a_channel_syncpt_incr(struct gk20a_channel_sync *s,
 		container_of(s, struct gk20a_channel_syncpt, ops);
 	struct channel_gk20a *c = sp->c;
 	struct sync_fence *sync_fence = NULL;
+	struct nvgpu_os_fence os_fence = {0};
 
 	err = gk20a_channel_alloc_priv_cmdbuf(c,
 			c->g->ops.fifo.get_syncpt_incr_cmd_size(wfi_cmd),
@@ -226,26 +188,22 @@ static int __gk20a_channel_syncpt_incr(struct gk20a_channel_sync *s,
 		}
 	}
 
-#ifdef CONFIG_SYNC
 	if (need_sync_fence) {
-		sync_fence = nvgpu_nvhost_sync_create_fence(sp->nvhost_dev,
-			sp->id, thresh, "fence");
+		err = nvgpu_os_fence_syncpt_create(&os_fence, c, sp->nvhost_dev,
+			sp->id, thresh);
 
-		if (IS_ERR(sync_fence)) {
-			err = PTR_ERR(sync_fence);
+		if (err)
 			goto clean_up_priv_cmd;
-		}
+
+		sync_fence = (struct sync_fence *)os_fence.priv;
 	}
-#endif
 
 	err = gk20a_fence_from_syncpt(fence, sp->nvhost_dev,
 			sp->id, thresh, sync_fence);
 
 	if (err) {
-#ifdef CONFIG_SYNC
-		if (sync_fence)
-			sync_fence_put(sync_fence);
-#endif
+		if (nvgpu_os_fence_is_initialized(&os_fence))
+			os_fence.ops->drop_ref(&os_fence);
 		goto clean_up_priv_cmd;
 	}
 
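After this change, both wait paths funnel through gk20a_channel_gen_syncpt_wait_cmd(): gk20a_channel_syncpt_wait_syncpt() passes pos = 0 and preallocated = false so the helper allocates its own priv cmd entry, while a multi-point os_fence backend can preallocate one buffer and fill it slot by slot, letting the helper zero-fill slots for already-expired points. A hedged sketch of that batched pattern (the wait_id/wait_value arrays and the loop are illustrative, not the actual program_waits implementation):

	/* Illustrative batched use: one preallocated buffer, one slot
	 * per fence point; expired points are zero-filled by the helper. */
	err = gk20a_channel_alloc_priv_cmdbuf(c,
			wait_cmd_size * num_wait_cmds, wait_cmd);
	if (err)
		return err;

	for (i = 0; i < num_wait_cmds; i++) {
		err = gk20a_channel_gen_syncpt_wait_cmd(c,
				wait_id[i], wait_value[i], wait_cmd,
				wait_cmd_size, i, true);
		if (err)
			break;
	}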