Diffstat (limited to 'drivers/misc/cxl/native.c')

-rw-r--r--  drivers/misc/cxl/native.c  683
1 file changed, 683 insertions, 0 deletions
diff --git a/drivers/misc/cxl/native.c b/drivers/misc/cxl/native.c
new file mode 100644
index 000000000000..623286a77114
--- /dev/null
+++ b/drivers/misc/cxl/native.c
@@ -0,0 +1,683 @@
/*
 * Copyright 2014 IBM Corp.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */

#include <linux/spinlock.h>
#include <linux/sched.h>
#include <linux/slab.h>
#include <linux/mutex.h>
#include <linux/mm.h>
#include <linux/uaccess.h>
#include <asm/synch.h>
#include <misc/cxl.h>

#include "cxl.h"

static int afu_control(struct cxl_afu *afu, u64 command,
		       u64 result, u64 mask, bool enabled)
{
	u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	spin_lock(&afu->afu_cntl_lock);
	pr_devel("AFU command starting: %llx\n", command);

	cxl_p2n_write(afu, CXL_AFU_Cntl_An, AFU_Cntl | command);

	AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	while ((AFU_Cntl & mask) != result) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: AFU control timed out!\n");
			spin_unlock(&afu->afu_cntl_lock);
			return -EBUSY;
		}
		pr_devel_ratelimited("AFU control... (0x%.16llx)\n",
				     AFU_Cntl | command);
		cpu_relax();
		AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	}
	pr_devel("AFU command complete: %llx\n", command);
	afu->enabled = enabled;
	spin_unlock(&afu->afu_cntl_lock);

	return 0;
}

static int afu_enable(struct cxl_afu *afu)
{
	pr_devel("AFU enable request\n");

	return afu_control(afu, CXL_AFU_Cntl_An_E,
			   CXL_AFU_Cntl_An_ES_Enabled,
			   CXL_AFU_Cntl_An_ES_MASK, true);
}

int cxl_afu_disable(struct cxl_afu *afu)
{
	pr_devel("AFU disable request\n");

	return afu_control(afu, 0, CXL_AFU_Cntl_An_ES_Disabled,
			   CXL_AFU_Cntl_An_ES_MASK, false);
}

/* This will disable as well as reset */
int cxl_afu_reset(struct cxl_afu *afu)
{
	pr_devel("AFU reset request\n");

	return afu_control(afu, CXL_AFU_Cntl_An_RA,
			   CXL_AFU_Cntl_An_RS_Complete | CXL_AFU_Cntl_An_ES_Disabled,
			   CXL_AFU_Cntl_An_RS_MASK | CXL_AFU_Cntl_An_ES_MASK,
			   false);
}

static int afu_check_and_enable(struct cxl_afu *afu)
{
	if (afu->enabled)
		return 0;
	return afu_enable(afu);
}

int cxl_psl_purge(struct cxl_afu *afu)
{
	u64 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	u64 dsisr, dar;
	u64 start, end;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("PSL purge request\n");

	if ((AFU_Cntl & CXL_AFU_Cntl_An_ES_MASK) != CXL_AFU_Cntl_An_ES_Disabled) {
		WARN(1, "psl_purge request while AFU not disabled!\n");
		cxl_afu_disable(afu);
	}

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL | CXL_PSL_SCNTL_An_Pc);
	start = local_clock();
	PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	while ((PSL_CNTL & CXL_PSL_SCNTL_An_Ps_MASK)
	       == CXL_PSL_SCNTL_An_Ps_Pending) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: PSL Purge timed out!\n");
			return -EBUSY;
		}
		dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
		pr_devel_ratelimited("PSL purging... PSL_CNTL: 0x%.16llx PSL_DSISR: 0x%.16llx\n", PSL_CNTL, dsisr);
		if (dsisr & CXL_PSL_DSISR_TRANS) {
			dar = cxl_p2n_read(afu, CXL_PSL_DAR_An);
			dev_notice(&afu->dev, "PSL purge terminating pending translation, DSISR: 0x%.16llx, DAR: 0x%.16llx\n", dsisr, dar);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE);
		} else if (dsisr) {
			dev_notice(&afu->dev, "PSL purge acknowledging pending non-translation fault, DSISR: 0x%.16llx\n", dsisr);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A);
		} else {
			cpu_relax();
		}
		PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	}
	end = local_clock();
	pr_devel("PSL purged in %lld ns\n", end - start);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL & ~CXL_PSL_SCNTL_An_Pc);
	return 0;
}

static int spa_max_procs(int spa_size)
{
	/*
	 * From the CAIA:
	 * end_of_SPA_area = SPA_Base + ((n+4) * 128) + (( ((n*8) + 127) >> 7) * 128) + 255
	 * Most of that junk is really just an overly-complicated way of saying
	 * the last 256 bytes are __aligned(128), so it's really:
	 * end_of_SPA_area = end_of_PSL_queue_area + __aligned(128) 255
	 * and
	 * end_of_PSL_queue_area = SPA_Base + ((n+4) * 128) + (n*8) - 1
	 * so
	 * sizeof(SPA) = ((n+4) * 128) + (n*8) + __aligned(128) 256
	 * Ignore the alignment (which is safe in this case as long as we are
	 * careful with our rounding) and solve for n:
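	 *   sizeof(SPA) = 128(n+4) + 8n + 256 = 136n + 768
	 *   n = (sizeof(SPA) - 768) / 136 = ((sizeof(SPA) / 8) - 96) / 17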
	 */
	return ((spa_size / 8) - 96) / 17;
}

static int alloc_spa(struct cxl_afu *afu)
{
	u64 spap;

	/* Work out how many pages to allocate */
	afu->spa_order = 0;
	do {
		afu->spa_order++;
		afu->spa_size = (1 << afu->spa_order) * PAGE_SIZE;
		afu->spa_max_procs = spa_max_procs(afu->spa_size);
	} while (afu->spa_max_procs < afu->num_procs);

	WARN_ON(afu->spa_size > 0x100000); /* Max size supported by the hardware */

	if (!(afu->spa = (struct cxl_process_element *)
	      __get_free_pages(GFP_KERNEL | __GFP_ZERO, afu->spa_order))) {
		pr_err("cxl_alloc_spa: Unable to allocate scheduled process area\n");
		return -ENOMEM;
	}
	pr_devel("spa pages: %i afu->spa_max_procs: %i afu->num_procs: %i\n",
		 1<<afu->spa_order, afu->spa_max_procs, afu->num_procs);

	afu->sw_command_status = (__be64 *)((char *)afu->spa +
					    ((afu->spa_max_procs + 3) * 128));

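	/* Point the PSL at the SPA: physical base address, an encoding of
	 * the area's size, and the valid bit */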
	spap = virt_to_phys(afu->spa) & CXL_PSL_SPAP_Addr;
	spap |= ((afu->spa_size >> (12 - CXL_PSL_SPAP_Size_Shift)) - 1) & CXL_PSL_SPAP_Size;
	spap |= CXL_PSL_SPAP_V;
	pr_devel("cxl: SPA allocated at 0x%p. Max processes: %i, sw_command_status: 0x%p CXL_PSL_SPAP_An=0x%016llx\n", afu->spa, afu->spa_max_procs, afu->sw_command_status, spap);
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, spap);

	return 0;
}

static void release_spa(struct cxl_afu *afu)
{
	free_pages((unsigned long) afu->spa, afu->spa_order);
}

int cxl_tlb_slb_invalidate(struct cxl *adapter)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("CXL adapter wide TLBIA & SLBIA\n");

	cxl_p1_write(adapter, CXL_PSL_AFUSEL, CXL_PSL_AFUSEL_A);

	cxl_p1_write(adapter, CXL_PSL_TLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_TLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide TLBIA timed out!\n");
			return -EBUSY;
		}
		cpu_relax();
	}

	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_SLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide SLBIA timed out!\n");
			return -EBUSY;
		}
		cpu_relax();
	}
	return 0;
}

int cxl_afu_slbia(struct cxl_afu *afu)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("cxl_afu_slbia issuing SLBIA command\n");
	cxl_p2n_write(afu, CXL_SLBIA_An, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p2n_read(afu, CXL_SLBIA_An) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: CXL AFU SLBIA timed out!\n");
			return -EBUSY;
		}
		cpu_relax();
	}
	return 0;
}

static int cxl_write_sstp(struct cxl_afu *afu, u64 sstp0, u64 sstp1)
{
	int rc;

	/* 1. Disable SSTP by writing 0 to SSTP1[V] */
	cxl_p2n_write(afu, CXL_SSTP1_An, 0);

	/* 2. Invalidate all SLB entries */
	if ((rc = cxl_afu_slbia(afu)))
		return rc;

	/* 3. Set SSTP0_An */
	cxl_p2n_write(afu, CXL_SSTP0_An, sstp0);

	/* 4. Set SSTP1_An */
	cxl_p2n_write(afu, CXL_SSTP1_An, sstp1);

	return 0;
}

/* Using per slice version may improve performance here. (ie. SLBIA_An) */
static void slb_invalid(struct cxl_context *ctx)
{
	struct cxl *adapter = ctx->afu->adapter;
	u64 slbia;

	WARN_ON(!mutex_is_locked(&ctx->afu->spa_mutex));

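	/* Select the PID/LPID pair whose SLB entries should be invalidated */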
	cxl_p1_write(adapter, CXL_PSL_LBISEL,
		     ((u64)be32_to_cpu(ctx->elem->common.pid) << 32) |
		     be32_to_cpu(ctx->elem->lpid));
	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_LPIDPID);

	while (1) {
		slbia = cxl_p1_read(adapter, CXL_PSL_SLBIA);
		if (!(slbia & CXL_TLB_SLB_P))
			break;
		cpu_relax();
	}
}

static int do_process_element_cmd(struct cxl_context *ctx,
				  u64 cmd, u64 pe_state)
{
	u64 state;

	WARN_ON(!ctx->afu->enabled);

	ctx->elem->software_state = cpu_to_be32(pe_state);
	smp_wmb();
	*(ctx->afu->sw_command_status) = cpu_to_be64(cmd | 0 | ctx->pe);
	smp_mb();
	cxl_p1n_write(ctx->afu, CXL_PSL_LLCMD_An, cmd | ctx->pe);
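	/* On completion the PSL echoes the command, the resulting state and
	 * the PE link back into sw_command_status; all 1s indicates an
	 * error */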
	while (1) {
		state = be64_to_cpup(ctx->afu->sw_command_status);
		if (state == ~0ULL) {
			pr_err("cxl: Error adding process element to AFU\n");
			return -1;
		}
		if ((state & (CXL_SPA_SW_CMD_MASK | CXL_SPA_SW_STATE_MASK | CXL_SPA_SW_LINK_MASK)) ==
		    (cmd | (cmd >> 16) | ctx->pe))
			break;
		/*
		 * The command won't finish in the PSL if there are
		 * outstanding DSIs. Hence we need to yield here in
		 * case there are outstanding DSIs that we need to
		 * service. Tuning possibility: we could wait for a
		 * while before scheduling.
		 */
		schedule();
	}
	return 0;
}

static int add_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->spa_mutex);
	pr_devel("%s Adding pe: %i started\n", __func__, ctx->pe);
	if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_ADD, CXL_PE_SOFTWARE_STATE_V)))
		ctx->pe_inserted = true;
	pr_devel("%s Adding pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->spa_mutex);
	return rc;
}

static int terminate_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	/* fast path terminate if it's already invalid */
	if (!(ctx->elem->software_state & cpu_to_be32(CXL_PE_SOFTWARE_STATE_V)))
		return rc;

	mutex_lock(&ctx->afu->spa_mutex);
	pr_devel("%s Terminate pe: %i started\n", __func__, ctx->pe);
	rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_TERMINATE,
				    CXL_PE_SOFTWARE_STATE_V | CXL_PE_SOFTWARE_STATE_T);
	ctx->elem->software_state = 0;	/* Remove Valid bit */
	pr_devel("%s Terminate pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->spa_mutex);
	return rc;
}

static int remove_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->spa_mutex);
	pr_devel("%s Remove pe: %i started\n", __func__, ctx->pe);
	if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_REMOVE, 0)))
		ctx->pe_inserted = false;
	slb_invalid(ctx);
	pr_devel("%s Remove pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->spa_mutex);

	return rc;
}

static void assign_psn_space(struct cxl_context *ctx)
{
	if (!ctx->afu->pp_size || ctx->master) {
		ctx->psn_phys = ctx->afu->psn_phys;
		ctx->psn_size = ctx->afu->adapter->ps_size;
	} else {
		ctx->psn_phys = ctx->afu->psn_phys +
			(ctx->afu->pp_offset + ctx->afu->pp_size * ctx->pe);
		ctx->psn_size = ctx->afu->pp_size;
	}
}

static int activate_afu_directed(struct cxl_afu *afu)
{
	int rc;

	dev_info(&afu->dev, "Activating AFU directed mode\n");

	if (alloc_spa(afu))
		return -ENOMEM;

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_AFU);
	cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L);

	afu->current_mode = CXL_MODE_DIRECTED;
	afu->num_procs = afu->max_procs_virtualised;

	if ((rc = cxl_chardev_m_afu_add(afu)))
		return rc;

	if ((rc = cxl_sysfs_afu_m_add(afu)))
		goto err;

	if ((rc = cxl_chardev_s_afu_add(afu)))
		goto err1;

	return 0;
err1:
	cxl_sysfs_afu_m_remove(afu);
err:
	cxl_chardev_afu_remove(afu);
	return rc;
}

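/* The context's state register LE bit should match the kernel's endianness */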
#ifdef CONFIG_CPU_LITTLE_ENDIAN
#define set_endian(sr) ((sr) |= CXL_PSL_SR_An_LE)
#else
#define set_endian(sr) ((sr) &= ~(CXL_PSL_SR_An_LE))
#endif

static int attach_afu_directed(struct cxl_context *ctx, u64 wed, u64 amr)
{
	u64 sr;
	int r, result;

	assign_psn_space(ctx);

	ctx->elem->ctxtime = 0; /* disable */
	ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID));
	ctx->elem->haurp = 0; /* disable */
	ctx->elem->sdr = cpu_to_be64(mfspr(SPRN_SDR1));

	sr = CXL_PSL_SR_An_SC;
	if (ctx->master)
		sr |= CXL_PSL_SR_An_MP;
	if (mfspr(SPRN_LPCR) & LPCR_TC)
		sr |= CXL_PSL_SR_An_TC;
	/* HV=0, PR=1, R=1 for userspace
	 * For kernel contexts: this would need to change
	 */
	sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R;
	set_endian(sr);
	sr &= ~(CXL_PSL_SR_An_HV);
	if (!test_tsk_thread_flag(current, TIF_32BIT))
		sr |= CXL_PSL_SR_An_SF;
	ctx->elem->common.pid = cpu_to_be32(current->pid);
	ctx->elem->common.tid = 0;
	ctx->elem->sr = cpu_to_be64(sr);

	ctx->elem->common.csrp = 0; /* disable */
	ctx->elem->common.aurp0 = 0; /* disable */
	ctx->elem->common.aurp1 = 0; /* disable */

	cxl_prefault(ctx, wed);

	ctx->elem->common.sstp0 = cpu_to_be64(ctx->sstp0);
	ctx->elem->common.sstp1 = cpu_to_be64(ctx->sstp1);

	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]);
		ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]);
	}

	ctx->elem->common.amr = cpu_to_be64(amr);
	ctx->elem->common.wed = cpu_to_be64(wed);

	/* first guy needs to enable */
	if ((result = afu_check_and_enable(ctx->afu)))
		return result;

	add_process_element(ctx);

	return 0;
}

static int deactivate_afu_directed(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating AFU directed mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_sysfs_afu_m_remove(afu);
	cxl_chardev_afu_remove(afu);

	cxl_afu_reset(afu);
	cxl_afu_disable(afu);
	cxl_psl_purge(afu);

	release_spa(afu);

	return 0;
}

static int activate_dedicated_process(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Activating dedicated process mode\n");

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process);

	cxl_p1n_write(afu, CXL_PSL_CtxTime_An, 0); /* disable */
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0);    /* disable */
	cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_LPID_An, mfspr(SPRN_LPID));
	cxl_p1n_write(afu, CXL_HAURP_An, 0);       /* disable */
	cxl_p1n_write(afu, CXL_PSL_SDR_An, mfspr(SPRN_SDR1));

	cxl_p2n_write(afu, CXL_CSRP_An, 0);  /* disable */
	cxl_p2n_write(afu, CXL_AURP0_An, 0); /* disable */
	cxl_p2n_write(afu, CXL_AURP1_An, 0); /* disable */

	afu->current_mode = CXL_MODE_DEDICATED;
	afu->num_procs = 1;

	return cxl_chardev_d_afu_add(afu);
}

static int attach_dedicated(struct cxl_context *ctx, u64 wed, u64 amr)
{
	struct cxl_afu *afu = ctx->afu;
	u64 sr;
	int rc;

	sr = CXL_PSL_SR_An_SC;
	set_endian(sr);
	if (ctx->master)
		sr |= CXL_PSL_SR_An_MP;
	if (mfspr(SPRN_LPCR) & LPCR_TC)
		sr |= CXL_PSL_SR_An_TC;
	sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R;
	if (!test_tsk_thread_flag(current, TIF_32BIT))
		sr |= CXL_PSL_SR_An_SF;
	cxl_p2n_write(afu, CXL_PSL_PID_TID_An, (u64)current->pid << 32);
	cxl_p1n_write(afu, CXL_PSL_SR_An, sr);

	if ((rc = cxl_write_sstp(afu, ctx->sstp0, ctx->sstp1)))
		return rc;

	cxl_prefault(ctx, wed);

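	/* Pack the four IVTE offset/range pairs into 16-bit fields */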
	cxl_p1n_write(afu, CXL_PSL_IVTE_Offset_An,
		      (((u64)ctx->irqs.offset[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.offset[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.offset[2] & 0xffff) << 16) |
		      ((u64)ctx->irqs.offset[3] & 0xffff));
	cxl_p1n_write(afu, CXL_PSL_IVTE_Limit_An, (u64)
		      (((u64)ctx->irqs.range[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.range[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.range[2] & 0xffff) << 16) |
		      ((u64)ctx->irqs.range[3] & 0xffff));

	cxl_p2n_write(afu, CXL_PSL_AMR_An, amr);

	/* master only context for dedicated */
	assign_psn_space(ctx);

	if ((rc = cxl_afu_reset(afu)))
		return rc;

	cxl_p2n_write(afu, CXL_PSL_WED_An, wed);

	return afu_enable(afu);
}

static int deactivate_dedicated_process(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating dedicated process mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_chardev_afu_remove(afu);

	return 0;
}

int _cxl_afu_deactivate_mode(struct cxl_afu *afu, int mode)
{
	if (mode == CXL_MODE_DIRECTED)
		return deactivate_afu_directed(afu);
	if (mode == CXL_MODE_DEDICATED)
		return deactivate_dedicated_process(afu);
	return 0;
}

int cxl_afu_deactivate_mode(struct cxl_afu *afu)
{
	return _cxl_afu_deactivate_mode(afu, afu->current_mode);
}

int cxl_afu_activate_mode(struct cxl_afu *afu, int mode)
{
	if (!mode)
		return 0;
	if (!(mode & afu->modes_supported))
		return -EINVAL;

	if (mode == CXL_MODE_DIRECTED)
		return activate_afu_directed(afu);
	if (mode == CXL_MODE_DEDICATED)
		return activate_dedicated_process(afu);

	return -EINVAL;
}

int cxl_attach_process(struct cxl_context *ctx, bool kernel, u64 wed, u64 amr)
{
	ctx->kernel = kernel;
	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
		return attach_afu_directed(ctx, wed, amr);

	if (ctx->afu->current_mode == CXL_MODE_DEDICATED)
		return attach_dedicated(ctx, wed, amr);

	return -EINVAL;
}

static inline int detach_process_native_dedicated(struct cxl_context *ctx)
{
	cxl_afu_reset(ctx->afu);
	cxl_afu_disable(ctx->afu);
	cxl_psl_purge(ctx->afu);
	return 0;
}

/*
 * TODO: handle the case where this is called inside an rcu_read_lock(),
 * which may happen when we unbind the driver (ie. cxl_context_detach_all()).
 * Terminate & remove take a mutex and call schedule(), which is not safe
 * with that lock held. May need a version of do_process_element_cmd() that
 * handles outstanding page faults synchronously.
 */
static inline int detach_process_native_afu_directed(struct cxl_context *ctx)
{
	if (!ctx->pe_inserted)
		return 0;
	if (terminate_process_element(ctx))
		return -1;
	if (remove_process_element(ctx))
		return -1;

	return 0;
}

int cxl_detach_process(struct cxl_context *ctx)
{
	if (ctx->afu->current_mode == CXL_MODE_DEDICATED)
		return detach_process_native_dedicated(ctx);

	return detach_process_native_afu_directed(ctx);
}

int cxl_get_irq(struct cxl_context *ctx, struct cxl_irq_info *info)
{
	u64 pidtid;

	info->dsisr = cxl_p2n_read(ctx->afu, CXL_PSL_DSISR_An);
	info->dar = cxl_p2n_read(ctx->afu, CXL_PSL_DAR_An);
	info->dsr = cxl_p2n_read(ctx->afu, CXL_PSL_DSR_An);
	pidtid = cxl_p2n_read(ctx->afu, CXL_PSL_PID_TID_An);
	info->pid = pidtid >> 32;
	info->tid = pidtid & 0xffffffff;
	info->afu_err = cxl_p2n_read(ctx->afu, CXL_AFU_ERR_An);
	info->errstat = cxl_p2n_read(ctx->afu, CXL_PSL_ErrStat_An);

	return 0;
}

static void recover_psl_err(struct cxl_afu *afu, u64 errstat)
{
	u64 dsisr;

	pr_devel("RECOVERING FROM PSL ERROR... (0x%.16llx)\n", errstat);

	/* Clear PSL_DSISR[PE] */
	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	cxl_p2n_write(afu, CXL_PSL_DSISR_An, dsisr & ~CXL_PSL_DSISR_An_PE);

	/* Write 1s to clear error status bits */
	cxl_p2n_write(afu, CXL_PSL_ErrStat_An, errstat);
}

int cxl_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
{
	if (tfc)
		cxl_p2n_write(ctx->afu, CXL_PSL_TFC_An, tfc);
	if (psl_reset_mask)
		recover_psl_err(ctx->afu, psl_reset_mask);

	return 0;
}

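/* An MMIO read of all 1s suggests the PSL registers are no longer
 * accessible (e.g. the card has gone away) */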
int cxl_check_error(struct cxl_afu *afu)
{
	return (cxl_p1n_read(afu, CXL_PSL_SCNTL_An) == ~0ULL);
}
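
For orientation, the call sequence the rest of the driver is expected to follow
against these entry points is sketched below. This is illustrative only and not
part of the patch: the caller is hypothetical, and the context setup (allocating
the struct cxl_context, filling in sstp0/sstp1 and the IRQ ranges) is assumed to
happen elsewhere in the driver.

/* Hypothetical caller, for illustration only -- not part of this file */
static int example_run_job(struct cxl_afu *afu, struct cxl_context *ctx,
			   u64 wed, u64 amr)
{
	int rc;

	/* Put the AFU into a supported mode (here: AFU directed) */
	if ((rc = cxl_afu_activate_mode(afu, CXL_MODE_DIRECTED)))
		return rc;

	/* Insert this context's process element so the AFU can run it */
	if ((rc = cxl_attach_process(ctx, false, wed, amr)))
		goto out;

	/* ... work runs; faults are read via cxl_get_irq() and
	 * acknowledged via cxl_ack_irq() ... */

	rc = cxl_detach_process(ctx);
out:
	cxl_afu_deactivate_mode(afu);
	return rc;
}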