/*
 * Copyright 2014 IBM Corp.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
#include <linux/spinlock.h>
#include <linux/sched.h>
#include <linux/sched/clock.h>
#include <linux/slab.h>
#include <linux/mutex.h>
#include <linux/mm.h>
#include <linux/uaccess.h>
#include <linux/delay.h>
#include <asm/synch.h>
#include <asm/switch_to.h>
#include <misc/cxl-base.h>

#include "cxl.h"
#include "trace.h"
static int afu_control(struct cxl_afu *afu, u64 command, u64 clear,
		       u64 result, u64 mask, bool enabled)
{
	u64 AFU_Cntl;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	spin_lock(&afu->afu_cntl_lock);
	pr_devel("AFU command starting: %llx\n", command);

	trace_cxl_afu_ctrl(afu, command);

	AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	cxl_p2n_write(afu, CXL_AFU_Cntl_An, (AFU_Cntl & ~clear) | command);

	AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	while ((AFU_Cntl & mask) != result) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: AFU control timed out!\n");
			rc = -EBUSY;
			goto out;
		}

		if (!cxl_ops->link_ok(afu->adapter, afu)) {
			afu->enabled = enabled;
			rc = -EIO;
			goto out;
		}

		pr_devel_ratelimited("AFU control... (0x%016llx)\n",
				     AFU_Cntl | command);
		cpu_relax();
		AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	}

	if (AFU_Cntl & CXL_AFU_Cntl_An_RA) {
		/*
		 * Workaround for a bug in the XSL used in the Mellanox CX4
		 * that fails to clear the RA bit after an AFU reset,
		 * preventing subsequent AFU resets from working.
		 */
		cxl_p2n_write(afu, CXL_AFU_Cntl_An, AFU_Cntl & ~CXL_AFU_Cntl_An_RA);
	}

	pr_devel("AFU command complete: %llx\n", command);
	afu->enabled = enabled;
out:
	trace_cxl_afu_ctrl_done(afu, command, rc);
	spin_unlock(&afu->afu_cntl_lock);

	return rc;
}
static int afu_enable(struct cxl_afu *afu)
{
	pr_devel("AFU enable request\n");

	return afu_control(afu, CXL_AFU_Cntl_An_E, 0,
			   CXL_AFU_Cntl_An_ES_Enabled,
			   CXL_AFU_Cntl_An_ES_MASK, true);
}

int cxl_afu_disable(struct cxl_afu *afu)
{
	pr_devel("AFU disable request\n");

	return afu_control(afu, 0, CXL_AFU_Cntl_An_E,
			   CXL_AFU_Cntl_An_ES_Disabled,
			   CXL_AFU_Cntl_An_ES_MASK, false);
}
/* This will disable as well as reset */
static int native_afu_reset(struct cxl_afu *afu)
{
	int rc;
	u64 serr;

	pr_devel("AFU reset request\n");

	rc = afu_control(afu, CXL_AFU_Cntl_An_RA, 0,
			 CXL_AFU_Cntl_An_RS_Complete | CXL_AFU_Cntl_An_ES_Disabled,
			 CXL_AFU_Cntl_An_RS_MASK | CXL_AFU_Cntl_An_ES_MASK,
			 false);

	/*
	 * Re-enable any masked interrupts when the AFU is not
	 * activated to avoid side effects after attaching a process
	 * in dedicated mode.
	 */
	if (afu->current_mode == 0) {
		serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
		serr &= ~CXL_PSL_SERR_An_IRQ_MASKS;
		cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);
	}

	return rc;
}

static int native_afu_check_and_enable(struct cxl_afu *afu)
{
	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		WARN(1, "Refusing to enable afu while link down!\n");
		return -EIO;
	}
	if (afu->enabled)
		return 0;
	return afu_enable(afu);
}
int cxl_psl_purge(struct cxl_afu *afu)
{
	u64 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	u64 dsisr, dar;
	u64 start, end;
	u64 trans_fault = 0x0ULL;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	trace_cxl_psl_ctrl(afu, CXL_PSL_SCNTL_An_Pc);

	pr_devel("PSL purge request\n");

	if (cxl_is_power8())
		trans_fault = CXL_PSL_DSISR_TRANS;
	if (cxl_is_power9())
		trans_fault = CXL_PSL9_DSISR_An_TF;

	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		dev_warn(&afu->dev, "PSL Purge called with link down, ignoring\n");
		rc = -EIO;
		goto out;
	}

	if ((AFU_Cntl & CXL_AFU_Cntl_An_ES_MASK) != CXL_AFU_Cntl_An_ES_Disabled) {
		WARN(1, "psl_purge request while AFU not disabled!\n");
		cxl_afu_disable(afu);
	}

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL | CXL_PSL_SCNTL_An_Pc);
	start = local_clock();
	PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	while ((PSL_CNTL & CXL_PSL_SCNTL_An_Ps_MASK)
			== CXL_PSL_SCNTL_An_Ps_Pending) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: PSL Purge timed out!\n");
			rc = -EBUSY;
			goto out;
		}
		if (!cxl_ops->link_ok(afu->adapter, afu)) {
			rc = -EIO;
			goto out;
		}

		dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
		pr_devel_ratelimited("PSL purging... PSL_CNTL: 0x%016llx PSL_DSISR: 0x%016llx\n",
				     PSL_CNTL, dsisr);

		if (dsisr & trans_fault) {
			dar = cxl_p2n_read(afu, CXL_PSL_DAR_An);
			dev_notice(&afu->dev, "PSL purge terminating pending translation, DSISR: 0x%016llx, DAR: 0x%016llx\n",
				   dsisr, dar);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE);
		} else if (dsisr) {
			dev_notice(&afu->dev, "PSL purge acknowledging pending non-translation fault, DSISR: 0x%016llx\n",
				   dsisr);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A);
		} else {
			cpu_relax();
		}
		PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	}
	end = local_clock();
	pr_devel("PSL purged in %lld ns\n", end - start);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL & ~CXL_PSL_SCNTL_An_Pc);
out:
	trace_cxl_psl_ctrl_done(afu, CXL_PSL_SCNTL_An_Pc, rc);
	return rc;
}
static int spa_max_procs(int spa_size)
{
	/*
	 * From the CAIA:
	 *    end_of_SPA_area = SPA_Base + ((n+4) * 128) + (( ((n*8) + 127) >> 7) * 128) + 255
	 * Most of that junk is really just an overly-complicated way of saying
	 * the last 256 bytes are __aligned(128), so it's really:
	 *    end_of_SPA_area = end_of_PSL_queue_area + __aligned(128) 255
	 * and
	 *    end_of_PSL_queue_area = SPA_Base + ((n+4) * 128) + (n*8) - 1
	 * so
	 *    sizeof(SPA) = ((n+4) * 128) + (n*8) + __aligned(128) 256
	 * Ignore the alignment (which is safe in this case as long as we are
	 * careful with our rounding) and solve for n:
	 */
	return ((spa_size / 8) - 96) / 17;
}
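
/*
 * Worked example of the formula above (illustrative numbers only): for a
 * 64KB SPA, spa_size = 65536, so
 *    n = ((65536 / 8) - 96) / 17 = (8192 - 96) / 17 = 8096 / 17 = 476
 * process elements (integer division, rounding down as noted above).
 */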
static int cxl_alloc_spa(struct cxl_afu *afu, int mode)
{
	unsigned spa_size;

	/* Work out how many pages to allocate */
	afu->native->spa_order = -1;
	do {
		afu->native->spa_order++;
		spa_size = (1 << afu->native->spa_order) * PAGE_SIZE;

		if (spa_size > 0x100000) {
			dev_warn(&afu->dev, "num_of_processes too large for the SPA, limiting to %i (0x%x)\n",
				 afu->native->spa_max_procs, afu->native->spa_size);
			if (mode != CXL_MODE_DEDICATED)
				afu->num_procs = afu->native->spa_max_procs;
			break;
		}

		afu->native->spa_size = spa_size;
		afu->native->spa_max_procs = spa_max_procs(afu->native->spa_size);
	} while (afu->native->spa_max_procs < afu->num_procs);

	if (!(afu->native->spa = (struct cxl_process_element *)
	      __get_free_pages(GFP_KERNEL | __GFP_ZERO, afu->native->spa_order))) {
		pr_err("cxl_alloc_spa: Unable to allocate scheduled process area\n");
		return -ENOMEM;
	}
	pr_devel("spa pages: %i afu->spa_max_procs: %i afu->num_procs: %i\n",
		 1<<afu->native->spa_order, afu->native->spa_max_procs, afu->num_procs);

	return 0;
}
static void attach_spa(struct cxl_afu *afu)
{
	u64 spap;

	afu->native->sw_command_status = (__be64 *)((char *)afu->native->spa +
					 ((afu->native->spa_max_procs + 3) * 128));

	spap = virt_to_phys(afu->native->spa) & CXL_PSL_SPAP_Addr;
	spap |= ((afu->native->spa_size >> (12 - CXL_PSL_SPAP_Size_Shift)) - 1) & CXL_PSL_SPAP_Size;
	spap |= CXL_PSL_SPAP_V;
	pr_devel("cxl: SPA allocated at 0x%p. Max processes: %i, sw_command_status: 0x%p CXL_PSL_SPAP_An=0x%016llx\n",
		 afu->native->spa, afu->native->spa_max_procs,
		 afu->native->sw_command_status, spap);
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, spap);
}
static inline void detach_spa(struct cxl_afu *afu)
{
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0);
}

void cxl_release_spa(struct cxl_afu *afu)
{
	if (afu->native->spa) {
		free_pages((unsigned long) afu->native->spa,
			   afu->native->spa_order);
		afu->native->spa = NULL;
	}
}
/*
 * Invalidation of all ERAT entries is no longer required by CAIA2. Use
 * only for debug.
 */
int cxl_invalidate_all_psl9(struct cxl *adapter)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	u64 ierat;

	pr_devel("CXL adapter - invalidation of all ERAT entries\n");

	/* Invalidates all ERAT entries for Radix or HPT */
	ierat = CXL_XSL9_IERAT_IALL;
	if (radix_enabled())
		ierat |= CXL_XSL9_IERAT_INVR;
	cxl_p1_write(adapter, CXL_XSL9_IERAT, ierat);

	while (cxl_p1_read(adapter, CXL_XSL9_IERAT) & CXL_XSL9_IERAT_IINPROG) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev,
				 "WARNING: CXL adapter invalidation of all ERAT entries timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}
	return 0;
}
int cxl_invalidate_all_psl8(struct cxl *adapter)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("CXL adapter wide TLBIA & SLBIA\n");

	cxl_p1_write(adapter, CXL_PSL_AFUSEL, CXL_PSL_AFUSEL_A);

	cxl_p1_write(adapter, CXL_PSL_TLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_TLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide TLBIA timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}

	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_SLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide SLBIA timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}
	return 0;
}
int cxl_data_cache_flush(struct cxl *adapter)
{
	u64 reg;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	/*
	 * Do a data cache flush only if the data cache is available.
	 * On PSL9D the data cache is absent, so the flush operation
	 * would time out.
	 */
	if (adapter->native->no_data_cache) {
		pr_devel("No PSL data cache. Ignoring cache flush req.\n");
		return 0;
	}

	pr_devel("Flushing data cache\n");
	reg = cxl_p1_read(adapter, CXL_PSL_Control);
	reg |= CXL_PSL_Control_Fr;
	cxl_p1_write(adapter, CXL_PSL_Control, reg);

	reg = cxl_p1_read(adapter, CXL_PSL_Control);
	while ((reg & CXL_PSL_Control_Fs_MASK) != CXL_PSL_Control_Fs_Complete) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: cache flush timed out!\n");
			return -EBUSY;
		}

		if (!cxl_ops->link_ok(adapter, NULL)) {
			dev_warn(&adapter->dev, "WARNING: link down when flushing cache\n");
			return -EIO;
		}
		cpu_relax();
		reg = cxl_p1_read(adapter, CXL_PSL_Control);
	}

	reg &= ~CXL_PSL_Control_Fr;
	cxl_p1_write(adapter, CXL_PSL_Control, reg);
	return 0;
}
static int cxl_write_sstp(struct cxl_afu *afu, u64 sstp0, u64 sstp1)
{
	int rc;

	/* 1. Disable SSTP by writing 0 to SSTP1[V] */
	cxl_p2n_write(afu, CXL_SSTP1_An, 0);

	/* 2. Invalidate all SLB entries */
	if ((rc = cxl_afu_slbia(afu)))
		return rc;

	/* 3. Set SSTP0_An */
	cxl_p2n_write(afu, CXL_SSTP0_An, sstp0);

	/* 4. Set SSTP1_An */
	cxl_p2n_write(afu, CXL_SSTP1_An, sstp1);

	return 0;
}
/* Using per slice version may improve performance here. (ie. SLBIA_An) */
static void slb_invalid(struct cxl_context *ctx)
{
	struct cxl *adapter = ctx->afu->adapter;
	u64 slbia;

	WARN_ON(!mutex_is_locked(&ctx->afu->native->spa_mutex));

	cxl_p1_write(adapter, CXL_PSL_LBISEL,
		     ((u64)be32_to_cpu(ctx->elem->common.pid) << 32) |
		     be32_to_cpu(ctx->elem->lpid));
	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_LPIDPID);

	while (1) {
		if (!cxl_ops->link_ok(adapter, NULL))
			break;
		slbia = cxl_p1_read(adapter, CXL_PSL_SLBIA);
		if (!(slbia & CXL_TLB_SLB_P))
			break;
		cpu_relax();
	}
}
static int do_process_element_cmd(struct cxl_context *ctx,
				  u64 cmd, u64 pe_state)
{
	u64 state;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	trace_cxl_llcmd(ctx, cmd);

	WARN_ON(!ctx->afu->enabled);

	ctx->elem->software_state = cpu_to_be32(pe_state);
	smp_wmb();
	*(ctx->afu->native->sw_command_status) = cpu_to_be64(cmd | 0 | ctx->pe);
	smp_mb();
	cxl_p1n_write(ctx->afu, CXL_PSL_LLCMD_An, cmd | ctx->pe);
	while (1) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&ctx->afu->dev, "WARNING: Process Element Command timed out!\n");
			rc = -EBUSY;
			goto out;
		}
		if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu)) {
			dev_warn(&ctx->afu->dev, "WARNING: Device link down, aborting Process Element Command!\n");
			rc = -EIO;
			goto out;
		}
		state = be64_to_cpup(ctx->afu->native->sw_command_status);
		if (state == ~0ULL) {
			pr_err("cxl: Error adding process element to AFU\n");
			rc = -1;
			goto out;
		}
		if ((state & (CXL_SPA_SW_CMD_MASK | CXL_SPA_SW_STATE_MASK | CXL_SPA_SW_LINK_MASK)) ==
		    (cmd | (cmd >> 16) | ctx->pe))
			break;
		/*
		 * The command won't finish in the PSL if there are
		 * outstanding DSIs. Hence we need to yield here in
		 * case there are outstanding DSIs that we need to
		 * service. Tuning possibility: we could wait for a
		 * while before scheduling.
		 */
		schedule();
	}
out:
	trace_cxl_llcmd_done(ctx, cmd, rc);
	return rc;
}
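
/*
 * Note on the completion test above: the software command/status doubleword
 * packs the command, the resulting state and the link (PE handle) fields
 * into one 64-bit value, so the loop exits once the masked status equals
 * cmd | (cmd >> 16) | ctx->pe, i.e. the command field still holds cmd, the
 * state field holds the value cmd >> 16 that corresponds to its completion,
 * and the link field still holds this context's PE handle.
 */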
static int add_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Adding pe: %i started\n", __func__, ctx->pe);
	if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_ADD, CXL_PE_SOFTWARE_STATE_V)))
		ctx->pe_inserted = true;
	pr_devel("%s Adding pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);
	return rc;
}
static int terminate_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	/* fast path terminate if it's already invalid */
	if (!(ctx->elem->software_state & cpu_to_be32(CXL_PE_SOFTWARE_STATE_V)))
		return rc;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Terminate pe: %i started\n", __func__, ctx->pe);
	/* We could be asked to terminate when the hw is down. That
	 * should always succeed: it's not running if the hw has gone
	 * away and is being reset.
	 */
	if (cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
		rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_TERMINATE,
					    CXL_PE_SOFTWARE_STATE_V | CXL_PE_SOFTWARE_STATE_T);
	ctx->elem->software_state = 0;	/* Remove Valid bit */
	pr_devel("%s Terminate pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);
	return rc;
}
static int remove_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Remove pe: %i started\n", __func__, ctx->pe);

	/* We could be asked to remove when the hw is down. Again, if
	 * the hw is down, the PE is gone, so we succeed.
	 */
	if (cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
		rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_REMOVE, 0);

	if (!rc)
		ctx->pe_inserted = false;
	if (cxl_is_power8())
		slb_invalid(ctx);
	pr_devel("%s Remove pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);

	return rc;
}
void cxl_assign_psn_space(struct cxl_context *ctx)
{
	if (!ctx->afu->pp_size || ctx->master) {
		ctx->psn_phys = ctx->afu->psn_phys;
		ctx->psn_size = ctx->afu->adapter->ps_size;
	} else {
		ctx->psn_phys = ctx->afu->psn_phys +
			(ctx->afu->native->pp_offset + ctx->afu->pp_size * ctx->pe);
		ctx->psn_size = ctx->afu->pp_size;
	}
}
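
/*
 * For example (illustrative only): a non-master context with pe = 2 maps a
 * problem state window of afu->pp_size bytes starting at
 * afu->psn_phys + afu->native->pp_offset + 2 * afu->pp_size, whereas master
 * contexts (or AFUs with no per-process area) map the AFU's entire problem
 * state area.
 */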
static int activate_afu_directed(struct cxl_afu *afu)
{
	int rc;

	dev_info(&afu->dev, "Activating AFU directed mode\n");

	afu->num_procs = afu->max_procs_virtualised;
	if (afu->native->spa == NULL) {
		if (cxl_alloc_spa(afu, CXL_MODE_DIRECTED))
			return -ENOMEM;
	}
	attach_spa(afu);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_AFU);
	if (cxl_is_power8())
		cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L);

	afu->current_mode = CXL_MODE_DIRECTED;

	if ((rc = cxl_chardev_m_afu_add(afu)))
		return rc;

	if ((rc = cxl_sysfs_afu_m_add(afu)))
		goto err;

	if ((rc = cxl_chardev_s_afu_add(afu)))
		goto err1;

	return 0;
err1:
	cxl_sysfs_afu_m_remove(afu);
err:
	cxl_chardev_afu_remove(afu);
	return rc;
}
#ifdef CONFIG_CPU_LITTLE_ENDIAN
#define set_endian(sr) ((sr) |= CXL_PSL_SR_An_LE)
#else
#define set_endian(sr) ((sr) &= ~(CXL_PSL_SR_An_LE))
#endif

u64 cxl_calculate_sr(bool master, bool kernel, bool real_mode, bool p9)
{
	u64 sr = 0;

	set_endian(sr);
	if (master)
		sr |= CXL_PSL_SR_An_MP;
	if (mfspr(SPRN_LPCR) & LPCR_TC)
		sr |= CXL_PSL_SR_An_TC;

	if (kernel) {
		if (!real_mode)
			sr |= CXL_PSL_SR_An_R;
		sr |= (mfmsr() & MSR_SF) | CXL_PSL_SR_An_HV;
	} else {
		sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R;
		if (radix_enabled())
			sr |= CXL_PSL_SR_An_HV;
		else
			sr &= ~(CXL_PSL_SR_An_HV);
		if (!test_tsk_thread_flag(current, TIF_32BIT))
			sr |= CXL_PSL_SR_An_SF;
	}
	if (p9) {
		if (radix_enabled())
			sr |= CXL_PSL_SR_An_XLAT_ror;
		else
			sr |= CXL_PSL_SR_An_XLAT_hpt;
	}
	return sr;
}

static u64 calculate_sr(struct cxl_context *ctx)
{
	return cxl_calculate_sr(ctx->master, ctx->kernel, ctx->real_mode,
				cxl_is_power9());
}
static void update_ivtes_directed(struct cxl_context *ctx)
{
	bool need_update = (ctx->status == STARTED);
	int r;

	if (need_update) {
		WARN_ON(terminate_process_element(ctx));
		WARN_ON(remove_process_element(ctx));
	}

	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]);
		ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]);
	}

	/*
	 * Theoretically we could use the update llcmd, instead of a
	 * terminate/remove/add (or if an atomic update was required we could
	 * do a suspend/update/resume), however it seems there might be issues
	 * with the update llcmd on some cards (including those using an XSL on
	 * an ASIC) so for now it's safest to go with the commands that are
	 * known to work. In the future if we come across a situation where the
	 * card may be performing transactions using the same PE while we are
	 * doing this update we might need to revisit this.
	 */
	if (need_update)
		WARN_ON(add_process_element(ctx));
}
static int process_element_entry_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	u32 pid;
	int rc;

	cxl_assign_psn_space(ctx);

	ctx->elem->ctxtime = 0; /* disable */
	ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID));
	ctx->elem->haurp = 0; /* disable */

	if (ctx->kernel) {
		pid = 0;
	} else {
		if (ctx->mm == NULL) {
			pr_devel("%s: unable to get mm for pe=%d pid=%i\n",
				 __func__, ctx->pe, pid_nr(ctx->pid));
			return -EINVAL;
		}
		pid = ctx->mm->context.id;
	}

	/* Assign a unique TIDR (thread id) for the current thread */
	if (!(ctx->tidr) && (ctx->assign_tidr)) {
		rc = set_thread_tidr(current);
		if (rc)
			return -ENODEV;
		ctx->tidr = current->thread.tidr;
		pr_devel("%s: current tidr: %d\n", __func__, ctx->tidr);
	}

	ctx->elem->common.tid = cpu_to_be32(ctx->tidr);
	ctx->elem->common.pid = cpu_to_be32(pid);

	ctx->elem->sr = cpu_to_be64(calculate_sr(ctx));

	ctx->elem->common.csrp = 0; /* disable */

	cxl_prefault(ctx, wed);

	/*
	 * Ensure we have the multiplexed PSL interrupt set up to take faults
	 * for kernel contexts that may not have allocated any AFU IRQs at all:
	 */
	if (ctx->irqs.range[0] == 0) {
		ctx->irqs.offset[0] = ctx->afu->native->psl_hwirq;
		ctx->irqs.range[0] = 1;
	}

	ctx->elem->common.amr = cpu_to_be64(amr);
	ctx->elem->common.wed = cpu_to_be64(wed);

	return 0;
}
int cxl_attach_afu_directed_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	int result;

	/* fill the process element entry */
	result = process_element_entry_psl9(ctx, wed, amr);
	if (result)
		return result;

	update_ivtes_directed(ctx);

	/* first guy needs to enable */
	result = cxl_ops->afu_check_and_enable(ctx->afu);
	if (result)
		return result;

	return add_process_element(ctx);
}
int cxl_attach_afu_directed_psl8(struct cxl_context *ctx, u64 wed, u64 amr)
{
	u32 pid;
	int result;

	cxl_assign_psn_space(ctx);

	ctx->elem->ctxtime = 0; /* disable */
	ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID));
	ctx->elem->haurp = 0; /* disable */
	ctx->elem->u.sdr = cpu_to_be64(mfspr(SPRN_SDR1));

	pid = current->pid;
	if (ctx->kernel)
		pid = 0;
	ctx->elem->common.tid = 0;
	ctx->elem->common.pid = cpu_to_be32(pid);

	ctx->elem->sr = cpu_to_be64(calculate_sr(ctx));

	ctx->elem->common.csrp = 0; /* disable */
	ctx->elem->common.u.psl8.aurp0 = 0; /* disable */
	ctx->elem->common.u.psl8.aurp1 = 0; /* disable */

	cxl_prefault(ctx, wed);

	ctx->elem->common.u.psl8.sstp0 = cpu_to_be64(ctx->sstp0);
	ctx->elem->common.u.psl8.sstp1 = cpu_to_be64(ctx->sstp1);

	/*
	 * Ensure we have the multiplexed PSL interrupt set up to take faults
	 * for kernel contexts that may not have allocated any AFU IRQs at all:
	 */
	if (ctx->irqs.range[0] == 0) {
		ctx->irqs.offset[0] = ctx->afu->native->psl_hwirq;
		ctx->irqs.range[0] = 1;
	}

	update_ivtes_directed(ctx);

	ctx->elem->common.amr = cpu_to_be64(amr);
	ctx->elem->common.wed = cpu_to_be64(wed);

	/* first guy needs to enable */
	if ((result = cxl_ops->afu_check_and_enable(ctx->afu)))
		return result;

	return add_process_element(ctx);
}
static int deactivate_afu_directed(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating AFU directed mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_sysfs_afu_m_remove(afu);
	cxl_chardev_afu_remove(afu);

	/*
	 * The CAIA section 2.2.1 indicates that the procedure for starting and
	 * stopping an AFU in AFU directed mode is AFU specific, which is not
	 * ideal since this code is generic and with one exception has no
	 * knowledge of the AFU. This is in contrast to the procedure for
	 * disabling a dedicated process AFU, which is documented to just
	 * require a reset. The architecture does indicate that both an AFU
	 * reset and an AFU disable should result in the AFU being disabled and
	 * we do both followed by a PSL purge for safety.
	 *
	 * Notably we used to have some issues with the disable sequence on PSL
	 * cards, which is why we ended up using this heavy weight procedure in
	 * the first place, however a bug was discovered that had rendered the
	 * disable operation ineffective, so it is conceivable that was the
	 * sole explanation for those difficulties. Careful regression testing
	 * is recommended if anyone attempts to remove or reorder these
	 * workarounds.
	 *
	 * The XSL on the Mellanox CX4 behaves a little differently from the
	 * PSL based cards and will time out an AFU reset if the AFU is still
	 * enabled. That card is special in that we do have a means to identify
	 * it from this code, so in that case we skip the reset and just use a
	 * disable/purge to avoid the timeout and corresponding noise in the
	 * kernel log.
	 */
	if (afu->adapter->native->sl_ops->needs_reset_before_disable)
		cxl_ops->afu_reset(afu);
	cxl_afu_disable(afu);
	cxl_psl_purge(afu);

	return 0;
}
int cxl_activate_dedicated_process_psl9(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Activating dedicated process mode\n");

	/*
	 * If XSL is set to dedicated mode (Set in PSL_SCNTL reg), the
	 * XSL and AFU are programmed to work with a single context.
	 * The context information should be configured in the SPA area
	 * index 0 (so PSL_SPAP must be configured before enabling the
	 * AFU).
	 */
	afu->num_procs = 1;
	if (afu->native->spa == NULL) {
		if (cxl_alloc_spa(afu, CXL_MODE_DEDICATED))
			return -ENOMEM;
	}
	attach_spa(afu);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process);
	cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L);

	afu->current_mode = CXL_MODE_DEDICATED;

	return cxl_chardev_d_afu_add(afu);
}
int cxl_activate_dedicated_process_psl8(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Activating dedicated process mode\n");

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process);

	cxl_p1n_write(afu, CXL_PSL_CtxTime_An, 0); /* disable */
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0);    /* disable */
	cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_LPID_An, mfspr(SPRN_LPID));
	cxl_p1n_write(afu, CXL_HAURP_An, 0);       /* disable */
	cxl_p1n_write(afu, CXL_PSL_SDR_An, mfspr(SPRN_SDR1));

	cxl_p2n_write(afu, CXL_CSRP_An, 0);        /* disable */
	cxl_p2n_write(afu, CXL_AURP0_An, 0);       /* disable */
	cxl_p2n_write(afu, CXL_AURP1_An, 0);       /* disable */

	afu->current_mode = CXL_MODE_DEDICATED;
	afu->num_procs = 1;

	return cxl_chardev_d_afu_add(afu);
}
void cxl_update_dedicated_ivtes_psl9(struct cxl_context *ctx)
{
	int r;

	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]);
		ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]);
	}
}

void cxl_update_dedicated_ivtes_psl8(struct cxl_context *ctx)
{
	struct cxl_afu *afu = ctx->afu;

	cxl_p1n_write(afu, CXL_PSL_IVTE_Offset_An,
		      (((u64)ctx->irqs.offset[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.offset[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.offset[2] & 0xffff) << 16) |
		       ((u64)ctx->irqs.offset[3] & 0xffff));
	cxl_p1n_write(afu, CXL_PSL_IVTE_Limit_An, (u64)
		      (((u64)ctx->irqs.range[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.range[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.range[2] & 0xffff) << 16) |
		       ((u64)ctx->irqs.range[3] & 0xffff));
}
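
/*
 * Note on the packing above: each IVTE range contributes a 16-bit field, so
 * range 0 lands in bits 63:48 of the register value, range 1 in bits 47:32,
 * range 2 in bits 31:16 and range 3 in bits 15:0, matching the 48/32/16/0
 * bit shifts used for both the offset and limit registers.
 */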
int cxl_attach_dedicated_process_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	struct cxl_afu *afu = ctx->afu;
	int result;

	/* fill the process element entry */
	result = process_element_entry_psl9(ctx, wed, amr);
	if (result)
		return result;

	if (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes)
		afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);

	ctx->elem->software_state = cpu_to_be32(CXL_PE_SOFTWARE_STATE_V);
	/*
	 * Ideally we should do a wmb() here to make sure the changes to the
	 * PE are visible to the card before we call afu_enable.
	 * On ppc64 though all mmios are preceded by a 'sync' instruction hence
	 * we don't need one here.
	 */

	result = cxl_ops->afu_reset(afu);
	if (result)
		return result;

	return afu_enable(afu);
}
int cxl_attach_dedicated_process_psl8(struct cxl_context *ctx, u64 wed, u64 amr)
{
	struct cxl_afu *afu = ctx->afu;
	u64 pid;
	int rc;

	pid = (u64)current->pid << 32;
	if (ctx->kernel)
		pid = 0;
	cxl_p2n_write(afu, CXL_PSL_PID_TID_An, pid);

	cxl_p1n_write(afu, CXL_PSL_SR_An, calculate_sr(ctx));

	if ((rc = cxl_write_sstp(afu, ctx->sstp0, ctx->sstp1)))
		return rc;

	cxl_prefault(ctx, wed);

	if (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes)
		afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);

	cxl_p2n_write(afu, CXL_PSL_AMR_An, amr);

	/* master only context for dedicated */
	cxl_assign_psn_space(ctx);

	if ((rc = cxl_ops->afu_reset(afu)))
		return rc;

	cxl_p2n_write(afu, CXL_PSL_WED_An, wed);

	return afu_enable(afu);
}
static int deactivate_dedicated_process(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating dedicated process mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_chardev_afu_remove(afu);

	return 0;
}

static int native_afu_deactivate_mode(struct cxl_afu *afu, int mode)
{
	if (mode == CXL_MODE_DIRECTED)
		return deactivate_afu_directed(afu);
	if (mode == CXL_MODE_DEDICATED)
		return deactivate_dedicated_process(afu);
	return 0;
}
static int native_afu_activate_mode(struct cxl_afu *afu, int mode)
{
	if (!mode)
		return 0;
	if (!(mode & afu->modes_supported))
		return -EINVAL;

	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		WARN(1, "Device link is down, refusing to activate!\n");
		return -EIO;
	}

	if (mode == CXL_MODE_DIRECTED)
		return activate_afu_directed(afu);
	if ((mode == CXL_MODE_DEDICATED) &&
	    (afu->adapter->native->sl_ops->activate_dedicated_process))
		return afu->adapter->native->sl_ops->activate_dedicated_process(afu);

	return -EINVAL;
}
static int native_attach_process(struct cxl_context *ctx, bool kernel,
				 u64 wed, u64 amr)
{
	if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu)) {
		WARN(1, "Device link is down, refusing to attach process!\n");
		return -EIO;
	}

	ctx->kernel = kernel;
	if ((ctx->afu->current_mode == CXL_MODE_DIRECTED) &&
	    (ctx->afu->adapter->native->sl_ops->attach_afu_directed))
		return ctx->afu->adapter->native->sl_ops->attach_afu_directed(ctx, wed, amr);

	if ((ctx->afu->current_mode == CXL_MODE_DEDICATED) &&
	    (ctx->afu->adapter->native->sl_ops->attach_dedicated_process))
		return ctx->afu->adapter->native->sl_ops->attach_dedicated_process(ctx, wed, amr);

	return -EINVAL;
}
static inline int detach_process_native_dedicated(struct cxl_context *ctx)
{
	/*
	 * The CAIA section 2.1.1 indicates that we need to do an AFU reset to
	 * stop the AFU in dedicated mode (we therefore do not make that
	 * optional like we do in the afu directed path). It does not indicate
	 * that we need to do an explicit disable (which should occur
	 * implicitly as part of the reset) or purge, but we do these as well
	 * to be on the safe side.
	 *
	 * Notably we used to have some issues with the disable sequence
	 * (before the sequence was spelled out in the architecture) which is
	 * why we were so heavy weight in the first place, however a bug was
	 * discovered that had rendered the disable operation ineffective, so
	 * it is conceivable that was the sole explanation for those
	 * difficulties. Point is, we should be careful and do some regression
	 * testing if we ever attempt to remove any part of this procedure.
	 */
	cxl_ops->afu_reset(ctx->afu);
	cxl_afu_disable(ctx->afu);
	cxl_psl_purge(ctx->afu);
	return 0;
}
static void native_update_ivtes(struct cxl_context *ctx)
{
	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
		return update_ivtes_directed(ctx);
	if ((ctx->afu->current_mode == CXL_MODE_DEDICATED) &&
	    (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes))
		return ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);
	WARN(1, "native_update_ivtes: Bad mode\n");
}

static inline int detach_process_native_afu_directed(struct cxl_context *ctx)
{
	if (!ctx->pe_inserted)
		return 0;
	if (terminate_process_element(ctx))
		return -1;
	if (remove_process_element(ctx))
		return -1;

	return 0;
}

static int native_detach_process(struct cxl_context *ctx)
{
	trace_cxl_detach(ctx);

	if (ctx->afu->current_mode == CXL_MODE_DEDICATED)
		return detach_process_native_dedicated(ctx);

	return detach_process_native_afu_directed(ctx);
}
static int native_get_irq_info(struct cxl_afu *afu, struct cxl_irq_info *info)
{
	/* If the adapter has gone away, we can't get any meaningful
	 * information.
	 */
	if (!cxl_ops->link_ok(afu->adapter, afu))
		return -EIO;

	info->dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	info->dar = cxl_p2n_read(afu, CXL_PSL_DAR_An);
	if (cxl_is_power8())
		info->dsr = cxl_p2n_read(afu, CXL_PSL_DSR_An);
	info->afu_err = cxl_p2n_read(afu, CXL_AFU_ERR_An);
	info->errstat = cxl_p2n_read(afu, CXL_PSL_ErrStat_An);
	info->proc_handle = 0;

	return 0;
}
void cxl_native_irq_dump_regs_psl9(struct cxl_context *ctx)
{
	u64 fir1, serr;

	fir1 = cxl_p1_read(ctx->afu->adapter, CXL_PSL9_FIR1);

	dev_crit(&ctx->afu->dev, "PSL_FIR1: 0x%016llx\n", fir1);
	if (ctx->afu->adapter->native->sl_ops->register_serr_irq) {
		serr = cxl_p1n_read(ctx->afu, CXL_PSL_SERR_An);
		cxl_afu_decode_psl_serr(ctx->afu, serr);
	}
}

void cxl_native_irq_dump_regs_psl8(struct cxl_context *ctx)
{
	u64 fir1, fir2, fir_slice, serr, afu_debug;

	fir1 = cxl_p1_read(ctx->afu->adapter, CXL_PSL_FIR1);
	fir2 = cxl_p1_read(ctx->afu->adapter, CXL_PSL_FIR2);
	fir_slice = cxl_p1n_read(ctx->afu, CXL_PSL_FIR_SLICE_An);
	afu_debug = cxl_p1n_read(ctx->afu, CXL_AFU_DEBUG_An);

	dev_crit(&ctx->afu->dev, "PSL_FIR1: 0x%016llx\n", fir1);
	dev_crit(&ctx->afu->dev, "PSL_FIR2: 0x%016llx\n", fir2);
	if (ctx->afu->adapter->native->sl_ops->register_serr_irq) {
		serr = cxl_p1n_read(ctx->afu, CXL_PSL_SERR_An);
		cxl_afu_decode_psl_serr(ctx->afu, serr);
	}
	dev_crit(&ctx->afu->dev, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice);
	dev_crit(&ctx->afu->dev, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug);
}
static irqreturn_t native_handle_psl_slice_error(struct cxl_context *ctx,
						 u64 dsisr, u64 errstat)
{
	dev_crit(&ctx->afu->dev, "PSL ERROR STATUS: 0x%016llx\n", errstat);

	if (ctx->afu->adapter->native->sl_ops->psl_irq_dump_registers)
		ctx->afu->adapter->native->sl_ops->psl_irq_dump_registers(ctx);

	if (ctx->afu->adapter->native->sl_ops->debugfs_stop_trace) {
		dev_crit(&ctx->afu->dev, "STOPPING CXL TRACE\n");
		ctx->afu->adapter->native->sl_ops->debugfs_stop_trace(ctx->afu->adapter);
	}

	return cxl_ops->ack_irq(ctx, 0, errstat);
}

static bool cxl_is_translation_fault(struct cxl_afu *afu, u64 dsisr)
{
	if ((cxl_is_power8()) && (dsisr & CXL_PSL_DSISR_TRANS))
		return true;

	if ((cxl_is_power9()) && (dsisr & CXL_PSL9_DSISR_An_TF))
		return true;

	return false;
}
irqreturn_t cxl_fail_irq_psl(struct cxl_afu *afu, struct cxl_irq_info *irq_info)
{
	if (cxl_is_translation_fault(afu, irq_info->dsisr))
		cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE);
	else
		cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A);

	return IRQ_HANDLED;
}
static irqreturn_t native_irq_multiplexed(int irq, void *data)
{
	struct cxl_afu *afu = data;
	struct cxl_context *ctx;
	struct cxl_irq_info irq_info;
	u64 phreg = cxl_p2n_read(afu, CXL_PSL_PEHandle_An);
	int ph, ret = IRQ_HANDLED, res;

	/* check if eeh kicked in while the interrupt was in flight */
	if (unlikely(phreg == ~0ULL)) {
		dev_warn(&afu->dev,
			 "Ignoring slice interrupt(%d) due to fenced card",
			 irq);
		return IRQ_HANDLED;
	}
	/* Mask the pe-handle from register value */
	ph = phreg & 0xffff;
	if ((res = native_get_irq_info(afu, &irq_info))) {
		WARN(1, "Unable to get CXL IRQ Info: %i\n", res);
		if (afu->adapter->native->sl_ops->fail_irq)
			return afu->adapter->native->sl_ops->fail_irq(afu, &irq_info);
		return ret;
	}

	rcu_read_lock();
	ctx = idr_find(&afu->contexts_idr, ph);
	if (ctx) {
		if (afu->adapter->native->sl_ops->handle_interrupt)
			ret = afu->adapter->native->sl_ops->handle_interrupt(irq, ctx, &irq_info);
		rcu_read_unlock();
		return ret;
	}
	rcu_read_unlock();

	WARN(1, "Unable to demultiplex CXL PSL IRQ for PE %i DSISR %016llx DAR"
		" %016llx\n(Possible AFU HW issue - was a term/remove acked"
		" with outstanding transactions?)\n", ph, irq_info.dsisr,
		irq_info.dar);
	if (afu->adapter->native->sl_ops->fail_irq)
		ret = afu->adapter->native->sl_ops->fail_irq(afu, &irq_info);
	return ret;
}
static void native_irq_wait(struct cxl_context *ctx)
{
	u64 dsisr;
	int timeout = 1000;
	int ph;

	/*
	 * Wait until no further interrupts are presented by the PSL
	 * for this context.
	 */
	while (timeout--) {
		ph = cxl_p2n_read(ctx->afu, CXL_PSL_PEHandle_An) & 0xffff;
		if (ph != ctx->pe)
			return;
		dsisr = cxl_p2n_read(ctx->afu, CXL_PSL_DSISR_An);
		if (cxl_is_power8() &&
		    ((dsisr & CXL_PSL_DSISR_PENDING) == 0))
			return;
		if (cxl_is_power9() &&
		    ((dsisr & CXL_PSL9_DSISR_PENDING) == 0))
			return;
		/*
		 * We are waiting for the workqueue to process our
		 * irq, so need to let that run here.
		 */
		msleep(1);
	}

	dev_warn(&ctx->afu->dev, "WARNING: waiting on DSI for PE %i"
		 " DSISR %016llx!\n", ph, dsisr);
	return;
}
static irqreturn_t native_slice_irq_err(int irq, void *data)
{
	struct cxl_afu *afu = data;
	u64 errstat, serr, afu_error, dsisr;
	u64 fir_slice, afu_debug, irq_mask;

	/*
	 * slice err interrupt is only used with full PSL (no XSL)
	 */
	serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
	errstat = cxl_p2n_read(afu, CXL_PSL_ErrStat_An);
	afu_error = cxl_p2n_read(afu, CXL_AFU_ERR_An);
	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	cxl_afu_decode_psl_serr(afu, serr);

	if (cxl_is_power8()) {
		fir_slice = cxl_p1n_read(afu, CXL_PSL_FIR_SLICE_An);
		afu_debug = cxl_p1n_read(afu, CXL_AFU_DEBUG_An);
		dev_crit(&afu->dev, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice);
		dev_crit(&afu->dev, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug);
	}
	dev_crit(&afu->dev, "CXL_PSL_ErrStat_An: 0x%016llx\n", errstat);
	dev_crit(&afu->dev, "AFU_ERR_An: 0x%.16llx\n", afu_error);
	dev_crit(&afu->dev, "PSL_DSISR_An: 0x%.16llx\n", dsisr);

	/* mask off the IRQ so it won't retrigger until the AFU is reset */
	irq_mask = (serr & CXL_PSL_SERR_An_IRQS) >> 32;
	serr |= irq_mask;
	cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);
	dev_info(&afu->dev, "Further such interrupts will be masked until the AFU is reset\n");

	return IRQ_HANDLED;
}
void cxl_native_err_irq_dump_regs_psl9(struct cxl *adapter)
{
	u64 fir1;

	fir1 = cxl_p1_read(adapter, CXL_PSL9_FIR1);
	dev_crit(&adapter->dev, "PSL_FIR: 0x%016llx\n", fir1);
}

void cxl_native_err_irq_dump_regs_psl8(struct cxl *adapter)
{
	u64 fir1, fir2;

	fir1 = cxl_p1_read(adapter, CXL_PSL_FIR1);
	fir2 = cxl_p1_read(adapter, CXL_PSL_FIR2);
	dev_crit(&adapter->dev,
		 "PSL_FIR1: 0x%016llx\nPSL_FIR2: 0x%016llx\n",
		 fir1, fir2);
}
static irqreturn_t native_irq_err(int irq, void *data)
{
	struct cxl *adapter = data;
	u64 err_ivte;

	WARN(1, "CXL ERROR interrupt %i\n", irq);

	err_ivte = cxl_p1_read(adapter, CXL_PSL_ErrIVTE);
	dev_crit(&adapter->dev, "PSL_ErrIVTE: 0x%016llx\n", err_ivte);

	if (adapter->native->sl_ops->debugfs_stop_trace) {
		dev_crit(&adapter->dev, "STOPPING CXL TRACE\n");
		adapter->native->sl_ops->debugfs_stop_trace(adapter);
	}

	if (adapter->native->sl_ops->err_irq_dump_registers)
		adapter->native->sl_ops->err_irq_dump_registers(adapter);

	return IRQ_HANDLED;
}
int cxl_native_register_psl_err_irq(struct cxl *adapter)
{
	int rc;

	adapter->irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
				      dev_name(&adapter->dev));
	if (!adapter->irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(adapter, native_irq_err, adapter,
				       &adapter->native->err_hwirq,
				       &adapter->native->err_virq,
				       adapter->irq_name))) {
		kfree(adapter->irq_name);
		adapter->irq_name = NULL;
		return rc;
	}

	cxl_p1_write(adapter, CXL_PSL_ErrIVTE, adapter->native->err_hwirq & 0xffff);

	return 0;
}
void cxl_native_release_psl_err_irq(struct cxl *adapter)
{
	if (adapter->native->err_virq == 0 ||
	    adapter->native->err_virq !=
	    irq_find_mapping(NULL, adapter->native->err_hwirq))
		return;

	cxl_p1_write(adapter, CXL_PSL_ErrIVTE, 0x0000000000000000);
	cxl_unmap_irq(adapter->native->err_virq, adapter);
	cxl_ops->release_one_irq(adapter, adapter->native->err_hwirq);
	kfree(adapter->irq_name);
	adapter->native->err_virq = 0;
}
int cxl_native_register_serr_irq(struct cxl_afu *afu)
{
	u64 serr;
	int rc;

	afu->err_irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
				      dev_name(&afu->dev));
	if (!afu->err_irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(afu->adapter, native_slice_irq_err, afu,
				       &afu->serr_hwirq,
				       &afu->serr_virq, afu->err_irq_name))) {
		kfree(afu->err_irq_name);
		afu->err_irq_name = NULL;
		return rc;
	}

	serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
	if (cxl_is_power8())
		serr = (serr & 0x00ffffffffff0000ULL) | (afu->serr_hwirq & 0xffff);
	if (cxl_is_power9()) {
		/*
		 * By default, all errors are masked. So don't set all masks.
		 * Slice errors will be transferred.
		 */
		serr = (serr & ~0xff0000007fffffffULL) | (afu->serr_hwirq & 0xffff);
	}
	cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);

	return 0;
}
void cxl_native_release_serr_irq(struct cxl_afu *afu)
{
	if (afu->serr_virq == 0 ||
	    afu->serr_virq != irq_find_mapping(NULL, afu->serr_hwirq))
		return;

	cxl_p1n_write(afu, CXL_PSL_SERR_An, 0x0000000000000000);
	cxl_unmap_irq(afu->serr_virq, afu);
	cxl_ops->release_one_irq(afu->adapter, afu->serr_hwirq);
	kfree(afu->err_irq_name);
	afu->serr_virq = 0;
}
int cxl_native_register_psl_irq(struct cxl_afu *afu)
{
	int rc;

	afu->psl_irq_name = kasprintf(GFP_KERNEL, "cxl-%s",
				      dev_name(&afu->dev));
	if (!afu->psl_irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(afu->adapter, native_irq_multiplexed,
				       afu, &afu->native->psl_hwirq, &afu->native->psl_virq,
				       afu->psl_irq_name))) {
		kfree(afu->psl_irq_name);
		afu->psl_irq_name = NULL;
	}
	return rc;
}

void cxl_native_release_psl_irq(struct cxl_afu *afu)
{
	if (afu->native->psl_virq == 0 ||
	    afu->native->psl_virq !=
	    irq_find_mapping(NULL, afu->native->psl_hwirq))
		return;

	cxl_unmap_irq(afu->native->psl_virq, afu);
	cxl_ops->release_one_irq(afu->adapter, afu->native->psl_hwirq);
	kfree(afu->psl_irq_name);
	afu->native->psl_virq = 0;
}
static void recover_psl_err(struct cxl_afu *afu, u64 errstat)
{
	u64 dsisr;

	pr_devel("RECOVERING FROM PSL ERROR... (0x%016llx)\n", errstat);

	/* Clear PSL_DSISR[PE] */
	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	cxl_p2n_write(afu, CXL_PSL_DSISR_An, dsisr & ~CXL_PSL_DSISR_An_PE);

	/* Write 1s to clear error status bits */
	cxl_p2n_write(afu, CXL_PSL_ErrStat_An, errstat);
}

static int native_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
{
	trace_cxl_psl_irq_ack(ctx, tfc);
	if (tfc)
		cxl_p2n_write(ctx->afu, CXL_PSL_TFC_An, tfc);
	if (psl_reset_mask)
		recover_psl_err(ctx->afu, psl_reset_mask);

	return 0;
}
int cxl_check_error(struct cxl_afu *afu)
{
	return (cxl_p1n_read(afu, CXL_PSL_SCNTL_An) == ~0ULL);
}
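
/*
 * An all-ones MMIO read is the usual signature of a fenced or removed
 * adapter (see the phreg == ~0ULL check in native_irq_multiplexed() above),
 * which is why ~0ULL is treated as the error indicator here.
 */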
static bool native_support_attributes(const char *attr_name,
				      enum cxl_attrs type)
{
	return true;
}
static int native_afu_cr_read64(struct cxl_afu *afu, int cr, u64 off, u64 *out)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	*out = in_le64(afu->native->afu_desc_mmio + afu->crs_offset +
		       (cr * afu->crs_len) + off);
	return 0;
}

static int native_afu_cr_read32(struct cxl_afu *afu, int cr, u64 off, u32 *out)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	*out = in_le32(afu->native->afu_desc_mmio + afu->crs_offset +
		       (cr * afu->crs_len) + off);
	return 0;
}

static int native_afu_cr_read16(struct cxl_afu *afu, int cr, u64 off, u16 *out)
{
	u64 aligned_off = off & ~0x3L;
	u32 val;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val);
	if (!rc)
		*out = (val >> ((off & 0x3) * 8)) & 0xffff;
	return rc;
}
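
/*
 * Worked example of the sub-word extraction above (illustrative only): for
 * off = 0x6, aligned_off = 0x4 and the shift is (0x6 & 0x3) * 8 = 16, so the
 * 16-bit value comes from bits 31:16 of the 32-bit word read at offset 0x4.
 * native_afu_cr_read8() below uses the same scheme with an 8-bit mask.
 */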
static int native_afu_cr_read8(struct cxl_afu *afu, int cr, u64 off, u8 *out)
{
	u64 aligned_off = off & ~0x3L;
	u32 val;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val);
	if (!rc)
		*out = (val >> ((off & 0x3) * 8)) & 0xff;
	return rc;
}

static int native_afu_cr_write32(struct cxl_afu *afu, int cr, u64 off, u32 in)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	out_le32(afu->native->afu_desc_mmio + afu->crs_offset +
		 (cr * afu->crs_len) + off, in);
	return 0;
}
static int native_afu_cr_write16(struct cxl_afu *afu, int cr, u64 off, u16 in)
{
	u64 aligned_off = off & ~0x3L;
	u32 val32, mask, shift;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val32);
	if (rc)
		return rc;
	shift = (off & 0x3) * 8;
	WARN_ON(shift == 24);
	mask = 0xffff << shift;
	val32 = (val32 & ~mask) | (in << shift);

	rc = native_afu_cr_write32(afu, cr, aligned_off, val32);
	return rc;
}
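
/*
 * Worked example of the read-modify-write above (illustrative only): for
 * off = 0x2, shift = 16 and mask = 0xffff0000, so the new word is
 * (val32 & 0x0000ffff) | (in << 16), leaving the low half-word untouched.
 * A 16-bit write with off & 0x3 == 3 would straddle the 32-bit word, hence
 * the WARN_ON(shift == 24).
 */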
static int native_afu_cr_write8(struct cxl_afu *afu, int cr, u64 off, u8 in)
{
	u64 aligned_off = off & ~0x3L;
	u32 val32, mask, shift;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val32);
	if (rc)
		return rc;
	shift = (off & 0x3) * 8;
	mask = 0xff << shift;
	val32 = (val32 & ~mask) | (in << shift);

	rc = native_afu_cr_write32(afu, cr, aligned_off, val32);
	return rc;
}
const struct cxl_backend_ops cxl_native_ops = {
	.module = THIS_MODULE,
	.adapter_reset = cxl_pci_reset,
	.alloc_one_irq = cxl_pci_alloc_one_irq,
	.release_one_irq = cxl_pci_release_one_irq,
	.alloc_irq_ranges = cxl_pci_alloc_irq_ranges,
	.release_irq_ranges = cxl_pci_release_irq_ranges,
	.setup_irq = cxl_pci_setup_irq,
	.handle_psl_slice_error = native_handle_psl_slice_error,
	.psl_interrupt = NULL,
	.ack_irq = native_ack_irq,
	.irq_wait = native_irq_wait,
	.attach_process = native_attach_process,
	.detach_process = native_detach_process,
	.update_ivtes = native_update_ivtes,
	.support_attributes = native_support_attributes,
	.link_ok = cxl_adapter_link_ok,
	.release_afu = cxl_pci_release_afu,
	.afu_read_err_buffer = cxl_pci_afu_read_err_buffer,
	.afu_check_and_enable = native_afu_check_and_enable,
	.afu_activate_mode = native_afu_activate_mode,
	.afu_deactivate_mode = native_afu_deactivate_mode,
	.afu_reset = native_afu_reset,
	.afu_cr_read8 = native_afu_cr_read8,
	.afu_cr_read16 = native_afu_cr_read16,
	.afu_cr_read32 = native_afu_cr_read32,
	.afu_cr_read64 = native_afu_cr_read64,
	.afu_cr_write8 = native_afu_cr_write8,
	.afu_cr_write16 = native_afu_cr_write16,
	.afu_cr_write32 = native_afu_cr_write32,
	.read_adapter_vpd = cxl_pci_read_adapter_vpd,
};