2 * Copyright 2014 IBM Corp.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation; either version
7 * 2 of the License, or (at your option) any later version.
10 #include <linux/spinlock.h>
11 #include <linux/sched.h>
12 #include <linux/sched/clock.h>
13 #include <linux/slab.h>
14 #include <linux/mutex.h>
16 #include <linux/uaccess.h>
17 #include <linux/delay.h>
18 #include <asm/synch.h>
19 #include <asm/switch_to.h>
20 #include <misc/cxl-base.h>
25 static int afu_control(struct cxl_afu
*afu
, u64 command
, u64 clear
,
26 u64 result
, u64 mask
, bool enabled
)
29 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
32 spin_lock(&afu
->afu_cntl_lock
);
33 pr_devel("AFU command starting: %llx\n", command
);
35 trace_cxl_afu_ctrl(afu
, command
);
37 AFU_Cntl
= cxl_p2n_read(afu
, CXL_AFU_Cntl_An
);
38 cxl_p2n_write(afu
, CXL_AFU_Cntl_An
, (AFU_Cntl
& ~clear
) | command
);
40 AFU_Cntl
= cxl_p2n_read(afu
, CXL_AFU_Cntl_An
);
41 while ((AFU_Cntl
& mask
) != result
) {
42 if (time_after_eq(jiffies
, timeout
)) {
43 dev_warn(&afu
->dev
, "WARNING: AFU control timed out!\n");
48 if (!cxl_ops
->link_ok(afu
->adapter
, afu
)) {
49 afu
->enabled
= enabled
;
54 pr_devel_ratelimited("AFU control... (0x%016llx)\n",
57 AFU_Cntl
= cxl_p2n_read(afu
, CXL_AFU_Cntl_An
);
60 if (AFU_Cntl
& CXL_AFU_Cntl_An_RA
) {
62 * Workaround for a bug in the XSL used in the Mellanox CX4
63 * that fails to clear the RA bit after an AFU reset,
64 * preventing subsequent AFU resets from working.
66 cxl_p2n_write(afu
, CXL_AFU_Cntl_An
, AFU_Cntl
& ~CXL_AFU_Cntl_An_RA
);
69 pr_devel("AFU command complete: %llx\n", command
);
70 afu
->enabled
= enabled
;
72 trace_cxl_afu_ctrl_done(afu
, command
, rc
);
73 spin_unlock(&afu
->afu_cntl_lock
);
78 static int afu_enable(struct cxl_afu
*afu
)
80 pr_devel("AFU enable request\n");
82 return afu_control(afu
, CXL_AFU_Cntl_An_E
, 0,
83 CXL_AFU_Cntl_An_ES_Enabled
,
84 CXL_AFU_Cntl_An_ES_MASK
, true);
87 int cxl_afu_disable(struct cxl_afu
*afu
)
89 pr_devel("AFU disable request\n");
91 return afu_control(afu
, 0, CXL_AFU_Cntl_An_E
,
92 CXL_AFU_Cntl_An_ES_Disabled
,
93 CXL_AFU_Cntl_An_ES_MASK
, false);
96 /* This will disable as well as reset */
97 static int native_afu_reset(struct cxl_afu
*afu
)
102 pr_devel("AFU reset request\n");
104 rc
= afu_control(afu
, CXL_AFU_Cntl_An_RA
, 0,
105 CXL_AFU_Cntl_An_RS_Complete
| CXL_AFU_Cntl_An_ES_Disabled
,
106 CXL_AFU_Cntl_An_RS_MASK
| CXL_AFU_Cntl_An_ES_MASK
,
110 * Re-enable any masked interrupts when the AFU is not
111 * activated to avoid side effects after attaching a process
114 if (afu
->current_mode
== 0) {
115 serr
= cxl_p1n_read(afu
, CXL_PSL_SERR_An
);
116 serr
&= ~CXL_PSL_SERR_An_IRQ_MASKS
;
117 cxl_p1n_write(afu
, CXL_PSL_SERR_An
, serr
);
123 static int native_afu_check_and_enable(struct cxl_afu
*afu
)
125 if (!cxl_ops
->link_ok(afu
->adapter
, afu
)) {
126 WARN(1, "Refusing to enable afu while link down!\n");
131 return afu_enable(afu
);
134 int cxl_psl_purge(struct cxl_afu
*afu
)
136 u64 PSL_CNTL
= cxl_p1n_read(afu
, CXL_PSL_SCNTL_An
);
137 u64 AFU_Cntl
= cxl_p2n_read(afu
, CXL_AFU_Cntl_An
);
140 u64 trans_fault
= 0x0ULL
;
141 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
144 trace_cxl_psl_ctrl(afu
, CXL_PSL_SCNTL_An_Pc
);
146 pr_devel("PSL purge request\n");
149 trans_fault
= CXL_PSL_DSISR_TRANS
;
151 trans_fault
= CXL_PSL9_DSISR_An_TF
;
153 if (!cxl_ops
->link_ok(afu
->adapter
, afu
)) {
154 dev_warn(&afu
->dev
, "PSL Purge called with link down, ignoring\n");
159 if ((AFU_Cntl
& CXL_AFU_Cntl_An_ES_MASK
) != CXL_AFU_Cntl_An_ES_Disabled
) {
160 WARN(1, "psl_purge request while AFU not disabled!\n");
161 cxl_afu_disable(afu
);
164 cxl_p1n_write(afu
, CXL_PSL_SCNTL_An
,
165 PSL_CNTL
| CXL_PSL_SCNTL_An_Pc
);
166 start
= local_clock();
167 PSL_CNTL
= cxl_p1n_read(afu
, CXL_PSL_SCNTL_An
);
168 while ((PSL_CNTL
& CXL_PSL_SCNTL_An_Ps_MASK
)
169 == CXL_PSL_SCNTL_An_Ps_Pending
) {
170 if (time_after_eq(jiffies
, timeout
)) {
171 dev_warn(&afu
->dev
, "WARNING: PSL Purge timed out!\n");
175 if (!cxl_ops
->link_ok(afu
->adapter
, afu
)) {
180 dsisr
= cxl_p2n_read(afu
, CXL_PSL_DSISR_An
);
181 pr_devel_ratelimited("PSL purging... PSL_CNTL: 0x%016llx PSL_DSISR: 0x%016llx\n",
184 if (dsisr
& trans_fault
) {
185 dar
= cxl_p2n_read(afu
, CXL_PSL_DAR_An
);
186 dev_notice(&afu
->dev
, "PSL purge terminating pending translation, DSISR: 0x%016llx, DAR: 0x%016llx\n",
188 cxl_p2n_write(afu
, CXL_PSL_TFC_An
, CXL_PSL_TFC_An_AE
);
190 dev_notice(&afu
->dev
, "PSL purge acknowledging pending non-translation fault, DSISR: 0x%016llx\n",
192 cxl_p2n_write(afu
, CXL_PSL_TFC_An
, CXL_PSL_TFC_An_A
);
196 PSL_CNTL
= cxl_p1n_read(afu
, CXL_PSL_SCNTL_An
);
199 pr_devel("PSL purged in %lld ns\n", end
- start
);
201 cxl_p1n_write(afu
, CXL_PSL_SCNTL_An
,
202 PSL_CNTL
& ~CXL_PSL_SCNTL_An_Pc
);
204 trace_cxl_psl_ctrl_done(afu
, CXL_PSL_SCNTL_An_Pc
, rc
);
208 static int spa_max_procs(int spa_size
)
212 * end_of_SPA_area = SPA_Base + ((n+4) * 128) + (( ((n*8) + 127) >> 7) * 128) + 255
213 * Most of that junk is really just an overly-complicated way of saying
214 * the last 256 bytes are __aligned(128), so it's really:
215 * end_of_SPA_area = end_of_PSL_queue_area + __aligned(128) 255
217 * end_of_PSL_queue_area = SPA_Base + ((n+4) * 128) + (n*8) - 1
219 * sizeof(SPA) = ((n+4) * 128) + (n*8) + __aligned(128) 256
220 * Ignore the alignment (which is safe in this case as long as we are
221 * careful with our rounding) and solve for n:
223 return ((spa_size
/ 8) - 96) / 17;
226 static int cxl_alloc_spa(struct cxl_afu
*afu
, int mode
)
230 /* Work out how many pages to allocate */
231 afu
->native
->spa_order
= -1;
233 afu
->native
->spa_order
++;
234 spa_size
= (1 << afu
->native
->spa_order
) * PAGE_SIZE
;
236 if (spa_size
> 0x100000) {
237 dev_warn(&afu
->dev
, "num_of_processes too large for the SPA, limiting to %i (0x%x)\n",
238 afu
->native
->spa_max_procs
, afu
->native
->spa_size
);
239 if (mode
!= CXL_MODE_DEDICATED
)
240 afu
->num_procs
= afu
->native
->spa_max_procs
;
244 afu
->native
->spa_size
= spa_size
;
245 afu
->native
->spa_max_procs
= spa_max_procs(afu
->native
->spa_size
);
246 } while (afu
->native
->spa_max_procs
< afu
->num_procs
);
248 if (!(afu
->native
->spa
= (struct cxl_process_element
*)
249 __get_free_pages(GFP_KERNEL
| __GFP_ZERO
, afu
->native
->spa_order
))) {
250 pr_err("cxl_alloc_spa: Unable to allocate scheduled process area\n");
253 pr_devel("spa pages: %i afu->spa_max_procs: %i afu->num_procs: %i\n",
254 1<<afu
->native
->spa_order
, afu
->native
->spa_max_procs
, afu
->num_procs
);
259 static void attach_spa(struct cxl_afu
*afu
)
263 afu
->native
->sw_command_status
= (__be64
*)((char *)afu
->native
->spa
+
264 ((afu
->native
->spa_max_procs
+ 3) * 128));
266 spap
= virt_to_phys(afu
->native
->spa
) & CXL_PSL_SPAP_Addr
;
267 spap
|= ((afu
->native
->spa_size
>> (12 - CXL_PSL_SPAP_Size_Shift
)) - 1) & CXL_PSL_SPAP_Size
;
268 spap
|= CXL_PSL_SPAP_V
;
269 pr_devel("cxl: SPA allocated at 0x%p. Max processes: %i, sw_command_status: 0x%p CXL_PSL_SPAP_An=0x%016llx\n",
270 afu
->native
->spa
, afu
->native
->spa_max_procs
,
271 afu
->native
->sw_command_status
, spap
);
272 cxl_p1n_write(afu
, CXL_PSL_SPAP_An
, spap
);
275 static inline void detach_spa(struct cxl_afu
*afu
)
277 cxl_p1n_write(afu
, CXL_PSL_SPAP_An
, 0);
280 void cxl_release_spa(struct cxl_afu
*afu
)
282 if (afu
->native
->spa
) {
283 free_pages((unsigned long) afu
->native
->spa
,
284 afu
->native
->spa_order
);
285 afu
->native
->spa
= NULL
;
290 * Invalidation of all ERAT entries is no longer required by CAIA2. Use
293 int cxl_invalidate_all_psl9(struct cxl
*adapter
)
295 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
298 pr_devel("CXL adapter - invalidation of all ERAT entries\n");
300 /* Invalidates all ERAT entries for Radix or HPT */
301 ierat
= CXL_XSL9_IERAT_IALL
;
303 ierat
|= CXL_XSL9_IERAT_INVR
;
304 cxl_p1_write(adapter
, CXL_XSL9_IERAT
, ierat
);
306 while (cxl_p1_read(adapter
, CXL_XSL9_IERAT
) & CXL_XSL9_IERAT_IINPROG
) {
307 if (time_after_eq(jiffies
, timeout
)) {
308 dev_warn(&adapter
->dev
,
309 "WARNING: CXL adapter invalidation of all ERAT entries timed out!\n");
312 if (!cxl_ops
->link_ok(adapter
, NULL
))
319 int cxl_invalidate_all_psl8(struct cxl
*adapter
)
321 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
323 pr_devel("CXL adapter wide TLBIA & SLBIA\n");
325 cxl_p1_write(adapter
, CXL_PSL_AFUSEL
, CXL_PSL_AFUSEL_A
);
327 cxl_p1_write(adapter
, CXL_PSL_TLBIA
, CXL_TLB_SLB_IQ_ALL
);
328 while (cxl_p1_read(adapter
, CXL_PSL_TLBIA
) & CXL_TLB_SLB_P
) {
329 if (time_after_eq(jiffies
, timeout
)) {
330 dev_warn(&adapter
->dev
, "WARNING: CXL adapter wide TLBIA timed out!\n");
333 if (!cxl_ops
->link_ok(adapter
, NULL
))
338 cxl_p1_write(adapter
, CXL_PSL_SLBIA
, CXL_TLB_SLB_IQ_ALL
);
339 while (cxl_p1_read(adapter
, CXL_PSL_SLBIA
) & CXL_TLB_SLB_P
) {
340 if (time_after_eq(jiffies
, timeout
)) {
341 dev_warn(&adapter
->dev
, "WARNING: CXL adapter wide SLBIA timed out!\n");
344 if (!cxl_ops
->link_ok(adapter
, NULL
))
351 int cxl_data_cache_flush(struct cxl
*adapter
)
354 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
357 * Do a datacache flush only if datacache is available.
358 * In case of PSL9D datacache absent hence flush operation.
361 if (adapter
->native
->no_data_cache
) {
362 pr_devel("No PSL data cache. Ignoring cache flush req.\n");
366 pr_devel("Flushing data cache\n");
367 reg
= cxl_p1_read(adapter
, CXL_PSL_Control
);
368 reg
|= CXL_PSL_Control_Fr
;
369 cxl_p1_write(adapter
, CXL_PSL_Control
, reg
);
371 reg
= cxl_p1_read(adapter
, CXL_PSL_Control
);
372 while ((reg
& CXL_PSL_Control_Fs_MASK
) != CXL_PSL_Control_Fs_Complete
) {
373 if (time_after_eq(jiffies
, timeout
)) {
374 dev_warn(&adapter
->dev
, "WARNING: cache flush timed out!\n");
378 if (!cxl_ops
->link_ok(adapter
, NULL
)) {
379 dev_warn(&adapter
->dev
, "WARNING: link down when flushing cache\n");
383 reg
= cxl_p1_read(adapter
, CXL_PSL_Control
);
386 reg
&= ~CXL_PSL_Control_Fr
;
387 cxl_p1_write(adapter
, CXL_PSL_Control
, reg
);
391 static int cxl_write_sstp(struct cxl_afu
*afu
, u64 sstp0
, u64 sstp1
)
395 /* 1. Disable SSTP by writing 0 to SSTP1[V] */
396 cxl_p2n_write(afu
, CXL_SSTP1_An
, 0);
398 /* 2. Invalidate all SLB entries */
399 if ((rc
= cxl_afu_slbia(afu
)))
402 /* 3. Set SSTP0_An */
403 cxl_p2n_write(afu
, CXL_SSTP0_An
, sstp0
);
405 /* 4. Set SSTP1_An */
406 cxl_p2n_write(afu
, CXL_SSTP1_An
, sstp1
);
411 /* Using per slice version may improve performance here. (ie. SLBIA_An) */
412 static void slb_invalid(struct cxl_context
*ctx
)
414 struct cxl
*adapter
= ctx
->afu
->adapter
;
417 WARN_ON(!mutex_is_locked(&ctx
->afu
->native
->spa_mutex
));
419 cxl_p1_write(adapter
, CXL_PSL_LBISEL
,
420 ((u64
)be32_to_cpu(ctx
->elem
->common
.pid
) << 32) |
421 be32_to_cpu(ctx
->elem
->lpid
));
422 cxl_p1_write(adapter
, CXL_PSL_SLBIA
, CXL_TLB_SLB_IQ_LPIDPID
);
425 if (!cxl_ops
->link_ok(adapter
, NULL
))
427 slbia
= cxl_p1_read(adapter
, CXL_PSL_SLBIA
);
428 if (!(slbia
& CXL_TLB_SLB_P
))
434 static int do_process_element_cmd(struct cxl_context
*ctx
,
435 u64 cmd
, u64 pe_state
)
438 unsigned long timeout
= jiffies
+ (HZ
* CXL_TIMEOUT
);
441 trace_cxl_llcmd(ctx
, cmd
);
443 WARN_ON(!ctx
->afu
->enabled
);
445 ctx
->elem
->software_state
= cpu_to_be32(pe_state
);
447 *(ctx
->afu
->native
->sw_command_status
) = cpu_to_be64(cmd
| 0 | ctx
->pe
);
449 cxl_p1n_write(ctx
->afu
, CXL_PSL_LLCMD_An
, cmd
| ctx
->pe
);
451 if (time_after_eq(jiffies
, timeout
)) {
452 dev_warn(&ctx
->afu
->dev
, "WARNING: Process Element Command timed out!\n");
456 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
)) {
457 dev_warn(&ctx
->afu
->dev
, "WARNING: Device link down, aborting Process Element Command!\n");
461 state
= be64_to_cpup(ctx
->afu
->native
->sw_command_status
);
462 if (state
== ~0ULL) {
463 pr_err("cxl: Error adding process element to AFU\n");
467 if ((state
& (CXL_SPA_SW_CMD_MASK
| CXL_SPA_SW_STATE_MASK
| CXL_SPA_SW_LINK_MASK
)) ==
468 (cmd
| (cmd
>> 16) | ctx
->pe
))
471 * The command won't finish in the PSL if there are
472 * outstanding DSIs. Hence we need to yield here in
473 * case there are outstanding DSIs that we need to
474 * service. Tuning possiblity: we could wait for a
481 trace_cxl_llcmd_done(ctx
, cmd
, rc
);
485 static int add_process_element(struct cxl_context
*ctx
)
489 mutex_lock(&ctx
->afu
->native
->spa_mutex
);
490 pr_devel("%s Adding pe: %i started\n", __func__
, ctx
->pe
);
491 if (!(rc
= do_process_element_cmd(ctx
, CXL_SPA_SW_CMD_ADD
, CXL_PE_SOFTWARE_STATE_V
)))
492 ctx
->pe_inserted
= true;
493 pr_devel("%s Adding pe: %i finished\n", __func__
, ctx
->pe
);
494 mutex_unlock(&ctx
->afu
->native
->spa_mutex
);
498 static int terminate_process_element(struct cxl_context
*ctx
)
502 /* fast path terminate if it's already invalid */
503 if (!(ctx
->elem
->software_state
& cpu_to_be32(CXL_PE_SOFTWARE_STATE_V
)))
506 mutex_lock(&ctx
->afu
->native
->spa_mutex
);
507 pr_devel("%s Terminate pe: %i started\n", __func__
, ctx
->pe
);
508 /* We could be asked to terminate when the hw is down. That
509 * should always succeed: it's not running if the hw has gone
510 * away and is being reset.
512 if (cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
))
513 rc
= do_process_element_cmd(ctx
, CXL_SPA_SW_CMD_TERMINATE
,
514 CXL_PE_SOFTWARE_STATE_V
| CXL_PE_SOFTWARE_STATE_T
);
515 ctx
->elem
->software_state
= 0; /* Remove Valid bit */
516 pr_devel("%s Terminate pe: %i finished\n", __func__
, ctx
->pe
);
517 mutex_unlock(&ctx
->afu
->native
->spa_mutex
);
521 static int remove_process_element(struct cxl_context
*ctx
)
525 mutex_lock(&ctx
->afu
->native
->spa_mutex
);
526 pr_devel("%s Remove pe: %i started\n", __func__
, ctx
->pe
);
528 /* We could be asked to remove when the hw is down. Again, if
529 * the hw is down, the PE is gone, so we succeed.
531 if (cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
))
532 rc
= do_process_element_cmd(ctx
, CXL_SPA_SW_CMD_REMOVE
, 0);
535 ctx
->pe_inserted
= false;
538 pr_devel("%s Remove pe: %i finished\n", __func__
, ctx
->pe
);
539 mutex_unlock(&ctx
->afu
->native
->spa_mutex
);
544 void cxl_assign_psn_space(struct cxl_context
*ctx
)
546 if (!ctx
->afu
->pp_size
|| ctx
->master
) {
547 ctx
->psn_phys
= ctx
->afu
->psn_phys
;
548 ctx
->psn_size
= ctx
->afu
->adapter
->ps_size
;
550 ctx
->psn_phys
= ctx
->afu
->psn_phys
+
551 (ctx
->afu
->native
->pp_offset
+ ctx
->afu
->pp_size
* ctx
->pe
);
552 ctx
->psn_size
= ctx
->afu
->pp_size
;
556 static int activate_afu_directed(struct cxl_afu
*afu
)
560 dev_info(&afu
->dev
, "Activating AFU directed mode\n");
562 afu
->num_procs
= afu
->max_procs_virtualised
;
563 if (afu
->native
->spa
== NULL
) {
564 if (cxl_alloc_spa(afu
, CXL_MODE_DIRECTED
))
569 cxl_p1n_write(afu
, CXL_PSL_SCNTL_An
, CXL_PSL_SCNTL_An_PM_AFU
);
571 cxl_p1n_write(afu
, CXL_PSL_AMOR_An
, 0xFFFFFFFFFFFFFFFFULL
);
572 cxl_p1n_write(afu
, CXL_PSL_ID_An
, CXL_PSL_ID_An_F
| CXL_PSL_ID_An_L
);
574 afu
->current_mode
= CXL_MODE_DIRECTED
;
576 if ((rc
= cxl_chardev_m_afu_add(afu
)))
579 if ((rc
= cxl_sysfs_afu_m_add(afu
)))
582 if ((rc
= cxl_chardev_s_afu_add(afu
)))
587 cxl_sysfs_afu_m_remove(afu
);
589 cxl_chardev_afu_remove(afu
);
593 #ifdef CONFIG_CPU_LITTLE_ENDIAN
594 #define set_endian(sr) ((sr) |= CXL_PSL_SR_An_LE)
596 #define set_endian(sr) ((sr) &= ~(CXL_PSL_SR_An_LE))
599 u64
cxl_calculate_sr(bool master
, bool kernel
, bool real_mode
, bool p9
)
605 sr
|= CXL_PSL_SR_An_MP
;
606 if (mfspr(SPRN_LPCR
) & LPCR_TC
)
607 sr
|= CXL_PSL_SR_An_TC
;
611 sr
|= CXL_PSL_SR_An_R
;
612 sr
|= (mfmsr() & MSR_SF
) | CXL_PSL_SR_An_HV
;
614 sr
|= CXL_PSL_SR_An_PR
| CXL_PSL_SR_An_R
;
616 sr
|= CXL_PSL_SR_An_HV
;
618 sr
&= ~(CXL_PSL_SR_An_HV
);
619 if (!test_tsk_thread_flag(current
, TIF_32BIT
))
620 sr
|= CXL_PSL_SR_An_SF
;
624 sr
|= CXL_PSL_SR_An_XLAT_ror
;
626 sr
|= CXL_PSL_SR_An_XLAT_hpt
;
631 static u64
calculate_sr(struct cxl_context
*ctx
)
633 return cxl_calculate_sr(ctx
->master
, ctx
->kernel
, false,
637 static void update_ivtes_directed(struct cxl_context
*ctx
)
639 bool need_update
= (ctx
->status
== STARTED
);
643 WARN_ON(terminate_process_element(ctx
));
644 WARN_ON(remove_process_element(ctx
));
647 for (r
= 0; r
< CXL_IRQ_RANGES
; r
++) {
648 ctx
->elem
->ivte_offsets
[r
] = cpu_to_be16(ctx
->irqs
.offset
[r
]);
649 ctx
->elem
->ivte_ranges
[r
] = cpu_to_be16(ctx
->irqs
.range
[r
]);
653 * Theoretically we could use the update llcmd, instead of a
654 * terminate/remove/add (or if an atomic update was required we could
655 * do a suspend/update/resume), however it seems there might be issues
656 * with the update llcmd on some cards (including those using an XSL on
657 * an ASIC) so for now it's safest to go with the commands that are
658 * known to work. In the future if we come across a situation where the
659 * card may be performing transactions using the same PE while we are
660 * doing this update we might need to revisit this.
663 WARN_ON(add_process_element(ctx
));
666 static int process_element_entry_psl9(struct cxl_context
*ctx
, u64 wed
, u64 amr
)
671 cxl_assign_psn_space(ctx
);
673 ctx
->elem
->ctxtime
= 0; /* disable */
674 ctx
->elem
->lpid
= cpu_to_be32(mfspr(SPRN_LPID
));
675 ctx
->elem
->haurp
= 0; /* disable */
680 if (ctx
->mm
== NULL
) {
681 pr_devel("%s: unable to get mm for pe=%d pid=%i\n",
682 __func__
, ctx
->pe
, pid_nr(ctx
->pid
));
685 pid
= ctx
->mm
->context
.id
;
688 /* Assign a unique TIDR (thread id) for the current thread */
689 if (!(ctx
->tidr
) && (ctx
->assign_tidr
)) {
690 rc
= set_thread_tidr(current
);
693 ctx
->tidr
= current
->thread
.tidr
;
694 pr_devel("%s: current tidr: %d\n", __func__
, ctx
->tidr
);
697 ctx
->elem
->common
.tid
= cpu_to_be32(ctx
->tidr
);
698 ctx
->elem
->common
.pid
= cpu_to_be32(pid
);
700 ctx
->elem
->sr
= cpu_to_be64(calculate_sr(ctx
));
702 ctx
->elem
->common
.csrp
= 0; /* disable */
704 cxl_prefault(ctx
, wed
);
707 * Ensure we have the multiplexed PSL interrupt set up to take faults
708 * for kernel contexts that may not have allocated any AFU IRQs at all:
710 if (ctx
->irqs
.range
[0] == 0) {
711 ctx
->irqs
.offset
[0] = ctx
->afu
->native
->psl_hwirq
;
712 ctx
->irqs
.range
[0] = 1;
715 ctx
->elem
->common
.amr
= cpu_to_be64(amr
);
716 ctx
->elem
->common
.wed
= cpu_to_be64(wed
);
721 int cxl_attach_afu_directed_psl9(struct cxl_context
*ctx
, u64 wed
, u64 amr
)
725 /* fill the process element entry */
726 result
= process_element_entry_psl9(ctx
, wed
, amr
);
730 update_ivtes_directed(ctx
);
732 /* first guy needs to enable */
733 result
= cxl_ops
->afu_check_and_enable(ctx
->afu
);
737 return add_process_element(ctx
);
740 int cxl_attach_afu_directed_psl8(struct cxl_context
*ctx
, u64 wed
, u64 amr
)
745 cxl_assign_psn_space(ctx
);
747 ctx
->elem
->ctxtime
= 0; /* disable */
748 ctx
->elem
->lpid
= cpu_to_be32(mfspr(SPRN_LPID
));
749 ctx
->elem
->haurp
= 0; /* disable */
750 ctx
->elem
->u
.sdr
= cpu_to_be64(mfspr(SPRN_SDR1
));
755 ctx
->elem
->common
.tid
= 0;
756 ctx
->elem
->common
.pid
= cpu_to_be32(pid
);
758 ctx
->elem
->sr
= cpu_to_be64(calculate_sr(ctx
));
760 ctx
->elem
->common
.csrp
= 0; /* disable */
761 ctx
->elem
->common
.u
.psl8
.aurp0
= 0; /* disable */
762 ctx
->elem
->common
.u
.psl8
.aurp1
= 0; /* disable */
764 cxl_prefault(ctx
, wed
);
766 ctx
->elem
->common
.u
.psl8
.sstp0
= cpu_to_be64(ctx
->sstp0
);
767 ctx
->elem
->common
.u
.psl8
.sstp1
= cpu_to_be64(ctx
->sstp1
);
770 * Ensure we have the multiplexed PSL interrupt set up to take faults
771 * for kernel contexts that may not have allocated any AFU IRQs at all:
773 if (ctx
->irqs
.range
[0] == 0) {
774 ctx
->irqs
.offset
[0] = ctx
->afu
->native
->psl_hwirq
;
775 ctx
->irqs
.range
[0] = 1;
778 update_ivtes_directed(ctx
);
780 ctx
->elem
->common
.amr
= cpu_to_be64(amr
);
781 ctx
->elem
->common
.wed
= cpu_to_be64(wed
);
783 /* first guy needs to enable */
784 if ((result
= cxl_ops
->afu_check_and_enable(ctx
->afu
)))
787 return add_process_element(ctx
);
790 static int deactivate_afu_directed(struct cxl_afu
*afu
)
792 dev_info(&afu
->dev
, "Deactivating AFU directed mode\n");
794 afu
->current_mode
= 0;
797 cxl_sysfs_afu_m_remove(afu
);
798 cxl_chardev_afu_remove(afu
);
801 * The CAIA section 2.2.1 indicates that the procedure for starting and
802 * stopping an AFU in AFU directed mode is AFU specific, which is not
803 * ideal since this code is generic and with one exception has no
804 * knowledge of the AFU. This is in contrast to the procedure for
805 * disabling a dedicated process AFU, which is documented to just
806 * require a reset. The architecture does indicate that both an AFU
807 * reset and an AFU disable should result in the AFU being disabled and
808 * we do both followed by a PSL purge for safety.
810 * Notably we used to have some issues with the disable sequence on PSL
811 * cards, which is why we ended up using this heavy weight procedure in
812 * the first place, however a bug was discovered that had rendered the
813 * disable operation ineffective, so it is conceivable that was the
814 * sole explanation for those difficulties. Careful regression testing
815 * is recommended if anyone attempts to remove or reorder these
818 * The XSL on the Mellanox CX4 behaves a little differently from the
819 * PSL based cards and will time out an AFU reset if the AFU is still
820 * enabled. That card is special in that we do have a means to identify
821 * it from this code, so in that case we skip the reset and just use a
822 * disable/purge to avoid the timeout and corresponding noise in the
825 if (afu
->adapter
->native
->sl_ops
->needs_reset_before_disable
)
826 cxl_ops
->afu_reset(afu
);
827 cxl_afu_disable(afu
);
833 int cxl_activate_dedicated_process_psl9(struct cxl_afu
*afu
)
835 dev_info(&afu
->dev
, "Activating dedicated process mode\n");
838 * If XSL is set to dedicated mode (Set in PSL_SCNTL reg), the
839 * XSL and AFU are programmed to work with a single context.
840 * The context information should be configured in the SPA area
841 * index 0 (so PSL_SPAP must be configured before enabling the
845 if (afu
->native
->spa
== NULL
) {
846 if (cxl_alloc_spa(afu
, CXL_MODE_DEDICATED
))
851 cxl_p1n_write(afu
, CXL_PSL_SCNTL_An
, CXL_PSL_SCNTL_An_PM_Process
);
852 cxl_p1n_write(afu
, CXL_PSL_ID_An
, CXL_PSL_ID_An_F
| CXL_PSL_ID_An_L
);
854 afu
->current_mode
= CXL_MODE_DEDICATED
;
856 return cxl_chardev_d_afu_add(afu
);
859 int cxl_activate_dedicated_process_psl8(struct cxl_afu
*afu
)
861 dev_info(&afu
->dev
, "Activating dedicated process mode\n");
863 cxl_p1n_write(afu
, CXL_PSL_SCNTL_An
, CXL_PSL_SCNTL_An_PM_Process
);
865 cxl_p1n_write(afu
, CXL_PSL_CtxTime_An
, 0); /* disable */
866 cxl_p1n_write(afu
, CXL_PSL_SPAP_An
, 0); /* disable */
867 cxl_p1n_write(afu
, CXL_PSL_AMOR_An
, 0xFFFFFFFFFFFFFFFFULL
);
868 cxl_p1n_write(afu
, CXL_PSL_LPID_An
, mfspr(SPRN_LPID
));
869 cxl_p1n_write(afu
, CXL_HAURP_An
, 0); /* disable */
870 cxl_p1n_write(afu
, CXL_PSL_SDR_An
, mfspr(SPRN_SDR1
));
872 cxl_p2n_write(afu
, CXL_CSRP_An
, 0); /* disable */
873 cxl_p2n_write(afu
, CXL_AURP0_An
, 0); /* disable */
874 cxl_p2n_write(afu
, CXL_AURP1_An
, 0); /* disable */
876 afu
->current_mode
= CXL_MODE_DEDICATED
;
879 return cxl_chardev_d_afu_add(afu
);
882 void cxl_update_dedicated_ivtes_psl9(struct cxl_context
*ctx
)
886 for (r
= 0; r
< CXL_IRQ_RANGES
; r
++) {
887 ctx
->elem
->ivte_offsets
[r
] = cpu_to_be16(ctx
->irqs
.offset
[r
]);
888 ctx
->elem
->ivte_ranges
[r
] = cpu_to_be16(ctx
->irqs
.range
[r
]);
892 void cxl_update_dedicated_ivtes_psl8(struct cxl_context
*ctx
)
894 struct cxl_afu
*afu
= ctx
->afu
;
896 cxl_p1n_write(afu
, CXL_PSL_IVTE_Offset_An
,
897 (((u64
)ctx
->irqs
.offset
[0] & 0xffff) << 48) |
898 (((u64
)ctx
->irqs
.offset
[1] & 0xffff) << 32) |
899 (((u64
)ctx
->irqs
.offset
[2] & 0xffff) << 16) |
900 ((u64
)ctx
->irqs
.offset
[3] & 0xffff));
901 cxl_p1n_write(afu
, CXL_PSL_IVTE_Limit_An
, (u64
)
902 (((u64
)ctx
->irqs
.range
[0] & 0xffff) << 48) |
903 (((u64
)ctx
->irqs
.range
[1] & 0xffff) << 32) |
904 (((u64
)ctx
->irqs
.range
[2] & 0xffff) << 16) |
905 ((u64
)ctx
->irqs
.range
[3] & 0xffff));
908 int cxl_attach_dedicated_process_psl9(struct cxl_context
*ctx
, u64 wed
, u64 amr
)
910 struct cxl_afu
*afu
= ctx
->afu
;
913 /* fill the process element entry */
914 result
= process_element_entry_psl9(ctx
, wed
, amr
);
918 if (ctx
->afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes
)
919 afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes(ctx
);
921 ctx
->elem
->software_state
= cpu_to_be32(CXL_PE_SOFTWARE_STATE_V
);
923 * Ideally we should do a wmb() here to make sure the changes to the
924 * PE are visible to the card before we call afu_enable.
925 * On ppc64 though all mmios are preceded by a 'sync' instruction hence
926 * we dont dont need one here.
929 result
= cxl_ops
->afu_reset(afu
);
933 return afu_enable(afu
);
936 int cxl_attach_dedicated_process_psl8(struct cxl_context
*ctx
, u64 wed
, u64 amr
)
938 struct cxl_afu
*afu
= ctx
->afu
;
942 pid
= (u64
)current
->pid
<< 32;
945 cxl_p2n_write(afu
, CXL_PSL_PID_TID_An
, pid
);
947 cxl_p1n_write(afu
, CXL_PSL_SR_An
, calculate_sr(ctx
));
949 if ((rc
= cxl_write_sstp(afu
, ctx
->sstp0
, ctx
->sstp1
)))
952 cxl_prefault(ctx
, wed
);
954 if (ctx
->afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes
)
955 afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes(ctx
);
957 cxl_p2n_write(afu
, CXL_PSL_AMR_An
, amr
);
959 /* master only context for dedicated */
960 cxl_assign_psn_space(ctx
);
962 if ((rc
= cxl_ops
->afu_reset(afu
)))
965 cxl_p2n_write(afu
, CXL_PSL_WED_An
, wed
);
967 return afu_enable(afu
);
970 static int deactivate_dedicated_process(struct cxl_afu
*afu
)
972 dev_info(&afu
->dev
, "Deactivating dedicated process mode\n");
974 afu
->current_mode
= 0;
977 cxl_chardev_afu_remove(afu
);
982 static int native_afu_deactivate_mode(struct cxl_afu
*afu
, int mode
)
984 if (mode
== CXL_MODE_DIRECTED
)
985 return deactivate_afu_directed(afu
);
986 if (mode
== CXL_MODE_DEDICATED
)
987 return deactivate_dedicated_process(afu
);
991 static int native_afu_activate_mode(struct cxl_afu
*afu
, int mode
)
995 if (!(mode
& afu
->modes_supported
))
998 if (!cxl_ops
->link_ok(afu
->adapter
, afu
)) {
999 WARN(1, "Device link is down, refusing to activate!\n");
1003 if (mode
== CXL_MODE_DIRECTED
)
1004 return activate_afu_directed(afu
);
1005 if ((mode
== CXL_MODE_DEDICATED
) &&
1006 (afu
->adapter
->native
->sl_ops
->activate_dedicated_process
))
1007 return afu
->adapter
->native
->sl_ops
->activate_dedicated_process(afu
);
1012 static int native_attach_process(struct cxl_context
*ctx
, bool kernel
,
1015 if (!cxl_ops
->link_ok(ctx
->afu
->adapter
, ctx
->afu
)) {
1016 WARN(1, "Device link is down, refusing to attach process!\n");
1020 ctx
->kernel
= kernel
;
1021 if ((ctx
->afu
->current_mode
== CXL_MODE_DIRECTED
) &&
1022 (ctx
->afu
->adapter
->native
->sl_ops
->attach_afu_directed
))
1023 return ctx
->afu
->adapter
->native
->sl_ops
->attach_afu_directed(ctx
, wed
, amr
);
1025 if ((ctx
->afu
->current_mode
== CXL_MODE_DEDICATED
) &&
1026 (ctx
->afu
->adapter
->native
->sl_ops
->attach_dedicated_process
))
1027 return ctx
->afu
->adapter
->native
->sl_ops
->attach_dedicated_process(ctx
, wed
, amr
);
1032 static inline int detach_process_native_dedicated(struct cxl_context
*ctx
)
1035 * The CAIA section 2.1.1 indicates that we need to do an AFU reset to
1036 * stop the AFU in dedicated mode (we therefore do not make that
1037 * optional like we do in the afu directed path). It does not indicate
1038 * that we need to do an explicit disable (which should occur
1039 * implicitly as part of the reset) or purge, but we do these as well
1040 * to be on the safe side.
1042 * Notably we used to have some issues with the disable sequence
1043 * (before the sequence was spelled out in the architecture) which is
1044 * why we were so heavy weight in the first place, however a bug was
1045 * discovered that had rendered the disable operation ineffective, so
1046 * it is conceivable that was the sole explanation for those
1047 * difficulties. Point is, we should be careful and do some regression
1048 * testing if we ever attempt to remove any part of this procedure.
1050 cxl_ops
->afu_reset(ctx
->afu
);
1051 cxl_afu_disable(ctx
->afu
);
1052 cxl_psl_purge(ctx
->afu
);
1056 static void native_update_ivtes(struct cxl_context
*ctx
)
1058 if (ctx
->afu
->current_mode
== CXL_MODE_DIRECTED
)
1059 return update_ivtes_directed(ctx
);
1060 if ((ctx
->afu
->current_mode
== CXL_MODE_DEDICATED
) &&
1061 (ctx
->afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes
))
1062 return ctx
->afu
->adapter
->native
->sl_ops
->update_dedicated_ivtes(ctx
);
1063 WARN(1, "native_update_ivtes: Bad mode\n");
1066 static inline int detach_process_native_afu_directed(struct cxl_context
*ctx
)
1068 if (!ctx
->pe_inserted
)
1070 if (terminate_process_element(ctx
))
1072 if (remove_process_element(ctx
))
1078 static int native_detach_process(struct cxl_context
*ctx
)
1080 trace_cxl_detach(ctx
);
1082 if (ctx
->afu
->current_mode
== CXL_MODE_DEDICATED
)
1083 return detach_process_native_dedicated(ctx
);
1085 return detach_process_native_afu_directed(ctx
);
1088 static int native_get_irq_info(struct cxl_afu
*afu
, struct cxl_irq_info
*info
)
1090 /* If the adapter has gone away, we can't get any meaningful
1093 if (!cxl_ops
->link_ok(afu
->adapter
, afu
))
1096 info
->dsisr
= cxl_p2n_read(afu
, CXL_PSL_DSISR_An
);
1097 info
->dar
= cxl_p2n_read(afu
, CXL_PSL_DAR_An
);
1098 if (cxl_is_power8())
1099 info
->dsr
= cxl_p2n_read(afu
, CXL_PSL_DSR_An
);
1100 info
->afu_err
= cxl_p2n_read(afu
, CXL_AFU_ERR_An
);
1101 info
->errstat
= cxl_p2n_read(afu
, CXL_PSL_ErrStat_An
);
1102 info
->proc_handle
= 0;
1107 void cxl_native_irq_dump_regs_psl9(struct cxl_context
*ctx
)
1111 fir1
= cxl_p1_read(ctx
->afu
->adapter
, CXL_PSL9_FIR1
);
1113 dev_crit(&ctx
->afu
->dev
, "PSL_FIR1: 0x%016llx\n", fir1
);
1114 if (ctx
->afu
->adapter
->native
->sl_ops
->register_serr_irq
) {
1115 serr
= cxl_p1n_read(ctx
->afu
, CXL_PSL_SERR_An
);
1116 cxl_afu_decode_psl_serr(ctx
->afu
, serr
);
1120 void cxl_native_irq_dump_regs_psl8(struct cxl_context
*ctx
)
1122 u64 fir1
, fir2
, fir_slice
, serr
, afu_debug
;
1124 fir1
= cxl_p1_read(ctx
->afu
->adapter
, CXL_PSL_FIR1
);
1125 fir2
= cxl_p1_read(ctx
->afu
->adapter
, CXL_PSL_FIR2
);
1126 fir_slice
= cxl_p1n_read(ctx
->afu
, CXL_PSL_FIR_SLICE_An
);
1127 afu_debug
= cxl_p1n_read(ctx
->afu
, CXL_AFU_DEBUG_An
);
1129 dev_crit(&ctx
->afu
->dev
, "PSL_FIR1: 0x%016llx\n", fir1
);
1130 dev_crit(&ctx
->afu
->dev
, "PSL_FIR2: 0x%016llx\n", fir2
);
1131 if (ctx
->afu
->adapter
->native
->sl_ops
->register_serr_irq
) {
1132 serr
= cxl_p1n_read(ctx
->afu
, CXL_PSL_SERR_An
);
1133 cxl_afu_decode_psl_serr(ctx
->afu
, serr
);
1135 dev_crit(&ctx
->afu
->dev
, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice
);
1136 dev_crit(&ctx
->afu
->dev
, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug
);
1139 static irqreturn_t
native_handle_psl_slice_error(struct cxl_context
*ctx
,
1140 u64 dsisr
, u64 errstat
)
1143 dev_crit(&ctx
->afu
->dev
, "PSL ERROR STATUS: 0x%016llx\n", errstat
);
1145 if (ctx
->afu
->adapter
->native
->sl_ops
->psl_irq_dump_registers
)
1146 ctx
->afu
->adapter
->native
->sl_ops
->psl_irq_dump_registers(ctx
);
1148 if (ctx
->afu
->adapter
->native
->sl_ops
->debugfs_stop_trace
) {
1149 dev_crit(&ctx
->afu
->dev
, "STOPPING CXL TRACE\n");
1150 ctx
->afu
->adapter
->native
->sl_ops
->debugfs_stop_trace(ctx
->afu
->adapter
);
1153 return cxl_ops
->ack_irq(ctx
, 0, errstat
);
1156 static bool cxl_is_translation_fault(struct cxl_afu
*afu
, u64 dsisr
)
1158 if ((cxl_is_power8()) && (dsisr
& CXL_PSL_DSISR_TRANS
))
1161 if ((cxl_is_power9()) && (dsisr
& CXL_PSL9_DSISR_An_TF
))
1167 irqreturn_t
cxl_fail_irq_psl(struct cxl_afu
*afu
, struct cxl_irq_info
*irq_info
)
1169 if (cxl_is_translation_fault(afu
, irq_info
->dsisr
))
1170 cxl_p2n_write(afu
, CXL_PSL_TFC_An
, CXL_PSL_TFC_An_AE
);
1172 cxl_p2n_write(afu
, CXL_PSL_TFC_An
, CXL_PSL_TFC_An_A
);
1177 static irqreturn_t
native_irq_multiplexed(int irq
, void *data
)
1179 struct cxl_afu
*afu
= data
;
1180 struct cxl_context
*ctx
;
1181 struct cxl_irq_info irq_info
;
1182 u64 phreg
= cxl_p2n_read(afu
, CXL_PSL_PEHandle_An
);
1183 int ph
, ret
= IRQ_HANDLED
, res
;
1185 /* check if eeh kicked in while the interrupt was in flight */
1186 if (unlikely(phreg
== ~0ULL)) {
1188 "Ignoring slice interrupt(%d) due to fenced card",
1192 /* Mask the pe-handle from register value */
1193 ph
= phreg
& 0xffff;
1194 if ((res
= native_get_irq_info(afu
, &irq_info
))) {
1195 WARN(1, "Unable to get CXL IRQ Info: %i\n", res
);
1196 if (afu
->adapter
->native
->sl_ops
->fail_irq
)
1197 return afu
->adapter
->native
->sl_ops
->fail_irq(afu
, &irq_info
);
1202 ctx
= idr_find(&afu
->contexts_idr
, ph
);
1204 if (afu
->adapter
->native
->sl_ops
->handle_interrupt
)
1205 ret
= afu
->adapter
->native
->sl_ops
->handle_interrupt(irq
, ctx
, &irq_info
);
1211 WARN(1, "Unable to demultiplex CXL PSL IRQ for PE %i DSISR %016llx DAR"
1212 " %016llx\n(Possible AFU HW issue - was a term/remove acked"
1213 " with outstanding transactions?)\n", ph
, irq_info
.dsisr
,
1215 if (afu
->adapter
->native
->sl_ops
->fail_irq
)
1216 ret
= afu
->adapter
->native
->sl_ops
->fail_irq(afu
, &irq_info
);
1220 static void native_irq_wait(struct cxl_context
*ctx
)
1227 * Wait until no further interrupts are presented by the PSL
1231 ph
= cxl_p2n_read(ctx
->afu
, CXL_PSL_PEHandle_An
) & 0xffff;
1234 dsisr
= cxl_p2n_read(ctx
->afu
, CXL_PSL_DSISR_An
);
1235 if (cxl_is_power8() &&
1236 ((dsisr
& CXL_PSL_DSISR_PENDING
) == 0))
1238 if (cxl_is_power9() &&
1239 ((dsisr
& CXL_PSL9_DSISR_PENDING
) == 0))
1242 * We are waiting for the workqueue to process our
1243 * irq, so need to let that run here.
1248 dev_warn(&ctx
->afu
->dev
, "WARNING: waiting on DSI for PE %i"
1249 " DSISR %016llx!\n", ph
, dsisr
);
1253 static irqreturn_t
native_slice_irq_err(int irq
, void *data
)
1255 struct cxl_afu
*afu
= data
;
1256 u64 errstat
, serr
, afu_error
, dsisr
;
1257 u64 fir_slice
, afu_debug
, irq_mask
;
1260 * slice err interrupt is only used with full PSL (no XSL)
1262 serr
= cxl_p1n_read(afu
, CXL_PSL_SERR_An
);
1263 errstat
= cxl_p2n_read(afu
, CXL_PSL_ErrStat_An
);
1264 afu_error
= cxl_p2n_read(afu
, CXL_AFU_ERR_An
);
1265 dsisr
= cxl_p2n_read(afu
, CXL_PSL_DSISR_An
);
1266 cxl_afu_decode_psl_serr(afu
, serr
);
1268 if (cxl_is_power8()) {
1269 fir_slice
= cxl_p1n_read(afu
, CXL_PSL_FIR_SLICE_An
);
1270 afu_debug
= cxl_p1n_read(afu
, CXL_AFU_DEBUG_An
);
1271 dev_crit(&afu
->dev
, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice
);
1272 dev_crit(&afu
->dev
, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug
);
1274 dev_crit(&afu
->dev
, "CXL_PSL_ErrStat_An: 0x%016llx\n", errstat
);
1275 dev_crit(&afu
->dev
, "AFU_ERR_An: 0x%.16llx\n", afu_error
);
1276 dev_crit(&afu
->dev
, "PSL_DSISR_An: 0x%.16llx\n", dsisr
);
1278 /* mask off the IRQ so it won't retrigger until the AFU is reset */
1279 irq_mask
= (serr
& CXL_PSL_SERR_An_IRQS
) >> 32;
1281 cxl_p1n_write(afu
, CXL_PSL_SERR_An
, serr
);
1282 dev_info(&afu
->dev
, "Further such interrupts will be masked until the AFU is reset\n");
1287 void cxl_native_err_irq_dump_regs_psl9(struct cxl
*adapter
)
1291 fir1
= cxl_p1_read(adapter
, CXL_PSL9_FIR1
);
1292 dev_crit(&adapter
->dev
, "PSL_FIR: 0x%016llx\n", fir1
);
1295 void cxl_native_err_irq_dump_regs_psl8(struct cxl
*adapter
)
1299 fir1
= cxl_p1_read(adapter
, CXL_PSL_FIR1
);
1300 fir2
= cxl_p1_read(adapter
, CXL_PSL_FIR2
);
1301 dev_crit(&adapter
->dev
,
1302 "PSL_FIR1: 0x%016llx\nPSL_FIR2: 0x%016llx\n",
1306 static irqreturn_t
native_irq_err(int irq
, void *data
)
1308 struct cxl
*adapter
= data
;
1311 WARN(1, "CXL ERROR interrupt %i\n", irq
);
1313 err_ivte
= cxl_p1_read(adapter
, CXL_PSL_ErrIVTE
);
1314 dev_crit(&adapter
->dev
, "PSL_ErrIVTE: 0x%016llx\n", err_ivte
);
1316 if (adapter
->native
->sl_ops
->debugfs_stop_trace
) {
1317 dev_crit(&adapter
->dev
, "STOPPING CXL TRACE\n");
1318 adapter
->native
->sl_ops
->debugfs_stop_trace(adapter
);
1321 if (adapter
->native
->sl_ops
->err_irq_dump_registers
)
1322 adapter
->native
->sl_ops
->err_irq_dump_registers(adapter
);
1327 int cxl_native_register_psl_err_irq(struct cxl
*adapter
)
1331 adapter
->irq_name
= kasprintf(GFP_KERNEL
, "cxl-%s-err",
1332 dev_name(&adapter
->dev
));
1333 if (!adapter
->irq_name
)
1336 if ((rc
= cxl_register_one_irq(adapter
, native_irq_err
, adapter
,
1337 &adapter
->native
->err_hwirq
,
1338 &adapter
->native
->err_virq
,
1339 adapter
->irq_name
))) {
1340 kfree(adapter
->irq_name
);
1341 adapter
->irq_name
= NULL
;
1345 cxl_p1_write(adapter
, CXL_PSL_ErrIVTE
, adapter
->native
->err_hwirq
& 0xffff);
1350 void cxl_native_release_psl_err_irq(struct cxl
*adapter
)
1352 if (adapter
->native
->err_virq
== 0 ||
1353 adapter
->native
->err_virq
!=
1354 irq_find_mapping(NULL
, adapter
->native
->err_hwirq
))
1357 cxl_p1_write(adapter
, CXL_PSL_ErrIVTE
, 0x0000000000000000);
1358 cxl_unmap_irq(adapter
->native
->err_virq
, adapter
);
1359 cxl_ops
->release_one_irq(adapter
, adapter
->native
->err_hwirq
);
1360 kfree(adapter
->irq_name
);
1361 adapter
->native
->err_virq
= 0;
1364 int cxl_native_register_serr_irq(struct cxl_afu
*afu
)
1369 afu
->err_irq_name
= kasprintf(GFP_KERNEL
, "cxl-%s-err",
1370 dev_name(&afu
->dev
));
1371 if (!afu
->err_irq_name
)
1374 if ((rc
= cxl_register_one_irq(afu
->adapter
, native_slice_irq_err
, afu
,
1376 &afu
->serr_virq
, afu
->err_irq_name
))) {
1377 kfree(afu
->err_irq_name
);
1378 afu
->err_irq_name
= NULL
;
1382 serr
= cxl_p1n_read(afu
, CXL_PSL_SERR_An
);
1383 if (cxl_is_power8())
1384 serr
= (serr
& 0x00ffffffffff0000ULL
) | (afu
->serr_hwirq
& 0xffff);
1385 if (cxl_is_power9()) {
1387 * By default, all errors are masked. So don't set all masks.
1388 * Slice errors will be transfered.
1390 serr
= (serr
& ~0xff0000007fffffffULL
) | (afu
->serr_hwirq
& 0xffff);
1392 cxl_p1n_write(afu
, CXL_PSL_SERR_An
, serr
);
1397 void cxl_native_release_serr_irq(struct cxl_afu
*afu
)
1399 if (afu
->serr_virq
== 0 ||
1400 afu
->serr_virq
!= irq_find_mapping(NULL
, afu
->serr_hwirq
))
1403 cxl_p1n_write(afu
, CXL_PSL_SERR_An
, 0x0000000000000000);
1404 cxl_unmap_irq(afu
->serr_virq
, afu
);
1405 cxl_ops
->release_one_irq(afu
->adapter
, afu
->serr_hwirq
);
1406 kfree(afu
->err_irq_name
);
1410 int cxl_native_register_psl_irq(struct cxl_afu
*afu
)
1414 afu
->psl_irq_name
= kasprintf(GFP_KERNEL
, "cxl-%s",
1415 dev_name(&afu
->dev
));
1416 if (!afu
->psl_irq_name
)
1419 if ((rc
= cxl_register_one_irq(afu
->adapter
, native_irq_multiplexed
,
1420 afu
, &afu
->native
->psl_hwirq
, &afu
->native
->psl_virq
,
1421 afu
->psl_irq_name
))) {
1422 kfree(afu
->psl_irq_name
);
1423 afu
->psl_irq_name
= NULL
;
1428 void cxl_native_release_psl_irq(struct cxl_afu
*afu
)
1430 if (afu
->native
->psl_virq
== 0 ||
1431 afu
->native
->psl_virq
!=
1432 irq_find_mapping(NULL
, afu
->native
->psl_hwirq
))
1435 cxl_unmap_irq(afu
->native
->psl_virq
, afu
);
1436 cxl_ops
->release_one_irq(afu
->adapter
, afu
->native
->psl_hwirq
);
1437 kfree(afu
->psl_irq_name
);
1438 afu
->native
->psl_virq
= 0;
1441 static void recover_psl_err(struct cxl_afu
*afu
, u64 errstat
)
1445 pr_devel("RECOVERING FROM PSL ERROR... (0x%016llx)\n", errstat
);
1447 /* Clear PSL_DSISR[PE] */
1448 dsisr
= cxl_p2n_read(afu
, CXL_PSL_DSISR_An
);
1449 cxl_p2n_write(afu
, CXL_PSL_DSISR_An
, dsisr
& ~CXL_PSL_DSISR_An_PE
);
1451 /* Write 1s to clear error status bits */
1452 cxl_p2n_write(afu
, CXL_PSL_ErrStat_An
, errstat
);
1455 static int native_ack_irq(struct cxl_context
*ctx
, u64 tfc
, u64 psl_reset_mask
)
1457 trace_cxl_psl_irq_ack(ctx
, tfc
);
1459 cxl_p2n_write(ctx
->afu
, CXL_PSL_TFC_An
, tfc
);
1461 recover_psl_err(ctx
->afu
, psl_reset_mask
);
1466 int cxl_check_error(struct cxl_afu
*afu
)
1468 return (cxl_p1n_read(afu
, CXL_PSL_SCNTL_An
) == ~0ULL);
1471 static bool native_support_attributes(const char *attr_name
,
1472 enum cxl_attrs type
)
1477 static int native_afu_cr_read64(struct cxl_afu
*afu
, int cr
, u64 off
, u64
*out
)
1479 if (unlikely(!cxl_ops
->link_ok(afu
->adapter
, afu
)))
1481 if (unlikely(off
>= afu
->crs_len
))
1483 *out
= in_le64(afu
->native
->afu_desc_mmio
+ afu
->crs_offset
+
1484 (cr
* afu
->crs_len
) + off
);
1488 static int native_afu_cr_read32(struct cxl_afu
*afu
, int cr
, u64 off
, u32
*out
)
1490 if (unlikely(!cxl_ops
->link_ok(afu
->adapter
, afu
)))
1492 if (unlikely(off
>= afu
->crs_len
))
1494 *out
= in_le32(afu
->native
->afu_desc_mmio
+ afu
->crs_offset
+
1495 (cr
* afu
->crs_len
) + off
);
1499 static int native_afu_cr_read16(struct cxl_afu
*afu
, int cr
, u64 off
, u16
*out
)
1501 u64 aligned_off
= off
& ~0x3L
;
1505 rc
= native_afu_cr_read32(afu
, cr
, aligned_off
, &val
);
1507 *out
= (val
>> ((off
& 0x3) * 8)) & 0xffff;
1511 static int native_afu_cr_read8(struct cxl_afu
*afu
, int cr
, u64 off
, u8
*out
)
1513 u64 aligned_off
= off
& ~0x3L
;
1517 rc
= native_afu_cr_read32(afu
, cr
, aligned_off
, &val
);
1519 *out
= (val
>> ((off
& 0x3) * 8)) & 0xff;
1523 static int native_afu_cr_write32(struct cxl_afu
*afu
, int cr
, u64 off
, u32 in
)
1525 if (unlikely(!cxl_ops
->link_ok(afu
->adapter
, afu
)))
1527 if (unlikely(off
>= afu
->crs_len
))
1529 out_le32(afu
->native
->afu_desc_mmio
+ afu
->crs_offset
+
1530 (cr
* afu
->crs_len
) + off
, in
);
1534 static int native_afu_cr_write16(struct cxl_afu
*afu
, int cr
, u64 off
, u16 in
)
1536 u64 aligned_off
= off
& ~0x3L
;
1537 u32 val32
, mask
, shift
;
1540 rc
= native_afu_cr_read32(afu
, cr
, aligned_off
, &val32
);
1543 shift
= (off
& 0x3) * 8;
1544 WARN_ON(shift
== 24);
1545 mask
= 0xffff << shift
;
1546 val32
= (val32
& ~mask
) | (in
<< shift
);
1548 rc
= native_afu_cr_write32(afu
, cr
, aligned_off
, val32
);
1552 static int native_afu_cr_write8(struct cxl_afu
*afu
, int cr
, u64 off
, u8 in
)
1554 u64 aligned_off
= off
& ~0x3L
;
1555 u32 val32
, mask
, shift
;
1558 rc
= native_afu_cr_read32(afu
, cr
, aligned_off
, &val32
);
1561 shift
= (off
& 0x3) * 8;
1562 mask
= 0xff << shift
;
1563 val32
= (val32
& ~mask
) | (in
<< shift
);
1565 rc
= native_afu_cr_write32(afu
, cr
, aligned_off
, val32
);
1569 const struct cxl_backend_ops cxl_native_ops
= {
1570 .module
= THIS_MODULE
,
1571 .adapter_reset
= cxl_pci_reset
,
1572 .alloc_one_irq
= cxl_pci_alloc_one_irq
,
1573 .release_one_irq
= cxl_pci_release_one_irq
,
1574 .alloc_irq_ranges
= cxl_pci_alloc_irq_ranges
,
1575 .release_irq_ranges
= cxl_pci_release_irq_ranges
,
1576 .setup_irq
= cxl_pci_setup_irq
,
1577 .handle_psl_slice_error
= native_handle_psl_slice_error
,
1578 .psl_interrupt
= NULL
,
1579 .ack_irq
= native_ack_irq
,
1580 .irq_wait
= native_irq_wait
,
1581 .attach_process
= native_attach_process
,
1582 .detach_process
= native_detach_process
,
1583 .update_ivtes
= native_update_ivtes
,
1584 .support_attributes
= native_support_attributes
,
1585 .link_ok
= cxl_adapter_link_ok
,
1586 .release_afu
= cxl_pci_release_afu
,
1587 .afu_read_err_buffer
= cxl_pci_afu_read_err_buffer
,
1588 .afu_check_and_enable
= native_afu_check_and_enable
,
1589 .afu_activate_mode
= native_afu_activate_mode
,
1590 .afu_deactivate_mode
= native_afu_deactivate_mode
,
1591 .afu_reset
= native_afu_reset
,
1592 .afu_cr_read8
= native_afu_cr_read8
,
1593 .afu_cr_read16
= native_afu_cr_read16
,
1594 .afu_cr_read32
= native_afu_cr_read32
,
1595 .afu_cr_read64
= native_afu_cr_read64
,
1596 .afu_cr_write8
= native_afu_cr_write8
,
1597 .afu_cr_write16
= native_afu_cr_write16
,
1598 .afu_cr_write32
= native_afu_cr_write32
,
1599 .read_adapter_vpd
= cxl_pci_read_adapter_vpd
,