/*
 * Copyright 2014 IBM Corp.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */

#include <linux/spinlock.h>
#include <linux/sched.h>
#include <linux/sched/clock.h>
#include <linux/slab.h>
#include <linux/mutex.h>
#include <linux/mm.h>
#include <linux/uaccess.h>
#include <linux/delay.h>
#include <asm/synch.h>
#include <asm/switch_to.h>
#include <misc/cxl-base.h>

#include "cxl.h"
#include "trace.h"

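/*
 * afu_control() serialises AFU state changes under afu_cntl_lock: it
 * read-modify-writes the AFU_Cntl_An register to issue a command, then
 * polls until the masked status bits match the expected result, bailing
 * out on the CXL_TIMEOUT deadline or if the link goes down.
 */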
static int afu_control(struct cxl_afu *afu, u64 command, u64 clear,
		       u64 result, u64 mask, bool enabled)
{
	u64 AFU_Cntl;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	spin_lock(&afu->afu_cntl_lock);
	pr_devel("AFU command starting: %llx\n", command);

	trace_cxl_afu_ctrl(afu, command);

	AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	cxl_p2n_write(afu, CXL_AFU_Cntl_An, (AFU_Cntl & ~clear) | command);

	AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	while ((AFU_Cntl & mask) != result) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: AFU control timed out!\n");
			rc = -EBUSY;
			goto out;
		}

		if (!cxl_ops->link_ok(afu->adapter, afu)) {
			afu->enabled = enabled;
			rc = -EIO;
			goto out;
		}

		pr_devel_ratelimited("AFU control... (0x%016llx)\n",
				     AFU_Cntl | command);
		cpu_relax();
		AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	}

	if (AFU_Cntl & CXL_AFU_Cntl_An_RA) {
		/*
		 * Workaround for a bug in the XSL used in the Mellanox CX4
		 * that fails to clear the RA bit after an AFU reset,
		 * preventing subsequent AFU resets from working.
		 */
		cxl_p2n_write(afu, CXL_AFU_Cntl_An, AFU_Cntl & ~CXL_AFU_Cntl_An_RA);
	}

	pr_devel("AFU command complete: %llx\n", command);
	afu->enabled = enabled;
out:
	trace_cxl_afu_ctrl_done(afu, command, rc);
	spin_unlock(&afu->afu_cntl_lock);

	return rc;
}

static int afu_enable(struct cxl_afu *afu)
{
	pr_devel("AFU enable request\n");

	return afu_control(afu, CXL_AFU_Cntl_An_E, 0,
			   CXL_AFU_Cntl_An_ES_Enabled,
			   CXL_AFU_Cntl_An_ES_MASK, true);
}

int cxl_afu_disable(struct cxl_afu *afu)
{
	pr_devel("AFU disable request\n");

	return afu_control(afu, 0, CXL_AFU_Cntl_An_E,
			   CXL_AFU_Cntl_An_ES_Disabled,
			   CXL_AFU_Cntl_An_ES_MASK, false);
}

/* This will disable as well as reset */
static int native_afu_reset(struct cxl_afu *afu)
{
	int rc;
	u64 serr;

	pr_devel("AFU reset request\n");

	rc = afu_control(afu, CXL_AFU_Cntl_An_RA, 0,
			 CXL_AFU_Cntl_An_RS_Complete | CXL_AFU_Cntl_An_ES_Disabled,
			 CXL_AFU_Cntl_An_RS_MASK | CXL_AFU_Cntl_An_ES_MASK,
			 false);

	/*
	 * Re-enable any masked interrupts when the AFU is not
	 * activated to avoid side effects after attaching a process
	 * in dedicated mode.
	 */
	if (afu->current_mode == 0) {
		serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
		serr &= ~CXL_PSL_SERR_An_IRQ_MASKS;
		cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);
	}

	return rc;
}

static int native_afu_check_and_enable(struct cxl_afu *afu)
{
	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		WARN(1, "Refusing to enable afu while link down!\n");
		return -EIO;
	}
	if (afu->enabled)
		return 0;
	return afu_enable(afu);
}

int cxl_psl_purge(struct cxl_afu *afu)
{
	u64 PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	u64 AFU_Cntl = cxl_p2n_read(afu, CXL_AFU_Cntl_An);
	u64 dsisr, dar;
	u64 start, end;
	u64 trans_fault = 0x0ULL;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	trace_cxl_psl_ctrl(afu, CXL_PSL_SCNTL_An_Pc);

	pr_devel("PSL purge request\n");

	if (cxl_is_power8())
		trans_fault = CXL_PSL_DSISR_TRANS;
	if (cxl_is_power9())
		trans_fault = CXL_PSL9_DSISR_An_TF;

	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		dev_warn(&afu->dev, "PSL Purge called with link down, ignoring\n");
		rc = -EIO;
		goto out;
	}

	if ((AFU_Cntl & CXL_AFU_Cntl_An_ES_MASK) != CXL_AFU_Cntl_An_ES_Disabled) {
		WARN(1, "psl_purge request while AFU not disabled!\n");
		cxl_afu_disable(afu);
	}

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL | CXL_PSL_SCNTL_An_Pc);
	start = local_clock();
	PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	while ((PSL_CNTL & CXL_PSL_SCNTL_An_Ps_MASK)
			== CXL_PSL_SCNTL_An_Ps_Pending) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&afu->dev, "WARNING: PSL Purge timed out!\n");
			rc = -EBUSY;
			goto out;
		}
		if (!cxl_ops->link_ok(afu->adapter, afu)) {
			rc = -EIO;
			goto out;
		}

		dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
		pr_devel_ratelimited("PSL purging... PSL_CNTL: 0x%016llx  PSL_DSISR: 0x%016llx\n",
				     PSL_CNTL, dsisr);

		if (dsisr & trans_fault) {
			dar = cxl_p2n_read(afu, CXL_PSL_DAR_An);
			dev_notice(&afu->dev, "PSL purge terminating pending translation, DSISR: 0x%016llx, DAR: 0x%016llx\n",
				   dsisr, dar);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE);
		} else if (dsisr) {
			dev_notice(&afu->dev, "PSL purge acknowledging pending non-translation fault, DSISR: 0x%016llx\n",
				   dsisr);
			cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A);
		} else {
			cpu_relax();
		}
		PSL_CNTL = cxl_p1n_read(afu, CXL_PSL_SCNTL_An);
	}
	end = local_clock();
	pr_devel("PSL purged in %lld ns\n", end - start);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An,
		      PSL_CNTL & ~CXL_PSL_SCNTL_An_Pc);
out:
	trace_cxl_psl_ctrl_done(afu, CXL_PSL_SCNTL_An_Pc, rc);
	return rc;
}

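/*
 * Worked example for the formula below: a single 4K page gives
 * ((4096 / 8) - 96) / 17 = 24 process elements.
 */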
static int spa_max_procs(int spa_size)
{
	/*
	 * From the CAIA:
	 *    end_of_SPA_area = SPA_Base + ((n+4) * 128) + (( ((n*8) + 127) >> 7) * 128) + 255
	 * Most of that junk is really just an overly-complicated way of saying
	 * the last 256 bytes are __aligned(128), so it's really:
	 *    end_of_SPA_area = end_of_PSL_queue_area + __aligned(128) 255
	 * and
	 *    end_of_PSL_queue_area = SPA_Base + ((n+4) * 128) + (n*8) - 1
	 * so
	 *    sizeof(SPA) = ((n+4) * 128) + (n*8) + __aligned(128) 256
	 * Ignore the alignment (which is safe in this case as long as we are
	 * careful with our rounding) and solve for n:
	 */
	return ((spa_size / 8) - 96) / 17;
}

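/*
 * The scheduled process area (SPA) holds one process element per
 * attached context plus bookkeeping, and must be a power-of-two number
 * of pages. cxl_alloc_spa() therefore doubles the allocation order
 * until spa_max_procs() covers afu->num_procs, capping the SPA at 1MB
 * (0x100000 bytes).
 */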
static int cxl_alloc_spa(struct cxl_afu *afu, int mode)
{
	unsigned spa_size;

	/* Work out how many pages to allocate */
	afu->native->spa_order = -1;
	do {
		afu->native->spa_order++;
		spa_size = (1 << afu->native->spa_order) * PAGE_SIZE;

		if (spa_size > 0x100000) {
			dev_warn(&afu->dev, "num_of_processes too large for the SPA, limiting to %i (0x%x)\n",
				 afu->native->spa_max_procs, afu->native->spa_size);
			if (mode != CXL_MODE_DEDICATED)
				afu->num_procs = afu->native->spa_max_procs;
			break;
		}

		afu->native->spa_size = spa_size;
		afu->native->spa_max_procs = spa_max_procs(afu->native->spa_size);
	} while (afu->native->spa_max_procs < afu->num_procs);

	if (!(afu->native->spa = (struct cxl_process_element *)
	      __get_free_pages(GFP_KERNEL | __GFP_ZERO, afu->native->spa_order))) {
		pr_err("cxl_alloc_spa: Unable to allocate scheduled process area\n");
		return -ENOMEM;
	}
	pr_devel("spa pages: %i afu->spa_max_procs: %i afu->num_procs: %i\n",
		 1<<afu->native->spa_order, afu->native->spa_max_procs, afu->num_procs);

	return 0;
}

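/*
 * attach_spa() points the PSL at the SPA: the physical base address and
 * encoded size are programmed into CXL_PSL_SPAP_An along with the valid
 * bit, and sw_command_status is set to the location within the SPA
 * where the PSL reports process element command completion (see
 * do_process_element_cmd()).
 */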
static void attach_spa(struct cxl_afu *afu)
{
	u64 spap;

	afu->native->sw_command_status = (__be64 *)((char *)afu->native->spa +
					 ((afu->native->spa_max_procs + 3) * 128));

	spap = virt_to_phys(afu->native->spa) & CXL_PSL_SPAP_Addr;
	spap |= ((afu->native->spa_size >> (12 - CXL_PSL_SPAP_Size_Shift)) - 1) & CXL_PSL_SPAP_Size;
	spap |= CXL_PSL_SPAP_V;
	pr_devel("cxl: SPA allocated at 0x%p. Max processes: %i, sw_command_status: 0x%p CXL_PSL_SPAP_An=0x%016llx\n",
		 afu->native->spa, afu->native->spa_max_procs,
		 afu->native->sw_command_status, spap);
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, spap);
}

static inline void detach_spa(struct cxl_afu *afu)
{
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0);
}

void cxl_release_spa(struct cxl_afu *afu)
{
	if (afu->native->spa) {
		free_pages((unsigned long) afu->native->spa,
			   afu->native->spa_order);
		afu->native->spa = NULL;
	}
}

/*
 * Invalidation of all ERAT entries is no longer required by CAIA2. Use
 * only for debug.
 */
int cxl_invalidate_all_psl9(struct cxl *adapter)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	u64 ierat;

	pr_devel("CXL adapter - invalidation of all ERAT entries\n");

	/* Invalidates all ERAT entries for Radix or HPT */
	ierat = CXL_XSL9_IERAT_IALL;
	if (radix_enabled())
		ierat |= CXL_XSL9_IERAT_INVR;
	cxl_p1_write(adapter, CXL_XSL9_IERAT, ierat);

	while (cxl_p1_read(adapter, CXL_XSL9_IERAT) & CXL_XSL9_IERAT_IINPROG) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev,
				 "WARNING: CXL adapter invalidation of all ERAT entries timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}
	return 0;
}

int cxl_invalidate_all_psl8(struct cxl *adapter)
{
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("CXL adapter wide TLBIA & SLBIA\n");

	cxl_p1_write(adapter, CXL_PSL_AFUSEL, CXL_PSL_AFUSEL_A);

	cxl_p1_write(adapter, CXL_PSL_TLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_TLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide TLBIA timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}

	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_ALL);
	while (cxl_p1_read(adapter, CXL_PSL_SLBIA) & CXL_TLB_SLB_P) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: CXL adapter wide SLBIA timed out!\n");
			return -EBUSY;
		}
		if (!cxl_ops->link_ok(adapter, NULL))
			return -EIO;
		cpu_relax();
	}
	return 0;
}

int cxl_data_cache_flush(struct cxl *adapter)
{
	u64 reg;
	int rc = 0;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);

	pr_devel("Flushing data cache\n");

	reg = cxl_p1_read(adapter, CXL_PSL_Control);
	reg |= CXL_PSL_Control_Fr;
	cxl_p1_write(adapter, CXL_PSL_Control, reg);

	reg = cxl_p1_read(adapter, CXL_PSL_Control);
	while ((reg & CXL_PSL_Control_Fs_MASK) != CXL_PSL_Control_Fs_Complete) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&adapter->dev, "WARNING: cache flush timed out!\n");
			rc = -EBUSY;
			goto out;
		}

		if (!cxl_ops->link_ok(adapter, NULL)) {
			dev_warn(&adapter->dev, "WARNING: link down when flushing cache\n");
			rc = -EIO;
			goto out;
		}
		cpu_relax();
		reg = cxl_p1_read(adapter, CXL_PSL_Control);
	}

out:
	reg &= ~CXL_PSL_Control_Fr;
	cxl_p1_write(adapter, CXL_PSL_Control, reg);
	return rc;
}

static int cxl_write_sstp(struct cxl_afu *afu, u64 sstp0, u64 sstp1)
{
	int rc;

	/* 1. Disable SSTP by writing 0 to SSTP1[V] */
	cxl_p2n_write(afu, CXL_SSTP1_An, 0);

	/* 2. Invalidate all SLB entries */
	if ((rc = cxl_afu_slbia(afu)))
		return rc;

	/* 3. Set SSTP0_An */
	cxl_p2n_write(afu, CXL_SSTP0_An, sstp0);

	/* 4. Set SSTP1_An */
	cxl_p2n_write(afu, CXL_SSTP1_An, sstp1);

	return 0;
}

/* Using per slice version may improve performance here. (ie. SLBIA_An) */
static void slb_invalid(struct cxl_context *ctx)
{
	struct cxl *adapter = ctx->afu->adapter;
	u64 slbia;

	WARN_ON(!mutex_is_locked(&ctx->afu->native->spa_mutex));

	cxl_p1_write(adapter, CXL_PSL_LBISEL,
		     ((u64)be32_to_cpu(ctx->elem->common.pid) << 32) |
		     be32_to_cpu(ctx->elem->lpid));
	cxl_p1_write(adapter, CXL_PSL_SLBIA, CXL_TLB_SLB_IQ_LPIDPID);

	while (1) {
		if (!cxl_ops->link_ok(adapter, NULL))
			break;
		slbia = cxl_p1_read(adapter, CXL_PSL_SLBIA);
		if (!(slbia & CXL_TLB_SLB_P))
			break;
		cpu_relax();
	}
}

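/*
 * Process element commands follow a simple handshake: software writes
 * the new software state into the PE, issues the command plus PE handle
 * via CXL_PSL_LLCMD_An, and then polls sw_command_status (in the SPA)
 * until the PSL echoes back the command, state and PE handle, or the
 * timeout/link checks fire.
 */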
static int do_process_element_cmd(struct cxl_context *ctx,
				  u64 cmd, u64 pe_state)
{
	u64 state;
	unsigned long timeout = jiffies + (HZ * CXL_TIMEOUT);
	int rc = 0;

	trace_cxl_llcmd(ctx, cmd);

	WARN_ON(!ctx->afu->enabled);

	ctx->elem->software_state = cpu_to_be32(pe_state);
	smp_wmb();
	*(ctx->afu->native->sw_command_status) = cpu_to_be64(cmd | 0 | ctx->pe);
	smp_mb();
	cxl_p1n_write(ctx->afu, CXL_PSL_LLCMD_An, cmd | ctx->pe);
	while (1) {
		if (time_after_eq(jiffies, timeout)) {
			dev_warn(&ctx->afu->dev, "WARNING: Process Element Command timed out!\n");
			rc = -EBUSY;
			goto out;
		}
		if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu)) {
			dev_warn(&ctx->afu->dev, "WARNING: Device link down, aborting Process Element Command!\n");
			rc = -EIO;
			goto out;
		}
		state = be64_to_cpup(ctx->afu->native->sw_command_status);
		if (state == ~0ULL) {
			pr_err("cxl: Error adding process element to AFU\n");
			rc = -1;
			goto out;
		}
		if ((state & (CXL_SPA_SW_CMD_MASK | CXL_SPA_SW_STATE_MASK | CXL_SPA_SW_LINK_MASK)) ==
		    (cmd | (cmd >> 16) | ctx->pe))
			break;
		/*
		 * The command won't finish in the PSL if there are
		 * outstanding DSIs. Hence we need to yield here in
		 * case there are outstanding DSIs that we need to
		 * service. Tuning possibility: we could wait for a
		 * while before sched.
		 */
		schedule();
	}
out:
	trace_cxl_llcmd_done(ctx, cmd, rc);
	return rc;
}

static int add_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Adding pe: %i started\n", __func__, ctx->pe);
	if (!(rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_ADD, CXL_PE_SOFTWARE_STATE_V)))
		ctx->pe_inserted = true;
	pr_devel("%s Adding pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);
	return rc;
}

static int terminate_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	/* fast path terminate if it's already invalid */
	if (!(ctx->elem->software_state & cpu_to_be32(CXL_PE_SOFTWARE_STATE_V)))
		return rc;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Terminate pe: %i started\n", __func__, ctx->pe);
	/* We could be asked to terminate when the hw is down. That
	 * should always succeed: it's not running if the hw has gone
	 * away and is being reset.
	 */
	if (cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
		rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_TERMINATE,
					    CXL_PE_SOFTWARE_STATE_V | CXL_PE_SOFTWARE_STATE_T);
	ctx->elem->software_state = 0;	/* Remove Valid bit */
	pr_devel("%s Terminate pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);
	return rc;
}

static int remove_process_element(struct cxl_context *ctx)
{
	int rc = 0;

	mutex_lock(&ctx->afu->native->spa_mutex);
	pr_devel("%s Remove pe: %i started\n", __func__, ctx->pe);

	/* We could be asked to remove when the hw is down. Again, if
	 * the hw is down, the PE is gone, so we succeed.
	 */
	if (cxl_ops->link_ok(ctx->afu->adapter, ctx->afu))
		rc = do_process_element_cmd(ctx, CXL_SPA_SW_CMD_REMOVE, 0);

	if (!rc)
		ctx->pe_inserted = false;
	if (cxl_is_power8())
		slb_invalid(ctx);
	pr_devel("%s Remove pe: %i finished\n", __func__, ctx->pe);
	mutex_unlock(&ctx->afu->native->spa_mutex);

	return rc;
}

void cxl_assign_psn_space(struct cxl_context *ctx)
{
	if (!ctx->afu->pp_size || ctx->master) {
		ctx->psn_phys = ctx->afu->psn_phys;
		ctx->psn_size = ctx->afu->adapter->ps_size;
	} else {
		ctx->psn_phys = ctx->afu->psn_phys +
			(ctx->afu->native->pp_offset + ctx->afu->pp_size * ctx->pe);
		ctx->psn_size = ctx->afu->pp_size;
	}
}

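/*
 * AFU directed mode: many contexts share one AFU, each described by a
 * process element in the SPA. Activation sizes the SPA for
 * max_procs_virtualised, programs the mode into CXL_PSL_SCNTL_An and
 * creates the master/slave character devices.
 */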
static int activate_afu_directed(struct cxl_afu *afu)
{
	int rc;

	dev_info(&afu->dev, "Activating AFU directed mode\n");

	afu->num_procs = afu->max_procs_virtualised;
	if (afu->native->spa == NULL) {
		if (cxl_alloc_spa(afu, CXL_MODE_DIRECTED))
			return -ENOMEM;
	}
	attach_spa(afu);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_AFU);
	cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L);

	afu->current_mode = CXL_MODE_DIRECTED;

	if ((rc = cxl_chardev_m_afu_add(afu)))
		return rc;

	if ((rc = cxl_sysfs_afu_m_add(afu)))
		goto err;

	if ((rc = cxl_chardev_s_afu_add(afu)))
		goto err1;

	return 0;
err1:
	cxl_sysfs_afu_m_remove(afu);
err:
	cxl_chardev_afu_remove(afu);
	return rc;
}

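/*
 * cxl_calculate_sr() builds the state register value the PSL uses when
 * handling faults on behalf of a context: endianness, master/problem
 * state, 64-bit mode and (on POWER9) the radix vs hash translation
 * style are all encoded here.
 */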
#ifdef CONFIG_CPU_LITTLE_ENDIAN
#define set_endian(sr) ((sr) |= CXL_PSL_SR_An_LE)
#else
#define set_endian(sr) ((sr) &= ~(CXL_PSL_SR_An_LE))
#endif

u64 cxl_calculate_sr(bool master, bool kernel, bool real_mode, bool p9)
{
	u64 sr = 0;

	set_endian(sr);
	if (master)
		sr |= CXL_PSL_SR_An_MP;
	if (mfspr(SPRN_LPCR) & LPCR_TC)
		sr |= CXL_PSL_SR_An_TC;
	if (kernel) {
		if (!real_mode)
			sr |= CXL_PSL_SR_An_R;
		sr |= (mfmsr() & MSR_SF) | CXL_PSL_SR_An_HV;
	} else {
		sr |= CXL_PSL_SR_An_PR | CXL_PSL_SR_An_R;
		if (radix_enabled())
			sr |= CXL_PSL_SR_An_HV;
		else
			sr &= ~(CXL_PSL_SR_An_HV);
		if (!test_tsk_thread_flag(current, TIF_32BIT))
			sr |= CXL_PSL_SR_An_SF;
	}
	if (p9) {
		if (radix_enabled())
			sr |= CXL_PSL_SR_An_XLAT_ror;
		else
			sr |= CXL_PSL_SR_An_XLAT_hpt;
	}
	return sr;
}

static u64 calculate_sr(struct cxl_context *ctx)
{
	return cxl_calculate_sr(ctx->master, ctx->kernel, ctx->real_mode,
				cxl_is_power9());
}

static void update_ivtes_directed(struct cxl_context *ctx)
{
	bool need_update = (ctx->status == STARTED);
	int r;

	if (need_update) {
		WARN_ON(terminate_process_element(ctx));
		WARN_ON(remove_process_element(ctx));
	}

	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]);
		ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]);
	}

	/*
	 * Theoretically we could use the update llcmd, instead of a
	 * terminate/remove/add (or if an atomic update was required we could
	 * do a suspend/update/resume), however it seems there might be issues
	 * with the update llcmd on some cards (including those using an XSL on
	 * an ASIC) so for now it's safest to go with the commands that are
	 * known to work. In the future if we come across a situation where the
	 * card may be performing transactions using the same PE while we are
	 * doing this update we might need to revisit this.
	 */
	if (need_update)
		WARN_ON(add_process_element(ctx));
}

static int process_element_entry_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	u32 pid;
	int rc;

	cxl_assign_psn_space(ctx);

	ctx->elem->ctxtime = 0; /* disable */
	ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID));
	ctx->elem->haurp = 0; /* disable */

	if (ctx->kernel) {
		pid = 0;
	} else {
		if (ctx->mm == NULL) {
			pr_devel("%s: unable to get mm for pe=%d pid=%i\n",
				 __func__, ctx->pe, pid_nr(ctx->pid));
			return -EINVAL;
		}
		pid = ctx->mm->context.id;
	}

	/* Assign a unique TIDR (thread id) for the current thread */
	if (!(ctx->tidr) && (ctx->assign_tidr)) {
		rc = set_thread_tidr(current);
		if (rc)
			return -ENODEV;
		ctx->tidr = current->thread.tidr;
		pr_devel("%s: current tidr: %d\n", __func__, ctx->tidr);
	}

	ctx->elem->common.tid = cpu_to_be32(ctx->tidr);
	ctx->elem->common.pid = cpu_to_be32(pid);

	ctx->elem->sr = cpu_to_be64(calculate_sr(ctx));

	ctx->elem->common.csrp = 0; /* disable */

	cxl_prefault(ctx, wed);

	/*
	 * Ensure we have the multiplexed PSL interrupt set up to take faults
	 * for kernel contexts that may not have allocated any AFU IRQs at all:
	 */
	if (ctx->irqs.range[0] == 0) {
		ctx->irqs.offset[0] = ctx->afu->native->psl_hwirq;
		ctx->irqs.range[0] = 1;
	}

	ctx->elem->common.amr = cpu_to_be64(amr);
	ctx->elem->common.wed = cpu_to_be64(wed);

	return 0;
}

int cxl_attach_afu_directed_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	int result;

	/* fill the process element entry */
	result = process_element_entry_psl9(ctx, wed, amr);
	if (result)
		return result;

	update_ivtes_directed(ctx);

	/* first guy needs to enable */
	result = cxl_ops->afu_check_and_enable(ctx->afu);
	if (result)
		return result;

	return add_process_element(ctx);
}

int cxl_attach_afu_directed_psl8(struct cxl_context *ctx, u64 wed, u64 amr)
{
	u32 pid;
	int result;

	cxl_assign_psn_space(ctx);

	ctx->elem->ctxtime = 0; /* disable */
	ctx->elem->lpid = cpu_to_be32(mfspr(SPRN_LPID));
	ctx->elem->haurp = 0; /* disable */
	ctx->elem->u.sdr = cpu_to_be64(mfspr(SPRN_SDR1));

	pid = current->pid;
	if (ctx->kernel)
		pid = 0;
	ctx->elem->common.tid = 0;
	ctx->elem->common.pid = cpu_to_be32(pid);

	ctx->elem->sr = cpu_to_be64(calculate_sr(ctx));

	ctx->elem->common.csrp = 0; /* disable */
	ctx->elem->common.u.psl8.aurp0 = 0; /* disable */
	ctx->elem->common.u.psl8.aurp1 = 0; /* disable */

	cxl_prefault(ctx, wed);

	ctx->elem->common.u.psl8.sstp0 = cpu_to_be64(ctx->sstp0);
	ctx->elem->common.u.psl8.sstp1 = cpu_to_be64(ctx->sstp1);

	/*
	 * Ensure we have the multiplexed PSL interrupt set up to take faults
	 * for kernel contexts that may not have allocated any AFU IRQs at all:
	 */
	if (ctx->irqs.range[0] == 0) {
		ctx->irqs.offset[0] = ctx->afu->native->psl_hwirq;
		ctx->irqs.range[0] = 1;
	}

	update_ivtes_directed(ctx);

	ctx->elem->common.amr = cpu_to_be64(amr);
	ctx->elem->common.wed = cpu_to_be64(wed);

	/* first guy needs to enable */
	if ((result = cxl_ops->afu_check_and_enable(ctx->afu)))
		return result;

	return add_process_element(ctx);
}

static int deactivate_afu_directed(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating AFU directed mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_sysfs_afu_m_remove(afu);
	cxl_chardev_afu_remove(afu);

	/*
	 * The CAIA section 2.2.1 indicates that the procedure for starting and
	 * stopping an AFU in AFU directed mode is AFU specific, which is not
	 * ideal since this code is generic and with one exception has no
	 * knowledge of the AFU. This is in contrast to the procedure for
	 * disabling a dedicated process AFU, which is documented to just
	 * require a reset. The architecture does indicate that both an AFU
	 * reset and an AFU disable should result in the AFU being disabled and
	 * we do both followed by a PSL purge for safety.
	 *
	 * Notably we used to have some issues with the disable sequence on PSL
	 * cards, which is why we ended up using this heavy weight procedure in
	 * the first place, however a bug was discovered that had rendered the
	 * disable operation ineffective, so it is conceivable that was the
	 * sole explanation for those difficulties. Careful regression testing
	 * is recommended if anyone attempts to remove or reorder these
	 * operations.
	 *
	 * The XSL on the Mellanox CX4 behaves a little differently from the
	 * PSL based cards and will time out an AFU reset if the AFU is still
	 * enabled. That card is special in that we do have a means to identify
	 * it from this code, so in that case we skip the reset and just use a
	 * disable/purge to avoid the timeout and corresponding noise in the
	 * kernel log.
	 */
	if (afu->adapter->native->sl_ops->needs_reset_before_disable)
		cxl_ops->afu_reset(afu);
	cxl_afu_disable(afu);
	cxl_psl_purge(afu);

	return 0;
}

int cxl_activate_dedicated_process_psl9(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Activating dedicated process mode\n");

	/*
	 * If XSL is set to dedicated mode (Set in PSL_SCNTL reg), the
	 * XSL and AFU are programmed to work with a single context.
	 * The context information should be configured in the SPA area
	 * index 0 (so PSL_SPAP must be configured before enabling the
	 * AFU).
	 */
	afu->num_procs = 1;
	if (afu->native->spa == NULL) {
		if (cxl_alloc_spa(afu, CXL_MODE_DEDICATED))
			return -ENOMEM;
	}
	attach_spa(afu);

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process);
	cxl_p1n_write(afu, CXL_PSL_ID_An, CXL_PSL_ID_An_F | CXL_PSL_ID_An_L);

	afu->current_mode = CXL_MODE_DEDICATED;

	return cxl_chardev_d_afu_add(afu);
}

int cxl_activate_dedicated_process_psl8(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Activating dedicated process mode\n");

	cxl_p1n_write(afu, CXL_PSL_SCNTL_An, CXL_PSL_SCNTL_An_PM_Process);

	cxl_p1n_write(afu, CXL_PSL_CtxTime_An, 0); /* disable */
	cxl_p1n_write(afu, CXL_PSL_SPAP_An, 0);    /* disable */
	cxl_p1n_write(afu, CXL_PSL_AMOR_An, 0xFFFFFFFFFFFFFFFFULL);
	cxl_p1n_write(afu, CXL_PSL_LPID_An, mfspr(SPRN_LPID));
	cxl_p1n_write(afu, CXL_HAURP_An, 0);       /* disable */
	cxl_p1n_write(afu, CXL_PSL_SDR_An, mfspr(SPRN_SDR1));

	cxl_p2n_write(afu, CXL_CSRP_An, 0);        /* disable */
	cxl_p2n_write(afu, CXL_AURP0_An, 0);       /* disable */
	cxl_p2n_write(afu, CXL_AURP1_An, 0);       /* disable */

	afu->current_mode = CXL_MODE_DEDICATED;
	afu->num_procs = 1;

	return cxl_chardev_d_afu_add(afu);
}

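/*
 * On PSL9 the interrupt vector table entries live in the (single-entry)
 * SPA, so updating the IVTEs for dedicated mode is a process element
 * update; on PSL8 they are instead programmed directly into the
 * per-slice IVTE offset/limit registers as four packed 16-bit fields.
 */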
void cxl_update_dedicated_ivtes_psl9(struct cxl_context *ctx)
{
	int r;

	for (r = 0; r < CXL_IRQ_RANGES; r++) {
		ctx->elem->ivte_offsets[r] = cpu_to_be16(ctx->irqs.offset[r]);
		ctx->elem->ivte_ranges[r] = cpu_to_be16(ctx->irqs.range[r]);
	}
}

void cxl_update_dedicated_ivtes_psl8(struct cxl_context *ctx)
{
	struct cxl_afu *afu = ctx->afu;

	cxl_p1n_write(afu, CXL_PSL_IVTE_Offset_An,
		      (((u64)ctx->irqs.offset[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.offset[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.offset[2] & 0xffff) << 16) |
		       ((u64)ctx->irqs.offset[3] & 0xffff));
	cxl_p1n_write(afu, CXL_PSL_IVTE_Limit_An, (u64)
		      (((u64)ctx->irqs.range[0] & 0xffff) << 48) |
		      (((u64)ctx->irqs.range[1] & 0xffff) << 32) |
		      (((u64)ctx->irqs.range[2] & 0xffff) << 16) |
		       ((u64)ctx->irqs.range[3] & 0xffff));
}

int cxl_attach_dedicated_process_psl9(struct cxl_context *ctx, u64 wed, u64 amr)
{
	int result;
	struct cxl_afu *afu = ctx->afu;

	/* fill the process element entry */
	result = process_element_entry_psl9(ctx, wed, amr);
	if (result)
		return result;

	if (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes)
		afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);

	ctx->elem->software_state = cpu_to_be32(CXL_PE_SOFTWARE_STATE_V);
	/*
	 * Ideally we should do a wmb() here to make sure the changes to the
	 * PE are visible to the card before we call afu_enable.
	 * On ppc64 though all mmios are preceded by a 'sync' instruction hence
	 * we don't need one here.
	 */

	result = cxl_ops->afu_reset(afu);
	if (result)
		return result;

	return afu_enable(afu);
}

int cxl_attach_dedicated_process_psl8(struct cxl_context *ctx, u64 wed, u64 amr)
{
	struct cxl_afu *afu = ctx->afu;
	u64 pid;
	int rc;

	pid = (u64)current->pid << 32;
	if (ctx->kernel)
		pid = 0;
	cxl_p2n_write(afu, CXL_PSL_PID_TID_An, pid);

	cxl_p1n_write(afu, CXL_PSL_SR_An, calculate_sr(ctx));

	if ((rc = cxl_write_sstp(afu, ctx->sstp0, ctx->sstp1)))
		return rc;

	cxl_prefault(ctx, wed);

	if (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes)
		afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);

	cxl_p2n_write(afu, CXL_PSL_AMR_An, amr);

	/* master only context for dedicated */
	cxl_assign_psn_space(ctx);

	if ((rc = cxl_ops->afu_reset(afu)))
		return rc;

	cxl_p2n_write(afu, CXL_PSL_WED_An, wed);

	return afu_enable(afu);
}

static int deactivate_dedicated_process(struct cxl_afu *afu)
{
	dev_info(&afu->dev, "Deactivating dedicated process mode\n");

	afu->current_mode = 0;
	afu->num_procs = 0;

	cxl_chardev_afu_remove(afu);

	return 0;
}

static int native_afu_deactivate_mode(struct cxl_afu *afu, int mode)
{
	if (mode == CXL_MODE_DIRECTED)
		return deactivate_afu_directed(afu);
	if (mode == CXL_MODE_DEDICATED)
		return deactivate_dedicated_process(afu);
	return 0;
}

static int native_afu_activate_mode(struct cxl_afu *afu, int mode)
{
	if (!mode)
		return 0;
	if (!(mode & afu->modes_supported))
		return -EINVAL;

	if (!cxl_ops->link_ok(afu->adapter, afu)) {
		WARN(1, "Device link is down, refusing to activate!\n");
		return -EIO;
	}

	if (mode == CXL_MODE_DIRECTED)
		return activate_afu_directed(afu);
	if ((mode == CXL_MODE_DEDICATED) &&
	    (afu->adapter->native->sl_ops->activate_dedicated_process))
		return afu->adapter->native->sl_ops->activate_dedicated_process(afu);

	return -EINVAL;
}

static int native_attach_process(struct cxl_context *ctx, bool kernel,
				 u64 wed, u64 amr)
{
	if (!cxl_ops->link_ok(ctx->afu->adapter, ctx->afu)) {
		WARN(1, "Device link is down, refusing to attach process!\n");
		return -EIO;
	}

	ctx->kernel = kernel;
	if ((ctx->afu->current_mode == CXL_MODE_DIRECTED) &&
	    (ctx->afu->adapter->native->sl_ops->attach_afu_directed))
		return ctx->afu->adapter->native->sl_ops->attach_afu_directed(ctx, wed, amr);

	if ((ctx->afu->current_mode == CXL_MODE_DEDICATED) &&
	    (ctx->afu->adapter->native->sl_ops->attach_dedicated_process))
		return ctx->afu->adapter->native->sl_ops->attach_dedicated_process(ctx, wed, amr);

	return -EINVAL;
}

static inline int detach_process_native_dedicated(struct cxl_context *ctx)
{
	/*
	 * The CAIA section 2.1.1 indicates that we need to do an AFU reset to
	 * stop the AFU in dedicated mode (we therefore do not make that
	 * optional like we do in the afu directed path). It does not indicate
	 * that we need to do an explicit disable (which should occur
	 * implicitly as part of the reset) or purge, but we do these as well
	 * to be on the safe side.
	 *
	 * Notably we used to have some issues with the disable sequence
	 * (before the sequence was spelled out in the architecture) which is
	 * why we were so heavy weight in the first place, however a bug was
	 * discovered that had rendered the disable operation ineffective, so
	 * it is conceivable that was the sole explanation for those
	 * difficulties. Point is, we should be careful and do some regression
	 * testing if we ever attempt to remove any part of this procedure.
	 */
	cxl_ops->afu_reset(ctx->afu);
	cxl_afu_disable(ctx->afu);
	cxl_psl_purge(ctx->afu);
	return 0;
}

static void native_update_ivtes(struct cxl_context *ctx)
{
	if (ctx->afu->current_mode == CXL_MODE_DIRECTED)
		return update_ivtes_directed(ctx);
	if ((ctx->afu->current_mode == CXL_MODE_DEDICATED) &&
	    (ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes))
		return ctx->afu->adapter->native->sl_ops->update_dedicated_ivtes(ctx);
	WARN(1, "native_update_ivtes: Bad mode\n");
}

static inline int detach_process_native_afu_directed(struct cxl_context *ctx)
{
	if (!ctx->pe_inserted)
		return 0;
	if (terminate_process_element(ctx))
		return -1;
	if (remove_process_element(ctx))
		return -1;

	return 0;
}

static int native_detach_process(struct cxl_context *ctx)
{
	trace_cxl_detach(ctx);

	if (ctx->afu->current_mode == CXL_MODE_DEDICATED)
		return detach_process_native_dedicated(ctx);

	return detach_process_native_afu_directed(ctx);
}

static int native_get_irq_info(struct cxl_afu *afu, struct cxl_irq_info *info)
{
	/* If the adapter has gone away, we can't get any meaningful
	 * information.
	 */
	if (!cxl_ops->link_ok(afu->adapter, afu))
		return -EIO;

	info->dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	info->dar = cxl_p2n_read(afu, CXL_PSL_DAR_An);
	if (cxl_is_power8())
		info->dsr = cxl_p2n_read(afu, CXL_PSL_DSR_An);
	info->afu_err = cxl_p2n_read(afu, CXL_AFU_ERR_An);
	info->errstat = cxl_p2n_read(afu, CXL_PSL_ErrStat_An);
	info->proc_handle = 0;

	return 0;
}

void cxl_native_irq_dump_regs_psl9(struct cxl_context *ctx)
{
	u64 fir1, serr;

	fir1 = cxl_p1_read(ctx->afu->adapter, CXL_PSL9_FIR1);

	dev_crit(&ctx->afu->dev, "PSL_FIR1: 0x%016llx\n", fir1);
	if (ctx->afu->adapter->native->sl_ops->register_serr_irq) {
		serr = cxl_p1n_read(ctx->afu, CXL_PSL_SERR_An);
		cxl_afu_decode_psl_serr(ctx->afu, serr);
	}
}

void cxl_native_irq_dump_regs_psl8(struct cxl_context *ctx)
{
	u64 fir1, fir2, fir_slice, serr, afu_debug;

	fir1 = cxl_p1_read(ctx->afu->adapter, CXL_PSL_FIR1);
	fir2 = cxl_p1_read(ctx->afu->adapter, CXL_PSL_FIR2);
	fir_slice = cxl_p1n_read(ctx->afu, CXL_PSL_FIR_SLICE_An);
	afu_debug = cxl_p1n_read(ctx->afu, CXL_AFU_DEBUG_An);

	dev_crit(&ctx->afu->dev, "PSL_FIR1: 0x%016llx\n", fir1);
	dev_crit(&ctx->afu->dev, "PSL_FIR2: 0x%016llx\n", fir2);
	if (ctx->afu->adapter->native->sl_ops->register_serr_irq) {
		serr = cxl_p1n_read(ctx->afu, CXL_PSL_SERR_An);
		cxl_afu_decode_psl_serr(ctx->afu, serr);
	}
	dev_crit(&ctx->afu->dev, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice);
	dev_crit(&ctx->afu->dev, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug);
}

static irqreturn_t native_handle_psl_slice_error(struct cxl_context *ctx,
						 u64 dsisr, u64 errstat)
{
	dev_crit(&ctx->afu->dev, "PSL ERROR STATUS: 0x%016llx\n", errstat);

	if (ctx->afu->adapter->native->sl_ops->psl_irq_dump_registers)
		ctx->afu->adapter->native->sl_ops->psl_irq_dump_registers(ctx);

	if (ctx->afu->adapter->native->sl_ops->debugfs_stop_trace) {
		dev_crit(&ctx->afu->dev, "STOPPING CXL TRACE\n");
		ctx->afu->adapter->native->sl_ops->debugfs_stop_trace(ctx->afu->adapter);
	}

	return cxl_ops->ack_irq(ctx, 0, errstat);
}

static bool cxl_is_translation_fault(struct cxl_afu *afu, u64 dsisr)
{
	if ((cxl_is_power8()) && (dsisr & CXL_PSL_DSISR_TRANS))
		return true;

	if ((cxl_is_power9()) && (dsisr & CXL_PSL9_DSISR_An_TF))
		return true;

	return false;
}

irqreturn_t cxl_fail_irq_psl(struct cxl_afu *afu, struct cxl_irq_info *irq_info)
{
	if (cxl_is_translation_fault(afu, irq_info->dsisr))
		cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_AE);
	else
		cxl_p2n_write(afu, CXL_PSL_TFC_An, CXL_PSL_TFC_An_A);

	return IRQ_HANDLED;
}

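/*
 * In AFU directed mode all contexts share one PSL interrupt.
 * native_irq_multiplexed() reads the PE handle register to discover
 * which context faulted, looks it up in the contexts IDR and hands the
 * interrupt to the slice's handle_interrupt() hook.
 */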
static irqreturn_t native_irq_multiplexed(int irq, void *data)
{
	struct cxl_afu *afu = data;
	struct cxl_context *ctx;
	struct cxl_irq_info irq_info;
	u64 phreg = cxl_p2n_read(afu, CXL_PSL_PEHandle_An);
	int ph, ret = IRQ_HANDLED, res;

	/* check if eeh kicked in while the interrupt was in flight */
	if (unlikely(phreg == ~0ULL)) {
		dev_warn(&afu->dev,
			 "Ignoring slice interrupt(%d) due to fenced card",
			 irq);
		return IRQ_HANDLED;
	}
	/* Mask the pe-handle from register value */
	ph = phreg & 0xffff;
	if ((res = native_get_irq_info(afu, &irq_info))) {
		WARN(1, "Unable to get CXL IRQ Info: %i\n", res);
		if (afu->adapter->native->sl_ops->fail_irq)
			return afu->adapter->native->sl_ops->fail_irq(afu, &irq_info);
		return ret;
	}

	rcu_read_lock();
	ctx = idr_find(&afu->contexts_idr, ph);
	if (ctx) {
		if (afu->adapter->native->sl_ops->handle_interrupt)
			ret = afu->adapter->native->sl_ops->handle_interrupt(irq, ctx, &irq_info);
		rcu_read_unlock();
		return ret;
	}
	rcu_read_unlock();

	WARN(1, "Unable to demultiplex CXL PSL IRQ for PE %i DSISR %016llx DAR"
		" %016llx\n(Possible AFU HW issue - was a term/remove acked"
		" with outstanding transactions?)\n", ph, irq_info.dsisr,
		irq_info.dar);
	if (afu->adapter->native->sl_ops->fail_irq)
		ret = afu->adapter->native->sl_ops->fail_irq(afu, &irq_info);
	return ret;
}

static void native_irq_wait(struct cxl_context *ctx)
{
	u64 dsisr;
	int timeout = 1000;
	int ph;

	/*
	 * Wait until no further interrupts are presented by the PSL
	 * for this context.
	 */
	while (timeout--) {
		ph = cxl_p2n_read(ctx->afu, CXL_PSL_PEHandle_An) & 0xffff;
		if (ph != ctx->pe)
			return;
		dsisr = cxl_p2n_read(ctx->afu, CXL_PSL_DSISR_An);
		if (cxl_is_power8() &&
		    ((dsisr & CXL_PSL_DSISR_PENDING) == 0))
			return;
		if (cxl_is_power9() &&
		    ((dsisr & CXL_PSL9_DSISR_PENDING) == 0))
			return;
		/*
		 * We are waiting for the workqueue to process our
		 * irq, so need to let that run here.
		 */
		msleep(1);
	}

	dev_warn(&ctx->afu->dev, "WARNING: waiting on DSI for PE %i"
		 " DSISR %016llx!\n", ph, dsisr);
	return;
}

static irqreturn_t native_slice_irq_err(int irq, void *data)
{
	struct cxl_afu *afu = data;
	u64 errstat, serr, afu_error, dsisr;
	u64 fir_slice, afu_debug, irq_mask;

	/*
	 * slice err interrupt is only used with full PSL (no XSL)
	 */
	serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
	errstat = cxl_p2n_read(afu, CXL_PSL_ErrStat_An);
	afu_error = cxl_p2n_read(afu, CXL_AFU_ERR_An);
	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	cxl_afu_decode_psl_serr(afu, serr);

	if (cxl_is_power8()) {
		fir_slice = cxl_p1n_read(afu, CXL_PSL_FIR_SLICE_An);
		afu_debug = cxl_p1n_read(afu, CXL_AFU_DEBUG_An);
		dev_crit(&afu->dev, "PSL_FIR_SLICE_An: 0x%016llx\n", fir_slice);
		dev_crit(&afu->dev, "CXL_PSL_AFU_DEBUG_An: 0x%016llx\n", afu_debug);
	}
	dev_crit(&afu->dev, "CXL_PSL_ErrStat_An: 0x%016llx\n", errstat);
	dev_crit(&afu->dev, "AFU_ERR_An: 0x%.16llx\n", afu_error);
	dev_crit(&afu->dev, "PSL_DSISR_An: 0x%.16llx\n", dsisr);

	/* mask off the IRQ so it won't retrigger until the AFU is reset */
	irq_mask = (serr & CXL_PSL_SERR_An_IRQS) >> 32;
	serr |= irq_mask;
	cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);
	dev_info(&afu->dev, "Further such interrupts will be masked until the AFU is reset\n");

	return IRQ_HANDLED;
}

void cxl_native_err_irq_dump_regs_psl9(struct cxl *adapter)
{
	u64 fir1;

	fir1 = cxl_p1_read(adapter, CXL_PSL9_FIR1);
	dev_crit(&adapter->dev, "PSL_FIR: 0x%016llx\n", fir1);
}

void cxl_native_err_irq_dump_regs_psl8(struct cxl *adapter)
{
	u64 fir1, fir2;

	fir1 = cxl_p1_read(adapter, CXL_PSL_FIR1);
	fir2 = cxl_p1_read(adapter, CXL_PSL_FIR2);
	dev_crit(&adapter->dev,
		 "PSL_FIR1: 0x%016llx\nPSL_FIR2: 0x%016llx\n",
		 fir1, fir2);
}

static irqreturn_t native_irq_err(int irq, void *data)
{
	struct cxl *adapter = data;
	u64 err_ivte;

	WARN(1, "CXL ERROR interrupt %i\n", irq);

	err_ivte = cxl_p1_read(adapter, CXL_PSL_ErrIVTE);
	dev_crit(&adapter->dev, "PSL_ErrIVTE: 0x%016llx\n", err_ivte);

	if (adapter->native->sl_ops->debugfs_stop_trace) {
		dev_crit(&adapter->dev, "STOPPING CXL TRACE\n");
		adapter->native->sl_ops->debugfs_stop_trace(adapter);
	}

	if (adapter->native->sl_ops->err_irq_dump_registers)
		adapter->native->sl_ops->err_irq_dump_registers(adapter);

	return IRQ_HANDLED;
}

int cxl_native_register_psl_err_irq(struct cxl *adapter)
{
	int rc;

	adapter->irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
				      dev_name(&adapter->dev));
	if (!adapter->irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(adapter, native_irq_err, adapter,
				       &adapter->native->err_hwirq,
				       &adapter->native->err_virq,
				       adapter->irq_name))) {
		kfree(adapter->irq_name);
		adapter->irq_name = NULL;
		return rc;
	}

	cxl_p1_write(adapter, CXL_PSL_ErrIVTE, adapter->native->err_hwirq & 0xffff);

	return 0;
}

void cxl_native_release_psl_err_irq(struct cxl *adapter)
{
	if (adapter->native->err_virq == 0 ||
	    adapter->native->err_virq !=
	    irq_find_mapping(NULL, adapter->native->err_hwirq))
		return;

	cxl_p1_write(adapter, CXL_PSL_ErrIVTE, 0x0000000000000000);
	cxl_unmap_irq(adapter->native->err_virq, adapter);
	cxl_ops->release_one_irq(adapter, adapter->native->err_hwirq);
	kfree(adapter->irq_name);
	adapter->native->err_virq = 0;
}

int cxl_native_register_serr_irq(struct cxl_afu *afu)
{
	u64 serr;
	int rc;

	afu->err_irq_name = kasprintf(GFP_KERNEL, "cxl-%s-err",
				      dev_name(&afu->dev));
	if (!afu->err_irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(afu->adapter, native_slice_irq_err, afu,
				       &afu->serr_hwirq,
				       &afu->serr_virq, afu->err_irq_name))) {
		kfree(afu->err_irq_name);
		afu->err_irq_name = NULL;
		return rc;
	}

	serr = cxl_p1n_read(afu, CXL_PSL_SERR_An);
	if (cxl_is_power8())
		serr = (serr & 0x00ffffffffff0000ULL) | (afu->serr_hwirq & 0xffff);
	if (cxl_is_power9()) {
		/*
		 * By default, all errors are masked. So don't set all masks.
		 * Slice errors will be transferred.
		 */
		serr = (serr & ~0xff0000007fffffffULL) | (afu->serr_hwirq & 0xffff);
	}
	cxl_p1n_write(afu, CXL_PSL_SERR_An, serr);

	return 0;
}

void cxl_native_release_serr_irq(struct cxl_afu *afu)
{
	if (afu->serr_virq == 0 ||
	    afu->serr_virq != irq_find_mapping(NULL, afu->serr_hwirq))
		return;

	cxl_p1n_write(afu, CXL_PSL_SERR_An, 0x0000000000000000);
	cxl_unmap_irq(afu->serr_virq, afu);
	cxl_ops->release_one_irq(afu->adapter, afu->serr_hwirq);
	kfree(afu->err_irq_name);
	afu->serr_virq = 0;
}

int cxl_native_register_psl_irq(struct cxl_afu *afu)
{
	int rc;

	afu->psl_irq_name = kasprintf(GFP_KERNEL, "cxl-%s",
				      dev_name(&afu->dev));
	if (!afu->psl_irq_name)
		return -ENOMEM;

	if ((rc = cxl_register_one_irq(afu->adapter, native_irq_multiplexed,
				       afu, &afu->native->psl_hwirq, &afu->native->psl_virq,
				       afu->psl_irq_name))) {
		kfree(afu->psl_irq_name);
		afu->psl_irq_name = NULL;
	}
	return rc;
}

void cxl_native_release_psl_irq(struct cxl_afu *afu)
{
	if (afu->native->psl_virq == 0 ||
	    afu->native->psl_virq !=
	    irq_find_mapping(NULL, afu->native->psl_hwirq))
		return;

	cxl_unmap_irq(afu->native->psl_virq, afu);
	cxl_ops->release_one_irq(afu->adapter, afu->native->psl_hwirq);
	kfree(afu->psl_irq_name);
	afu->native->psl_virq = 0;
}

static void recover_psl_err(struct cxl_afu *afu, u64 errstat)
{
	u64 dsisr;

	pr_devel("RECOVERING FROM PSL ERROR... (0x%016llx)\n", errstat);

	/* Clear PSL_DSISR[PE] */
	dsisr = cxl_p2n_read(afu, CXL_PSL_DSISR_An);
	cxl_p2n_write(afu, CXL_PSL_DSISR_An, dsisr & ~CXL_PSL_DSISR_An_PE);

	/* Write 1s to clear error status bits */
	cxl_p2n_write(afu, CXL_PSL_ErrStat_An, errstat);
}

static int native_ack_irq(struct cxl_context *ctx, u64 tfc, u64 psl_reset_mask)
{
	trace_cxl_psl_irq_ack(ctx, tfc);
	if (tfc)
		cxl_p2n_write(ctx->afu, CXL_PSL_TFC_An, tfc);
	if (psl_reset_mask)
		recover_psl_err(ctx->afu, psl_reset_mask);

	return 0;
}

int cxl_check_error(struct cxl_afu *afu)
{
	return (cxl_p1n_read(afu, CXL_PSL_SCNTL_An) == ~0ULL);
}

static bool native_support_attributes(const char *attr_name,
				      enum cxl_attrs type)
{
	return true;
}

static int native_afu_cr_read64(struct cxl_afu *afu, int cr, u64 off, u64 *out)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	*out = in_le64(afu->native->afu_desc_mmio + afu->crs_offset +
		(cr * afu->crs_len) + off);
	return 0;
}

static int native_afu_cr_read32(struct cxl_afu *afu, int cr, u64 off, u32 *out)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	*out = in_le32(afu->native->afu_desc_mmio + afu->crs_offset +
		(cr * afu->crs_len) + off);
	return 0;
}

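/*
 * Sub-word configuration record accessors: the 8- and 16-bit variants
 * below are built on aligned 32-bit MMIO reads (and read-modify-writes
 * on the store side), shifting and masking out the requested bytes.
 */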
static int native_afu_cr_read16(struct cxl_afu *afu, int cr, u64 off, u16 *out)
{
	u64 aligned_off = off & ~0x3L;
	u32 val;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val);
	if (!rc)
		*out = (val >> ((off & 0x3) * 8)) & 0xffff;
	return rc;
}

static int native_afu_cr_read8(struct cxl_afu *afu, int cr, u64 off, u8 *out)
{
	u64 aligned_off = off & ~0x3L;
	u32 val;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val);
	if (!rc)
		*out = (val >> ((off & 0x3) * 8)) & 0xff;
	return rc;
}

static int native_afu_cr_write32(struct cxl_afu *afu, int cr, u64 off, u32 in)
{
	if (unlikely(!cxl_ops->link_ok(afu->adapter, afu)))
		return -EIO;
	if (unlikely(off >= afu->crs_len))
		return -ERANGE;
	out_le32(afu->native->afu_desc_mmio + afu->crs_offset +
		(cr * afu->crs_len) + off, in);
	return 0;
}

static int native_afu_cr_write16(struct cxl_afu *afu, int cr, u64 off, u16 in)
{
	u64 aligned_off = off & ~0x3L;
	u32 val32, mask, shift;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val32);
	if (rc)
		return rc;
	shift = (off & 0x3) * 8;
	WARN_ON(shift == 24);
	mask = 0xffff << shift;
	val32 = (val32 & ~mask) | (in << shift);

	rc = native_afu_cr_write32(afu, cr, aligned_off, val32);
	return rc;
}

static int native_afu_cr_write8(struct cxl_afu *afu, int cr, u64 off, u8 in)
{
	u64 aligned_off = off & ~0x3L;
	u32 val32, mask, shift;
	int rc;

	rc = native_afu_cr_read32(afu, cr, aligned_off, &val32);
	if (rc)
		return rc;
	shift = (off & 0x3) * 8;
	mask = 0xff << shift;
	val32 = (val32 & ~mask) | (in << shift);

	rc = native_afu_cr_write32(afu, cr, aligned_off, val32);
	return rc;
}

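/*
 * Backend ops used when the driver runs on bare metal (PowerNV) and
 * drives the card's registers directly, as opposed to the hcall-based
 * guest backend.
 */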
const struct cxl_backend_ops cxl_native_ops = {
	.module = THIS_MODULE,
	.adapter_reset = cxl_pci_reset,
	.alloc_one_irq = cxl_pci_alloc_one_irq,
	.release_one_irq = cxl_pci_release_one_irq,
	.alloc_irq_ranges = cxl_pci_alloc_irq_ranges,
	.release_irq_ranges = cxl_pci_release_irq_ranges,
	.setup_irq = cxl_pci_setup_irq,
	.handle_psl_slice_error = native_handle_psl_slice_error,
	.psl_interrupt = NULL,
	.ack_irq = native_ack_irq,
	.irq_wait = native_irq_wait,
	.attach_process = native_attach_process,
	.detach_process = native_detach_process,
	.update_ivtes = native_update_ivtes,
	.support_attributes = native_support_attributes,
	.link_ok = cxl_adapter_link_ok,
	.release_afu = cxl_pci_release_afu,
	.afu_read_err_buffer = cxl_pci_afu_read_err_buffer,
	.afu_check_and_enable = native_afu_check_and_enable,
	.afu_activate_mode = native_afu_activate_mode,
	.afu_deactivate_mode = native_afu_deactivate_mode,
	.afu_reset = native_afu_reset,
	.afu_cr_read8 = native_afu_cr_read8,
	.afu_cr_read16 = native_afu_cr_read16,
	.afu_cr_read32 = native_afu_cr_read32,
	.afu_cr_read64 = native_afu_cr_read64,
	.afu_cr_write8 = native_afu_cr_write8,
	.afu_cr_write16 = native_afu_cr_write16,
	.afu_cr_write32 = native_afu_cr_write32,
	.read_adapter_vpd = cxl_pci_read_adapter_vpd,
};