1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Driver for IBM PowerNV compression accelerator
5 * Copyright (C) 2015 Dan Streetman, IBM Corp
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
12 #include <linux/timer.h>
15 #include <asm/icswx.h>
18 #include <asm/opal-api.h>
21 MODULE_LICENSE("GPL");
22 MODULE_AUTHOR("Dan Streetman <ddstreet@ieee.org>");
23 MODULE_DESCRIPTION("H/W Compression driver for IBM PowerNV processors");
24 MODULE_ALIAS_CRYPTO("842");
25 MODULE_ALIAS_CRYPTO("842-nx");
27 #define WORKMEM_ALIGN (CRB_ALIGN)
28 #define CSB_WAIT_MAX (5000) /* ms */
29 #define VAS_RETRIES (10)
31 struct nx842_workmem
{
32 /* Below fields must be properly aligned */
33 struct coprocessor_request_block crb
; /* CRB_ALIGN align */
34 struct data_descriptor_entry ddl_in
[DDL_LEN_MAX
]; /* DDE_ALIGN align */
35 struct data_descriptor_entry ddl_out
[DDL_LEN_MAX
]; /* DDE_ALIGN align */
36 /* Above fields must be properly aligned */
40 char padding
[WORKMEM_ALIGN
]; /* unused, to allow alignment */
41 } __packed
__aligned(WORKMEM_ALIGN
);
45 unsigned int ct
; /* Can be 842 or GZIP high/normal*/
46 unsigned int ci
; /* Coprocessor instance, used with icswx */
48 struct vas_window
*rxwin
;
51 struct list_head list
;
55 * Send the request to NX engine on the chip for the corresponding CPU
56 * where the process is executing. Use with VAS function.
58 static DEFINE_PER_CPU(struct vas_window
*, cpu_txwin
);
60 /* no cpu hotplug on powernv, so this list never changes after init */
61 static LIST_HEAD(nx_coprocs
);
62 static unsigned int nx842_ct
; /* used in icswx function */
65 * Using same values as in skiboot or coprocessor type representing
68 #define NX_CT_GZIP (2) /* on P9 and later */
71 static int (*nx842_powernv_exec
)(const unsigned char *in
,
72 unsigned int inlen
, unsigned char *out
,
73 unsigned int *outlenp
, void *workmem
, int fc
);
76 * setup_indirect_dde - Setup an indirect DDE
78 * The DDE is setup with the DDE count, byte count, and address of
79 * first direct DDE in the list.
81 static void setup_indirect_dde(struct data_descriptor_entry
*dde
,
82 struct data_descriptor_entry
*ddl
,
83 unsigned int dde_count
, unsigned int byte_count
)
86 dde
->count
= dde_count
;
88 dde
->length
= cpu_to_be32(byte_count
);
89 dde
->address
= cpu_to_be64(nx842_get_pa(ddl
));
93 * setup_direct_dde - Setup single DDE from buffer
95 * The DDE is setup with the buffer and length. The buffer must be properly
96 * aligned. The used length is returned.
98 * N Successfully set up DDE with N bytes
100 static unsigned int setup_direct_dde(struct data_descriptor_entry
*dde
,
101 unsigned long pa
, unsigned int len
)
103 unsigned int l
= min_t(unsigned int, len
, LEN_ON_PAGE(pa
));
108 dde
->length
= cpu_to_be32(l
);
109 dde
->address
= cpu_to_be64(pa
);
115 * setup_ddl - Setup DDL from buffer
118 * 0 Successfully set up DDL
120 static int setup_ddl(struct data_descriptor_entry
*dde
,
121 struct data_descriptor_entry
*ddl
,
122 unsigned char *buf
, unsigned int len
,
125 unsigned long pa
= nx842_get_pa(buf
);
126 int i
, ret
, total_len
= len
;
128 if (!IS_ALIGNED(pa
, DDE_BUFFER_ALIGN
)) {
129 pr_debug("%s buffer pa 0x%lx not 0x%x-byte aligned\n",
130 in
? "input" : "output", pa
, DDE_BUFFER_ALIGN
);
134 /* only need to check last mult; since buffer must be
135 * DDE_BUFFER_ALIGN aligned, and that is a multiple of
136 * DDE_BUFFER_SIZE_MULT, and pre-last page DDE buffers
137 * are guaranteed a multiple of DDE_BUFFER_SIZE_MULT.
139 if (len
% DDE_BUFFER_LAST_MULT
) {
140 pr_debug("%s buffer len 0x%x not a multiple of 0x%x\n",
141 in
? "input" : "output", len
, DDE_BUFFER_LAST_MULT
);
144 len
= round_down(len
, DDE_BUFFER_LAST_MULT
);
147 /* use a single direct DDE */
148 if (len
<= LEN_ON_PAGE(pa
)) {
149 ret
= setup_direct_dde(dde
, pa
, len
);
155 for (i
= 0; i
< DDL_LEN_MAX
&& len
> 0; i
++) {
156 ret
= setup_direct_dde(&ddl
[i
], pa
, len
);
159 pa
= nx842_get_pa(buf
);
163 pr_debug("0x%x total %s bytes 0x%x too many for DDL.\n",
164 total_len
, in
? "input" : "output", len
);
169 setup_indirect_dde(dde
, ddl
, i
, total_len
);
174 #define CSB_ERR(csb, msg, ...) \
175 pr_err("ERROR: " msg " : %02x %02x %02x %02x %08x\n", \
176 ##__VA_ARGS__, (csb)->flags, \
177 (csb)->cs, (csb)->cc, (csb)->ce, \
178 be32_to_cpu((csb)->count))
180 #define CSB_ERR_ADDR(csb, msg, ...) \
181 CSB_ERR(csb, msg " at %lx", ##__VA_ARGS__, \
182 (unsigned long)be64_to_cpu((csb)->address))
184 static int wait_for_csb(struct nx842_workmem
*wmem
,
185 struct coprocessor_status_block
*csb
)
187 ktime_t start
= wmem
->start
, now
= ktime_get();
188 ktime_t timeout
= ktime_add_ms(start
, CSB_WAIT_MAX
);
190 while (!(READ_ONCE(csb
->flags
) & CSB_V
)) {
193 if (ktime_after(now
, timeout
))
197 /* hw has updated csb and output buffer */
200 /* check CSB flags */
201 if (!(csb
->flags
& CSB_V
)) {
202 CSB_ERR(csb
, "CSB still not valid after %ld us, giving up",
203 (long)ktime_us_delta(now
, start
));
206 if (csb
->flags
& CSB_F
) {
207 CSB_ERR(csb
, "Invalid CSB format");
210 if (csb
->flags
& CSB_CH
) {
211 CSB_ERR(csb
, "Invalid CSB chaining state");
215 /* verify CSB completion sequence is 0 */
217 CSB_ERR(csb
, "Invalid CSB completion sequence");
221 /* check CSB Completion Code */
226 case CSB_CC_TPBC_GT_SPBC
:
227 /* not an error, but the compressed data is
228 * larger than the uncompressed data :(
232 /* input data errors */
233 case CSB_CC_OPERAND_OVERLAP
:
234 /* input and output buffers overlap */
235 CSB_ERR(csb
, "Operand Overlap error");
237 case CSB_CC_INVALID_OPERAND
:
238 CSB_ERR(csb
, "Invalid operand");
241 /* output buffer too small */
244 CSB_ERR(csb
, "Function aborted");
246 case CSB_CC_CRC_MISMATCH
:
247 CSB_ERR(csb
, "CRC mismatch");
249 case CSB_CC_TEMPL_INVALID
:
250 CSB_ERR(csb
, "Compressed data template invalid");
252 case CSB_CC_TEMPL_OVERFLOW
:
253 CSB_ERR(csb
, "Compressed data template shows data past end");
255 case CSB_CC_EXCEED_BYTE_COUNT
: /* P9 or later */
257 * DDE byte count exceeds the limit specified in Maximum
258 * byte count register.
260 CSB_ERR(csb
, "DDE byte count exceeds the limit");
263 /* these should not happen */
264 case CSB_CC_INVALID_ALIGN
:
265 /* setup_ddl should have detected this */
266 CSB_ERR_ADDR(csb
, "Invalid alignment");
268 case CSB_CC_DATA_LENGTH
:
269 /* setup_ddl should have detected this */
270 CSB_ERR(csb
, "Invalid data length");
272 case CSB_CC_WR_TRANSLATION
:
273 case CSB_CC_TRANSLATION
:
274 case CSB_CC_TRANSLATION_DUP1
:
275 case CSB_CC_TRANSLATION_DUP2
:
276 case CSB_CC_TRANSLATION_DUP3
:
277 case CSB_CC_TRANSLATION_DUP4
:
278 case CSB_CC_TRANSLATION_DUP5
:
279 case CSB_CC_TRANSLATION_DUP6
:
280 /* should not happen, we use physical addrs */
281 CSB_ERR_ADDR(csb
, "Translation error");
283 case CSB_CC_WR_PROTECTION
:
284 case CSB_CC_PROTECTION
:
285 case CSB_CC_PROTECTION_DUP1
:
286 case CSB_CC_PROTECTION_DUP2
:
287 case CSB_CC_PROTECTION_DUP3
:
288 case CSB_CC_PROTECTION_DUP4
:
289 case CSB_CC_PROTECTION_DUP5
:
290 case CSB_CC_PROTECTION_DUP6
:
291 /* should not happen, we use physical addrs */
292 CSB_ERR_ADDR(csb
, "Protection error");
294 case CSB_CC_PRIVILEGE
:
295 /* shouldn't happen, we're in HYP mode */
296 CSB_ERR(csb
, "Insufficient Privilege error");
298 case CSB_CC_EXCESSIVE_DDE
:
299 /* shouldn't happen, setup_ddl doesn't use many dde's */
300 CSB_ERR(csb
, "Too many DDEs in DDL");
302 case CSB_CC_TRANSPORT
:
303 case CSB_CC_INVALID_CRB
: /* P9 or later */
304 /* shouldn't happen, we setup CRB correctly */
305 CSB_ERR(csb
, "Invalid CRB");
307 case CSB_CC_INVALID_DDE
: /* P9 or later */
309 * shouldn't happen, setup_direct/indirect_dde creates
312 CSB_ERR(csb
, "Invalid DDE");
314 case CSB_CC_SEGMENTED_DDL
:
315 /* shouldn't happen, setup_ddl creates DDL right */
316 CSB_ERR(csb
, "Segmented DDL error");
318 case CSB_CC_DDE_OVERFLOW
:
319 /* shouldn't happen, setup_ddl creates DDL right */
320 CSB_ERR(csb
, "DDE overflow error");
323 /* should not happen with ICSWX */
324 CSB_ERR(csb
, "Session violation error");
327 /* should not happen, we don't use chained CRBs */
328 CSB_ERR(csb
, "Chained CRB error");
330 case CSB_CC_SEQUENCE
:
331 /* should not happen, we don't use chained CRBs */
332 CSB_ERR(csb
, "CRB sequence number error");
334 case CSB_CC_UNKNOWN_CODE
:
335 CSB_ERR(csb
, "Unknown subfunction code");
338 /* hardware errors */
339 case CSB_CC_RD_EXTERNAL
:
340 case CSB_CC_RD_EXTERNAL_DUP1
:
341 case CSB_CC_RD_EXTERNAL_DUP2
:
342 case CSB_CC_RD_EXTERNAL_DUP3
:
343 CSB_ERR_ADDR(csb
, "Read error outside coprocessor");
345 case CSB_CC_WR_EXTERNAL
:
346 CSB_ERR_ADDR(csb
, "Write error outside coprocessor");
348 case CSB_CC_INTERNAL
:
349 CSB_ERR(csb
, "Internal error in coprocessor");
351 case CSB_CC_PROVISION
:
352 CSB_ERR(csb
, "Storage provision error");
355 CSB_ERR(csb
, "Correctable hardware error");
357 case CSB_CC_HW_EXPIRED_TIMER
: /* P9 or later */
358 CSB_ERR(csb
, "Job did not finish within allowed time");
362 CSB_ERR(csb
, "Invalid CC %d", csb
->cc
);
366 /* check Completion Extension state */
367 if (csb
->ce
& CSB_CE_TERMINATION
) {
368 CSB_ERR(csb
, "CSB request was terminated");
371 if (csb
->ce
& CSB_CE_INCOMPLETE
) {
372 CSB_ERR(csb
, "CSB request not complete");
375 if (!(csb
->ce
& CSB_CE_TPBC
)) {
376 CSB_ERR(csb
, "TPBC not provided, unknown target length");
380 /* successful completion */
381 pr_debug_ratelimited("Processed %u bytes in %lu us\n",
382 be32_to_cpu(csb
->count
),
383 (unsigned long)ktime_us_delta(now
, start
));
388 static int nx842_config_crb(const unsigned char *in
, unsigned int inlen
,
389 unsigned char *out
, unsigned int outlen
,
390 struct nx842_workmem
*wmem
)
392 struct coprocessor_request_block
*crb
;
393 struct coprocessor_status_block
*csb
;
400 /* Clear any previous values */
401 memset(crb
, 0, sizeof(*crb
));
404 ret
= setup_ddl(&crb
->source
, wmem
->ddl_in
,
405 (unsigned char *)in
, inlen
, true);
409 ret
= setup_ddl(&crb
->target
, wmem
->ddl_out
,
414 /* set up CRB's CSB addr */
415 csb_addr
= nx842_get_pa(csb
) & CRB_CSB_ADDRESS
;
416 csb_addr
|= CRB_CSB_AT
; /* Addrs are phys */
417 crb
->csb_addr
= cpu_to_be64(csb_addr
);
423 * nx842_exec_icswx - compress/decompress data using the 842 algorithm
425 * (De)compression provided by the NX842 coprocessor on IBM PowerNV systems.
426 * This compresses or decompresses the provided input buffer into the provided
429 * Upon return from this function @outlen contains the length of the
430 * output data. If there is an error then @outlen will be 0 and an
431 * error will be specified by the return code from this function.
433 * The @workmem buffer should only be used by one function call at a time.
435 * @in: input buffer pointer
436 * @inlen: input buffer size
437 * @out: output buffer pointer
438 * @outlenp: output buffer size pointer
439 * @workmem: working memory buffer pointer, size determined by
440 * nx842_powernv_driver.workmem_size
441 * @fc: function code, see CCW Function Codes in nx-842.h
444 * 0 Success, output of length @outlenp stored in the buffer at @out
445 * -ENODEV Hardware unavailable
446 * -ENOSPC Output buffer is too small
447 * -EMSGSIZE Input buffer too large
448 * -EINVAL buffer constraints do not fit nx842_constraints
449 * -EPROTO hardware error during operation
450 * -ETIMEDOUT hardware did not complete operation in reasonable time
451 * -EINTR operation was aborted
453 static int nx842_exec_icswx(const unsigned char *in
, unsigned int inlen
,
454 unsigned char *out
, unsigned int *outlenp
,
455 void *workmem
, int fc
)
457 struct coprocessor_request_block
*crb
;
458 struct coprocessor_status_block
*csb
;
459 struct nx842_workmem
*wmem
;
462 unsigned int outlen
= *outlenp
;
464 wmem
= PTR_ALIGN(workmem
, WORKMEM_ALIGN
);
468 /* shouldn't happen, we don't load without a coproc */
470 pr_err_ratelimited("coprocessor CT is 0");
474 ret
= nx842_config_crb(in
, inlen
, out
, outlen
, wmem
);
483 ccw
= SET_FIELD(CCW_CT
, ccw
, nx842_ct
);
484 ccw
= SET_FIELD(CCW_CI_842
, ccw
, 0); /* use 0 for hw auto-selection */
485 ccw
= SET_FIELD(CCW_FC_842
, ccw
, fc
);
487 wmem
->start
= ktime_get();
490 ret
= icswx(cpu_to_be32(ccw
), crb
);
492 pr_debug_ratelimited("icswx CR %x ccw %x crb->ccw %x\n", ret
,
494 (unsigned int)be32_to_cpu(crb
->ccw
));
497 * NX842 coprocessor sets 3rd bit in CR register with XER[SO].
498 * XER[SO] is the integer summary overflow bit, which has nothing
499 * to do with NX. Since this bit can be set with other return values,
505 case ICSWX_INITIATED
:
506 ret
= wait_for_csb(wmem
, csb
);
509 pr_debug_ratelimited("842 Coprocessor busy\n");
513 pr_err_ratelimited("ICSWX rejected\n");
519 *outlenp
= be32_to_cpu(csb
->count
);
525 * nx842_exec_vas - compress/decompress data using the 842 algorithm
527 * (De)compression provided by the NX842 coprocessor on IBM PowerNV systems.
528 * This compresses or decompresses the provided input buffer into the provided
531 * Upon return from this function @outlen contains the length of the
532 * output data. If there is an error then @outlen will be 0 and an
533 * error will be specified by the return code from this function.
535 * The @workmem buffer should only be used by one function call at a time.
537 * @in: input buffer pointer
538 * @inlen: input buffer size
539 * @out: output buffer pointer
540 * @outlenp: output buffer size pointer
541 * @workmem: working memory buffer pointer, size determined by
542 * nx842_powernv_driver.workmem_size
543 * @fc: function code, see CCW Function Codes in nx-842.h
546 * 0 Success, output of length @outlenp stored in the buffer
548 * -ENODEV Hardware unavailable
549 * -ENOSPC Output buffer is too small
550 * -EMSGSIZE Input buffer too large
551 * -EINVAL buffer constraints do not fit nx842_constraints
552 * -EPROTO hardware error during operation
553 * -ETIMEDOUT hardware did not complete operation in reasonable time
554 * -EINTR operation was aborted
556 static int nx842_exec_vas(const unsigned char *in
, unsigned int inlen
,
557 unsigned char *out
, unsigned int *outlenp
,
558 void *workmem
, int fc
)
560 struct coprocessor_request_block
*crb
;
561 struct coprocessor_status_block
*csb
;
562 struct nx842_workmem
*wmem
;
563 struct vas_window
*txwin
;
566 unsigned int outlen
= *outlenp
;
568 wmem
= PTR_ALIGN(workmem
, WORKMEM_ALIGN
);
575 ret
= nx842_config_crb(in
, inlen
, out
, outlen
, wmem
);
580 ccw
= SET_FIELD(CCW_FC_842
, ccw
, fc
);
581 crb
->ccw
= cpu_to_be32(ccw
);
584 wmem
->start
= ktime_get();
586 txwin
= this_cpu_read(cpu_txwin
);
589 * VAS copy CRB into L2 cache. Refer <asm/vas.h>.
592 vas_copy_crb(crb
, 0);
595 * VAS paste previously copied CRB to NX.
596 * @txwin, @offset and @last (must be true).
598 ret
= vas_paste_crb(txwin
, 0, 1);
601 * Retry copy/paste function for VAS failures.
603 } while (ret
&& (i
++ < VAS_RETRIES
));
606 pr_err_ratelimited("VAS copy/paste failed\n");
610 ret
= wait_for_csb(wmem
, csb
);
612 *outlenp
= be32_to_cpu(csb
->count
);
618 * nx842_powernv_compress - Compress data using the 842 algorithm
620 * Compression provided by the NX842 coprocessor on IBM PowerNV systems.
621 * The input buffer is compressed and the result is stored in the
622 * provided output buffer.
624 * Upon return from this function @outlen contains the length of the
625 * compressed data. If there is an error then @outlen will be 0 and an
626 * error will be specified by the return code from this function.
628 * @in: input buffer pointer
629 * @inlen: input buffer size
630 * @out: output buffer pointer
631 * @outlenp: output buffer size pointer
632 * @wmem: working memory buffer pointer, size determined by
633 * nx842_powernv_driver.workmem_size
635 * Returns: see @nx842_powernv_exec()
637 static int nx842_powernv_compress(const unsigned char *in
, unsigned int inlen
,
638 unsigned char *out
, unsigned int *outlenp
,
641 return nx842_powernv_exec(in
, inlen
, out
, outlenp
,
642 wmem
, CCW_FC_842_COMP_CRC
);
646 * nx842_powernv_decompress - Decompress data using the 842 algorithm
648 * Decompression provided by the NX842 coprocessor on IBM PowerNV systems.
649 * The input buffer is decompressed and the result is stored in the
650 * provided output buffer.
652 * Upon return from this function @outlen contains the length of the
653 * decompressed data. If there is an error then @outlen will be 0 and an
654 * error will be specified by the return code from this function.
656 * @in: input buffer pointer
657 * @inlen: input buffer size
658 * @out: output buffer pointer
659 * @outlenp: output buffer size pointer
660 * @wmem: working memory buffer pointer, size determined by
661 * nx842_powernv_driver.workmem_size
663 * Returns: see @nx842_powernv_exec()
665 static int nx842_powernv_decompress(const unsigned char *in
, unsigned int inlen
,
666 unsigned char *out
, unsigned int *outlenp
,
669 return nx842_powernv_exec(in
, inlen
, out
, outlenp
,
670 wmem
, CCW_FC_842_DECOMP_CRC
);
673 static inline void nx_add_coprocs_list(struct nx_coproc
*coproc
,
676 coproc
->chip_id
= chipid
;
677 INIT_LIST_HEAD(&coproc
->list
);
678 list_add(&coproc
->list
, &nx_coprocs
);
681 static struct vas_window
*nx_alloc_txwin(struct nx_coproc
*coproc
)
683 struct vas_window
*txwin
= NULL
;
684 struct vas_tx_win_attr txattr
;
687 * Kernel requests will be high priority. So open send
688 * windows only for high priority RxFIFO entries.
690 vas_init_tx_win_attr(&txattr
, coproc
->ct
);
691 txattr
.lpid
= 0; /* lpid is 0 for kernel requests */
694 * Open a VAS send window which is used to send request to NX.
696 txwin
= vas_tx_win_open(coproc
->vas
.id
, coproc
->ct
, &txattr
);
698 pr_err("ibm,nx-842: Can not open TX window: %ld\n",
705 * Identify chip ID for each CPU, open send window for the corresponding NX
706 * engine and save txwin in percpu cpu_txwin.
707 * cpu_txwin is used in copy/paste operation for each compression /
708 * decompression request.
710 static int nx_open_percpu_txwins(void)
712 struct nx_coproc
*coproc
, *n
;
713 unsigned int i
, chip_id
;
715 for_each_possible_cpu(i
) {
716 struct vas_window
*txwin
= NULL
;
718 chip_id
= cpu_to_chip_id(i
);
720 list_for_each_entry_safe(coproc
, n
, &nx_coprocs
, list
) {
722 * Kernel requests use only high priority FIFOs. So
723 * open send windows for these FIFOs.
724 * GZIP is not supported in kernel right now.
727 if (coproc
->ct
!= VAS_COP_TYPE_842_HIPRI
)
730 if (coproc
->chip_id
== chip_id
) {
731 txwin
= nx_alloc_txwin(coproc
);
733 return PTR_ERR(txwin
);
735 per_cpu(cpu_txwin
, i
) = txwin
;
740 if (!per_cpu(cpu_txwin
, i
)) {
741 /* shouldn't happen, Each chip will have NX engine */
742 pr_err("NX engine is not available for CPU %d\n", i
);
750 static int __init
nx_set_ct(struct nx_coproc
*coproc
, const char *priority
,
751 int high
, int normal
)
753 if (!strcmp(priority
, "High"))
755 else if (!strcmp(priority
, "Normal"))
758 pr_err("Invalid RxFIFO priority value\n");
765 static int __init
vas_cfg_coproc_info(struct device_node
*dn
, int chip_id
,
766 int vasid
, int type
, int *ct
)
768 struct vas_window
*rxwin
= NULL
;
769 struct vas_rx_win_attr rxattr
;
770 u32 lpid
, pid
, tid
, fifo_size
;
771 struct nx_coproc
*coproc
;
773 const char *priority
;
776 ret
= of_property_read_u64(dn
, "rx-fifo-address", &rx_fifo
);
778 pr_err("Missing rx-fifo-address property\n");
782 ret
= of_property_read_u32(dn
, "rx-fifo-size", &fifo_size
);
784 pr_err("Missing rx-fifo-size property\n");
788 ret
= of_property_read_u32(dn
, "lpid", &lpid
);
790 pr_err("Missing lpid property\n");
794 ret
= of_property_read_u32(dn
, "pid", &pid
);
796 pr_err("Missing pid property\n");
800 ret
= of_property_read_u32(dn
, "tid", &tid
);
802 pr_err("Missing tid property\n");
806 ret
= of_property_read_string(dn
, "priority", &priority
);
808 pr_err("Missing priority property\n");
812 coproc
= kzalloc(sizeof(*coproc
), GFP_KERNEL
);
816 if (type
== NX_CT_842
)
817 ret
= nx_set_ct(coproc
, priority
, VAS_COP_TYPE_842_HIPRI
,
819 else if (type
== NX_CT_GZIP
)
820 ret
= nx_set_ct(coproc
, priority
, VAS_COP_TYPE_GZIP_HIPRI
,
826 vas_init_rx_win_attr(&rxattr
, coproc
->ct
);
827 rxattr
.rx_fifo
= rx_fifo
;
828 rxattr
.rx_fifo_size
= fifo_size
;
829 rxattr
.lnotify_lpid
= lpid
;
830 rxattr
.lnotify_pid
= pid
;
831 rxattr
.lnotify_tid
= tid
;
833 * Maximum RX window credits can not be more than #CRBs in
834 * RxFIFO. Otherwise, can get checkstop if RxFIFO overruns.
836 rxattr
.wcreds_max
= fifo_size
/ CRB_SIZE
;
839 * Open a VAS receive window which is used to configure RxFIFO
842 rxwin
= vas_rx_win_open(vasid
, coproc
->ct
, &rxattr
);
844 ret
= PTR_ERR(rxwin
);
845 pr_err("setting RxFIFO with VAS failed: %d\n",
850 coproc
->vas
.rxwin
= rxwin
;
851 coproc
->vas
.id
= vasid
;
852 nx_add_coprocs_list(coproc
, chip_id
);
855 * (lpid, pid, tid) combination has to be unique for each
856 * coprocessor instance in the system. So to make it
857 * unique, skiboot uses coprocessor type such as 842 or
858 * GZIP for pid and provides this value to kernel in pid
859 * device-tree property.
870 static int __init
nx_coproc_init(int chip_id
, int ct_842
, int ct_gzip
)
874 if (opal_check_token(OPAL_NX_COPROC_INIT
)) {
875 ret
= opal_nx_coproc_init(chip_id
, ct_842
);
878 ret
= opal_nx_coproc_init(chip_id
, ct_gzip
);
881 ret
= opal_error_code(ret
);
882 pr_err("Failed to initialize NX for chip(%d): %d\n",
886 pr_warn("Firmware doesn't support NX initialization\n");
891 static int __init
find_nx_device_tree(struct device_node
*dn
, int chip_id
,
892 int vasid
, int type
, char *devname
,
897 if (of_device_is_compatible(dn
, devname
)) {
898 ret
= vas_cfg_coproc_info(dn
, chip_id
, vasid
, type
, ct
);
906 static int __init
nx_powernv_probe_vas(struct device_node
*pn
)
908 int chip_id
, vasid
, ret
= 0;
909 int ct_842
= 0, ct_gzip
= 0;
910 struct device_node
*dn
;
912 chip_id
= of_get_ibm_chip_id(pn
);
914 pr_err("ibm,chip-id missing\n");
918 vasid
= chip_to_vas_id(chip_id
);
920 pr_err("Unable to map chip_id %d to vasid\n", chip_id
);
924 for_each_child_of_node(pn
, dn
) {
925 ret
= find_nx_device_tree(dn
, chip_id
, vasid
, NX_CT_842
,
926 "ibm,p9-nx-842", &ct_842
);
929 ret
= find_nx_device_tree(dn
, chip_id
, vasid
,
930 NX_CT_GZIP
, "ibm,p9-nx-gzip", &ct_gzip
);
938 if (!ct_842
|| !ct_gzip
) {
939 pr_err("NX FIFO nodes are missing\n");
944 * Initialize NX instance for both high and normal priority FIFOs.
946 ret
= nx_coproc_init(chip_id
, ct_842
, ct_gzip
);
951 static int __init
nx842_powernv_probe(struct device_node
*dn
)
953 struct nx_coproc
*coproc
;
957 chip_id
= of_get_ibm_chip_id(dn
);
959 pr_err("ibm,chip-id missing\n");
963 if (of_property_read_u32(dn
, "ibm,842-coprocessor-type", &ct
)) {
964 pr_err("ibm,842-coprocessor-type missing\n");
968 if (of_property_read_u32(dn
, "ibm,842-coprocessor-instance", &ci
)) {
969 pr_err("ibm,842-coprocessor-instance missing\n");
973 coproc
= kzalloc(sizeof(*coproc
), GFP_KERNEL
);
979 nx_add_coprocs_list(coproc
, chip_id
);
981 pr_info("coprocessor found on chip %d, CT %d CI %d\n", chip_id
, ct
, ci
);
985 else if (nx842_ct
!= ct
)
986 pr_err("NX842 chip %d, CT %d != first found CT %d\n",
987 chip_id
, ct
, nx842_ct
);
992 static void nx_delete_coprocs(void)
994 struct nx_coproc
*coproc
, *n
;
995 struct vas_window
*txwin
;
999 * close percpu txwins that are opened for the corresponding coproc.
1001 for_each_possible_cpu(i
) {
1002 txwin
= per_cpu(cpu_txwin
, i
);
1004 vas_win_close(txwin
);
1006 per_cpu(cpu_txwin
, i
) = NULL
;
1009 list_for_each_entry_safe(coproc
, n
, &nx_coprocs
, list
) {
1010 if (coproc
->vas
.rxwin
)
1011 vas_win_close(coproc
->vas
.rxwin
);
1013 list_del(&coproc
->list
);
1018 static struct nx842_constraints nx842_powernv_constraints
= {
1019 .alignment
= DDE_BUFFER_ALIGN
,
1020 .multiple
= DDE_BUFFER_LAST_MULT
,
1021 .minimum
= DDE_BUFFER_LAST_MULT
,
1022 .maximum
= (DDL_LEN_MAX
- 1) * PAGE_SIZE
,
1025 static struct nx842_driver nx842_powernv_driver
= {
1026 .name
= KBUILD_MODNAME
,
1027 .owner
= THIS_MODULE
,
1028 .workmem_size
= sizeof(struct nx842_workmem
),
1029 .constraints
= &nx842_powernv_constraints
,
1030 .compress
= nx842_powernv_compress
,
1031 .decompress
= nx842_powernv_decompress
,
1034 static int nx842_powernv_crypto_init(struct crypto_tfm
*tfm
)
1036 return nx842_crypto_init(tfm
, &nx842_powernv_driver
);
1039 static struct crypto_alg nx842_powernv_alg
= {
1041 .cra_driver_name
= "842-nx",
1042 .cra_priority
= 300,
1043 .cra_flags
= CRYPTO_ALG_TYPE_COMPRESS
,
1044 .cra_ctxsize
= sizeof(struct nx842_crypto_ctx
),
1045 .cra_module
= THIS_MODULE
,
1046 .cra_init
= nx842_powernv_crypto_init
,
1047 .cra_exit
= nx842_crypto_exit
,
1048 .cra_u
= { .compress
= {
1049 .coa_compress
= nx842_crypto_compress
,
1050 .coa_decompress
= nx842_crypto_decompress
} }
1053 static __init
int nx_compress_powernv_init(void)
1055 struct device_node
*dn
;
1058 /* verify workmem size/align restrictions */
1059 BUILD_BUG_ON(WORKMEM_ALIGN
% CRB_ALIGN
);
1060 BUILD_BUG_ON(CRB_ALIGN
% DDE_ALIGN
);
1061 BUILD_BUG_ON(CRB_SIZE
% DDE_ALIGN
);
1062 /* verify buffer size/align restrictions */
1063 BUILD_BUG_ON(PAGE_SIZE
% DDE_BUFFER_ALIGN
);
1064 BUILD_BUG_ON(DDE_BUFFER_ALIGN
% DDE_BUFFER_SIZE_MULT
);
1065 BUILD_BUG_ON(DDE_BUFFER_SIZE_MULT
% DDE_BUFFER_LAST_MULT
);
1067 for_each_compatible_node(dn
, NULL
, "ibm,power9-nx") {
1068 ret
= nx_powernv_probe_vas(dn
);
1070 nx_delete_coprocs();
1076 if (list_empty(&nx_coprocs
)) {
1077 for_each_compatible_node(dn
, NULL
, "ibm,power-nx")
1078 nx842_powernv_probe(dn
);
1083 nx842_powernv_exec
= nx842_exec_icswx
;
1086 * Register VAS user space API for NX GZIP so
1087 * that user space can use GZIP engine.
1088 * Using high FIFO priority for kernel requests and
1089 * normal FIFO priority is assigned for userspace.
1090 * 842 compression is supported only in kernel.
1092 ret
= vas_register_api_powernv(THIS_MODULE
, VAS_COP_TYPE_GZIP
,
1096 * GZIP is not supported in kernel right now.
1097 * So open tx windows only for 842.
1100 ret
= nx_open_percpu_txwins();
1103 nx_delete_coprocs();
1107 nx842_powernv_exec
= nx842_exec_vas
;
1110 ret
= crypto_register_alg(&nx842_powernv_alg
);
1112 nx_delete_coprocs();
1118 module_init(nx_compress_powernv_init
);
1120 static void __exit
nx_compress_powernv_exit(void)
1123 * GZIP engine is supported only in power9 or later and nx842_ct
1124 * is used on power8 (icswx).
1125 * VAS API for NX GZIP is registered during init for user space
1126 * use. So unregister this API for the GZIP engine.
1129 vas_unregister_api_powernv();
1131 crypto_unregister_alg(&nx842_powernv_alg
);
1133 nx_delete_coprocs();
1135 module_exit(nx_compress_powernv_exit
);