1 #ifndef __GENWQE_CARD_H__
2 #define __GENWQE_CARD_H__
5 * IBM Accelerator Family 'GenWQE'
7 * (C) Copyright IBM Corp. 2013
9 * Author: Frank Haverkamp <haver@linux.vnet.ibm.com>
10 * Author: Joerg-Stephan Vogt <jsvogt@de.ibm.com>
11 * Author: Michael Jung <mijung@gmx.net>
12 * Author: Michael Ruettger <michael@ibmra.de>
14 * This program is free software; you can redistribute it and/or modify
15 * it under the terms of the GNU General Public License (version 2 only)
16 * as published by the Free Software Foundation.
18 * This program is distributed in the hope that it will be useful,
19 * but WITHOUT ANY WARRANTY; without even the implied warranty of
20 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
21 * GNU General Public License for more details.
25 * User-space API for the GenWQE card. For debugging and test purposes
26 * the register addresses are included here too.
29 #include <linux/types.h>
30 #include <linux/ioctl.h>
32 /* Basename of sysfs, debugfs and /dev interfaces */
33 #define GENWQE_DEVNAME "genwqe"
35 #define GENWQE_TYPE_ALTERA_230 0x00 /* GenWQE4 Stratix-IV-230 */
36 #define GENWQE_TYPE_ALTERA_530 0x01 /* GenWQE4 Stratix-IV-530 */
37 #define GENWQE_TYPE_ALTERA_A4 0x02 /* GenWQE5 A4 Stratix-V-A4 */
38 #define GENWQE_TYPE_ALTERA_A7 0x03 /* GenWQE5 A7 Stratix-V-A7 */
40 /* MMIO Unit offsets: Each UnitID occupies a defined address range */
41 #define GENWQE_UID_OFFS(uid) ((uid) << 24)
42 #define GENWQE_SLU_OFFS GENWQE_UID_OFFS(0)
43 #define GENWQE_HSU_OFFS GENWQE_UID_OFFS(1)
44 #define GENWQE_APP_OFFS GENWQE_UID_OFFS(2)
45 #define GENWQE_MAX_UNITS 3
47 /* Common offsets per UnitID */
48 #define IO_EXTENDED_ERROR_POINTER 0x00000048
49 #define IO_ERROR_INJECT_SELECTOR 0x00000060
50 #define IO_EXTENDED_DIAG_SELECTOR 0x00000070
51 #define IO_EXTENDED_DIAG_READ_MBX 0x00000078
52 #define IO_EXTENDED_DIAG_MAP(ring) (0x00000500 | ((ring) << 3))
54 #define GENWQE_EXTENDED_DIAG_SELECTOR(ring, trace) (((ring) << 8) | (trace))
56 /* UnitID 0: Service Layer Unit (SLU) */
58 /* SLU: Unit Configuration Register */
59 #define IO_SLU_UNITCFG 0x00000000
60 #define IO_SLU_UNITCFG_TYPE_MASK 0x000000000ff00000 /* 27:20 */
62 /* SLU: Fault Isolation Register (FIR) (ac_slu_fir) */
63 #define IO_SLU_FIR 0x00000008 /* read only, wr direct */
64 #define IO_SLU_FIR_CLR 0x00000010 /* read and clear */
66 /* SLU: First Error Capture Register (FEC/WOF) */
67 #define IO_SLU_FEC 0x00000018
69 #define IO_SLU_ERR_ACT_MASK 0x00000020
70 #define IO_SLU_ERR_ATTN_MASK 0x00000028
71 #define IO_SLU_FIRX1_ACT_MASK 0x00000030
72 #define IO_SLU_FIRX0_ACT_MASK 0x00000038
73 #define IO_SLU_SEC_LEM_DEBUG_OVR 0x00000040
74 #define IO_SLU_EXTENDED_ERR_PTR 0x00000048
75 #define IO_SLU_COMMON_CONFIG 0x00000060
77 #define IO_SLU_FLASH_FIR 0x00000108
78 #define IO_SLU_SLC_FIR 0x00000110
79 #define IO_SLU_RIU_TRAP 0x00000280
80 #define IO_SLU_FLASH_FEC 0x00000308
81 #define IO_SLU_SLC_FEC 0x00000310
84 * The Virtual Function's Access is from offset 0x00010000
85 * The Physical Function's Access is from offset 0x00050000
86 * Single Shared Registers exists only at offset 0x00060000
88 * SLC: Queue Virtual Window Window for accessing into a specific VF
89 * queue. When accessing the 0x10000 space using the 0x50000 address
90 * segment, the value indicated here is used to specify which VF
91 * register is decoded. This register, and the 0x50000 register space
92 * can only be accessed by the PF. Example, if this register is set to
93 * 0x2, then a read from 0x50000 is the same as a read from 0x10000
97 /* SLC: Queue Segment */
98 #define IO_SLC_QUEUE_SEGMENT 0x00010000
99 #define IO_SLC_VF_QUEUE_SEGMENT 0x00050000
101 /* SLC: Queue Offset */
102 #define IO_SLC_QUEUE_OFFSET 0x00010008
103 #define IO_SLC_VF_QUEUE_OFFSET 0x00050008
105 /* SLC: Queue Configuration */
106 #define IO_SLC_QUEUE_CONFIG 0x00010010
107 #define IO_SLC_VF_QUEUE_CONFIG 0x00050010
109 /* SLC: Job Timout/Only accessible for the PF */
110 #define IO_SLC_APPJOB_TIMEOUT 0x00010018
111 #define IO_SLC_VF_APPJOB_TIMEOUT 0x00050018
112 #define TIMEOUT_250MS 0x0000000f
113 #define HEARTBEAT_DISABLE 0x0000ff00
115 /* SLC: Queue InitSequence Register */
116 #define IO_SLC_QUEUE_INITSQN 0x00010020
117 #define IO_SLC_VF_QUEUE_INITSQN 0x00050020
119 /* SLC: Queue Wrap */
120 #define IO_SLC_QUEUE_WRAP 0x00010028
121 #define IO_SLC_VF_QUEUE_WRAP 0x00050028
123 /* SLC: Queue Status */
124 #define IO_SLC_QUEUE_STATUS 0x00010100
125 #define IO_SLC_VF_QUEUE_STATUS 0x00050100
127 /* SLC: Queue Working Time */
128 #define IO_SLC_QUEUE_WTIME 0x00010030
129 #define IO_SLC_VF_QUEUE_WTIME 0x00050030
131 /* SLC: Queue Error Counts */
132 #define IO_SLC_QUEUE_ERRCNTS 0x00010038
133 #define IO_SLC_VF_QUEUE_ERRCNTS 0x00050038
135 /* SLC: Queue Loast Response Word */
136 #define IO_SLC_QUEUE_LRW 0x00010040
137 #define IO_SLC_VF_QUEUE_LRW 0x00050040
139 /* SLC: Freerunning Timer */
140 #define IO_SLC_FREE_RUNNING_TIMER 0x00010108
141 #define IO_SLC_VF_FREE_RUNNING_TIMER 0x00050108
143 /* SLC: Queue Virtual Access Region */
144 #define IO_PF_SLC_VIRTUAL_REGION 0x00050000
146 /* SLC: Queue Virtual Window */
147 #define IO_PF_SLC_VIRTUAL_WINDOW 0x00060000
149 /* SLC: DDCB Application Job Pending [n] (n=0:63) */
150 #define IO_PF_SLC_JOBPEND(n) (0x00061000 + 8*(n))
151 #define IO_SLC_JOBPEND(n) IO_PF_SLC_JOBPEND(n)
153 /* SLC: Parser Trap RAM [n] (n=0:31) */
154 #define IO_SLU_SLC_PARSE_TRAP(n) (0x00011000 + 8*(n))
156 /* SLC: Dispatcher Trap RAM [n] (n=0:31) */
157 #define IO_SLU_SLC_DISP_TRAP(n) (0x00011200 + 8*(n))
159 /* Global Fault Isolation Register (GFIR) */
160 #define IO_SLC_CFGREG_GFIR 0x00020000
161 #define GFIR_ERR_TRIGGER 0x0000ffff
163 /* SLU: Soft Reset Register */
164 #define IO_SLC_CFGREG_SOFTRESET 0x00020018
166 /* SLU: Misc Debug Register */
167 #define IO_SLC_MISC_DEBUG 0x00020060
168 #define IO_SLC_MISC_DEBUG_CLR 0x00020068
169 #define IO_SLC_MISC_DEBUG_SET 0x00020070
171 /* Temperature Sensor Reading */
172 #define IO_SLU_TEMPERATURE_SENSOR 0x00030000
173 #define IO_SLU_TEMPERATURE_CONFIG 0x00030008
175 /* Voltage Margining Control */
176 #define IO_SLU_VOLTAGE_CONTROL 0x00030080
177 #define IO_SLU_VOLTAGE_NOMINAL 0x00000000
178 #define IO_SLU_VOLTAGE_DOWN5 0x00000006
179 #define IO_SLU_VOLTAGE_UP5 0x00000007
181 /* Direct LED Control Register */
182 #define IO_SLU_LEDCONTROL 0x00030100
184 /* SLU: Flashbus Direct Access -A5 */
185 #define IO_SLU_FLASH_DIRECTACCESS 0x00040010
187 /* SLU: Flashbus Direct Access2 -A5 */
188 #define IO_SLU_FLASH_DIRECTACCESS2 0x00040020
190 /* SLU: Flashbus Command Interface -A5 */
191 #define IO_SLU_FLASH_CMDINTF 0x00040030
193 /* SLU: BitStream Loaded */
194 #define IO_SLU_BITSTREAM 0x00040040
196 /* This Register has a switch which will change the CAs to UR */
197 #define IO_HSU_ERR_BEHAVIOR 0x01001010
199 #define IO_SLC2_SQB_TRAP 0x00062000
200 #define IO_SLC2_QUEUE_MANAGER_TRAP 0x00062008
201 #define IO_SLC2_FLS_MASTER_TRAP 0x00062010
203 /* UnitID 1: HSU Registers */
204 #define IO_HSU_UNITCFG 0x01000000
205 #define IO_HSU_FIR 0x01000008
206 #define IO_HSU_FIR_CLR 0x01000010
207 #define IO_HSU_FEC 0x01000018
208 #define IO_HSU_ERR_ACT_MASK 0x01000020
209 #define IO_HSU_ERR_ATTN_MASK 0x01000028
210 #define IO_HSU_FIRX1_ACT_MASK 0x01000030
211 #define IO_HSU_FIRX0_ACT_MASK 0x01000038
212 #define IO_HSU_SEC_LEM_DEBUG_OVR 0x01000040
213 #define IO_HSU_EXTENDED_ERR_PTR 0x01000048
214 #define IO_HSU_COMMON_CONFIG 0x01000060
216 /* UnitID 2: Application Unit (APP) */
217 #define IO_APP_UNITCFG 0x02000000
218 #define IO_APP_FIR 0x02000008
219 #define IO_APP_FIR_CLR 0x02000010
220 #define IO_APP_FEC 0x02000018
221 #define IO_APP_ERR_ACT_MASK 0x02000020
222 #define IO_APP_ERR_ATTN_MASK 0x02000028
223 #define IO_APP_FIRX1_ACT_MASK 0x02000030
224 #define IO_APP_FIRX0_ACT_MASK 0x02000038
225 #define IO_APP_SEC_LEM_DEBUG_OVR 0x02000040
226 #define IO_APP_EXTENDED_ERR_PTR 0x02000048
227 #define IO_APP_COMMON_CONFIG 0x02000060
229 #define IO_APP_DEBUG_REG_01 0x02010000
230 #define IO_APP_DEBUG_REG_02 0x02010008
231 #define IO_APP_DEBUG_REG_03 0x02010010
232 #define IO_APP_DEBUG_REG_04 0x02010018
233 #define IO_APP_DEBUG_REG_05 0x02010020
234 #define IO_APP_DEBUG_REG_06 0x02010028
235 #define IO_APP_DEBUG_REG_07 0x02010030
236 #define IO_APP_DEBUG_REG_08 0x02010038
237 #define IO_APP_DEBUG_REG_09 0x02010040
238 #define IO_APP_DEBUG_REG_10 0x02010048
239 #define IO_APP_DEBUG_REG_11 0x02010050
240 #define IO_APP_DEBUG_REG_12 0x02010058
241 #define IO_APP_DEBUG_REG_13 0x02010060
242 #define IO_APP_DEBUG_REG_14 0x02010068
243 #define IO_APP_DEBUG_REG_15 0x02010070
244 #define IO_APP_DEBUG_REG_16 0x02010078
245 #define IO_APP_DEBUG_REG_17 0x02010080
246 #define IO_APP_DEBUG_REG_18 0x02010088
248 /* Read/write from/to registers */
249 struct genwqe_reg_io
{
250 __u64 num
; /* register offset/address */
255 * All registers of our card will return values not equal this values.
256 * If we see IO_ILLEGAL_VALUE on any of our MMIO register reads, the
257 * card can be considered as unusable. It will need recovery.
259 #define IO_ILLEGAL_VALUE 0xffffffffffffffffull
262 * Generic DDCB execution interface.
264 * This interface is a first prototype resulting from discussions we
265 * had with other teams which wanted to use the Genwqe card. It allows
266 * to issue a DDCB request in a generic way. The request will block
267 * until it finishes or time out with error.
269 * Some DDCBs require DMA addresses to be specified in the ASIV
270 * block. The interface provies the capability to let the kernel
271 * driver know where those addresses are by specifying the ATS field,
272 * such that it can replace the user-space addresses with appropriate
273 * DMA addresses or DMA addresses of a scatter gather list which is
274 * dynamically created.
276 * Our hardware will refuse DDCB execution if the ATS field is not as
277 * expected. That means the DDCB execution engine in the chip knows
278 * where it expects DMA addresses within the ASIV part of the DDCB and
279 * will check that against the ATS field definition. Any invalid or
280 * unknown ATS content will lead to DDCB refusal.
283 /* Genwqe chip Units */
284 #define DDCB_ACFUNC_SLU 0x00 /* chip service layer unit */
285 #define DDCB_ACFUNC_APP 0x01 /* chip application */
287 /* DDCB return codes (RETC) */
288 #define DDCB_RETC_IDLE 0x0000 /* Unexecuted/DDCB created */
289 #define DDCB_RETC_PENDING 0x0101 /* Pending Execution */
290 #define DDCB_RETC_COMPLETE 0x0102 /* Cmd complete. No error */
291 #define DDCB_RETC_FAULT 0x0104 /* App Err, recoverable */
292 #define DDCB_RETC_ERROR 0x0108 /* App Err, non-recoverable */
293 #define DDCB_RETC_FORCED_ERROR 0x01ff /* overwritten by driver */
295 #define DDCB_RETC_UNEXEC 0x0110 /* Unexe/Removed from queue */
296 #define DDCB_RETC_TERM 0x0120 /* Terminated */
297 #define DDCB_RETC_RES0 0x0140 /* Reserved */
298 #define DDCB_RETC_RES1 0x0180 /* Reserved */
300 /* DDCB Command Options (CMDOPT) */
301 #define DDCB_OPT_ECHO_FORCE_NO 0x0000 /* ECHO DDCB */
302 #define DDCB_OPT_ECHO_FORCE_102 0x0001 /* force return code */
303 #define DDCB_OPT_ECHO_FORCE_104 0x0002
304 #define DDCB_OPT_ECHO_FORCE_108 0x0003
306 #define DDCB_OPT_ECHO_FORCE_110 0x0004 /* only on PF ! */
307 #define DDCB_OPT_ECHO_FORCE_120 0x0005
308 #define DDCB_OPT_ECHO_FORCE_140 0x0006
309 #define DDCB_OPT_ECHO_FORCE_180 0x0007
311 #define DDCB_OPT_ECHO_COPY_NONE (0 << 5)
312 #define DDCB_OPT_ECHO_COPY_ALL (1 << 5)
314 /* Definitions of Service Layer Commands */
315 #define SLCMD_ECHO_SYNC 0x00 /* PF/VF */
316 #define SLCMD_MOVE_FLASH 0x06 /* PF only */
317 #define SLCMD_MOVE_FLASH_FLAGS_MODE 0x03 /* bit 0 and 1 used for mode */
318 #define SLCMD_MOVE_FLASH_FLAGS_DLOAD 0 /* mode: download */
319 #define SLCMD_MOVE_FLASH_FLAGS_EMUL 1 /* mode: emulation */
320 #define SLCMD_MOVE_FLASH_FLAGS_UPLOAD 2 /* mode: upload */
321 #define SLCMD_MOVE_FLASH_FLAGS_VERIFY 3 /* mode: verify */
322 #define SLCMD_MOVE_FLASH_FLAG_NOTAP (1 << 2)/* just dump DDCB and exit */
323 #define SLCMD_MOVE_FLASH_FLAG_POLL (1 << 3)/* wait for RETC >= 0102 */
324 #define SLCMD_MOVE_FLASH_FLAG_PARTITION (1 << 4)
325 #define SLCMD_MOVE_FLASH_FLAG_ERASE (1 << 5)
327 enum genwqe_card_state
{
328 GENWQE_CARD_UNUSED
= 0,
329 GENWQE_CARD_USED
= 1,
330 GENWQE_CARD_FATAL_ERROR
= 2,
331 GENWQE_CARD_RELOAD_BITSTREAM
= 3,
332 GENWQE_CARD_STATE_MAX
,
335 /* common struct for chip image exchange */
336 struct genwqe_bitstream
{
337 __u64 data_addr
; /* pointer to image data */
338 __u32 size
; /* size of image file */
339 __u32 crc
; /* crc of this image */
340 __u64 target_addr
; /* starting address in Flash */
341 __u32 partition
; /* '0', '1', or 'v' */
342 __u32 uid
; /* 1=host/x=dram */
344 __u64 slu_id
; /* informational/sim: SluID */
345 __u64 app_id
; /* informational/sim: AppID */
347 __u16 retc
; /* returned from processing */
348 __u16 attn
; /* attention code from processing */
349 __u32 progress
; /* progress code from processing */
352 /* Issuing a specific DDCB command */
353 #define DDCB_LENGTH 256 /* for debug data */
354 #define DDCB_ASIV_LENGTH 104 /* len of the DDCB ASIV array */
355 #define DDCB_ASIV_LENGTH_ATS 96 /* ASIV in ATS architecture */
356 #define DDCB_ASV_LENGTH 64 /* len of the DDCB ASV array */
357 #define DDCB_FIXUPS 12 /* maximum number of fixups */
359 struct genwqe_debug_data
{
360 char driver_version
[64];
364 __u8 ddcb_before
[DDCB_LENGTH
];
365 __u8 ddcb_prev
[DDCB_LENGTH
];
366 __u8 ddcb_finished
[DDCB_LENGTH
];
370 * Address Translation Specification (ATS) definitions
372 * Each 4 bit within the ATS 64-bit word specify the required address
373 * translation at the defined offset.
376 * 6666.5555.5555.5544.4444.4443.3333.3333 ... 11
377 * 3210.9876.5432.1098.7654.3210.9876.5432 ... 1098.7654.3210
379 * offset: 0x00 0x08 0x10 0x18 0x20 0x28 0x30 0x38 ... 0x68 0x70 0x78
380 * res res res res ASIV ...
381 * The first 4 entries in the ATS word are reserved. The following nibbles
382 * each describe at an 8 byte offset the format of the required data.
384 #define ATS_TYPE_DATA 0x0ull /* data */
385 #define ATS_TYPE_FLAT_RD 0x4ull /* flat buffer read only */
386 #define ATS_TYPE_FLAT_RDWR 0x5ull /* flat buffer read/write */
387 #define ATS_TYPE_SGL_RD 0x6ull /* sgl read only */
388 #define ATS_TYPE_SGL_RDWR 0x7ull /* sgl read/write */
390 #define ATS_SET_FLAGS(_struct, _field, _flags) \
391 (((_flags) & 0xf) << (44 - (4 * (offsetof(_struct, _field) / 8))))
393 #define ATS_GET_FLAGS(_ats, _byte_offs) \
394 (((_ats) >> (44 - (4 * ((_byte_offs) / 8)))) & 0xf)
397 * struct genwqe_ddcb_cmd - User parameter for generic DDCB commands
399 * On the way into the kernel the driver will read the whole data
400 * structure. On the way out the driver will not copy the ASIV data
401 * back to user-space.
403 struct genwqe_ddcb_cmd
{
404 /* START of data copied to/from driver */
405 __u64 next_addr
; /* chaining genwqe_ddcb_cmd */
406 __u64 flags
; /* reserved */
408 __u8 acfunc
; /* accelerators functional unit */
409 __u8 cmd
; /* command to execute */
410 __u8 asiv_length
; /* used parameter length */
411 __u8 asv_length
; /* length of valid return values */
412 __u16 cmdopts
; /* command options */
413 __u16 retc
; /* return code from processing */
415 __u16 attn
; /* attention code from processing */
416 __u16 vcrc
; /* variant crc16 */
417 __u32 progress
; /* progress code from processing */
419 __u64 deque_ts
; /* dequeue time stamp */
420 __u64 cmplt_ts
; /* completion time stamp */
421 __u64 disp_ts
; /* SW processing start */
423 /* move to end and avoid copy-back */
424 __u64 ddata_addr
; /* collect debug data */
426 /* command specific values */
427 __u8 asv
[DDCB_ASV_LENGTH
];
429 /* END of data copied from driver */
433 __u8 asiv
[DDCB_ASIV_LENGTH_ATS
];
435 /* used for flash update to keep it backward compatible */
436 __u8 __asiv
[DDCB_ASIV_LENGTH
];
438 /* END of data copied to driver */
441 #define GENWQE_IOC_CODE 0xa5
443 /* Access functions */
444 #define GENWQE_READ_REG64 _IOR(GENWQE_IOC_CODE, 30, struct genwqe_reg_io)
445 #define GENWQE_WRITE_REG64 _IOW(GENWQE_IOC_CODE, 31, struct genwqe_reg_io)
446 #define GENWQE_READ_REG32 _IOR(GENWQE_IOC_CODE, 32, struct genwqe_reg_io)
447 #define GENWQE_WRITE_REG32 _IOW(GENWQE_IOC_CODE, 33, struct genwqe_reg_io)
448 #define GENWQE_READ_REG16 _IOR(GENWQE_IOC_CODE, 34, struct genwqe_reg_io)
449 #define GENWQE_WRITE_REG16 _IOW(GENWQE_IOC_CODE, 35, struct genwqe_reg_io)
451 #define GENWQE_GET_CARD_STATE _IOR(GENWQE_IOC_CODE, 36, enum genwqe_card_state)
454 * struct genwqe_mem - Memory pinning/unpinning information
455 * @addr: virtual user space address
456 * @size: size of the area pin/dma-map/unmap
457 * direction: 0: read/1: read and write
459 * Avoid pinning and unpinning of memory pages dynamically. Instead
460 * the idea is to pin the whole buffer space required for DDCB
461 * opertionas in advance. The driver will reuse this pinning and the
462 * memory associated with it to setup the sglists for the DDCB
463 * requests without the need to allocate and free memory or map and
464 * unmap to get the DMA addresses.
466 * The inverse operation needs to be called after the pinning is not
467 * needed anymore. The pinnings else the pinnings will get removed
468 * after the device is closed. Note that pinnings will required
478 #define GENWQE_PIN_MEM _IOWR(GENWQE_IOC_CODE, 40, struct genwqe_mem)
479 #define GENWQE_UNPIN_MEM _IOWR(GENWQE_IOC_CODE, 41, struct genwqe_mem)
482 * Generic synchronous DDCB execution interface.
483 * Synchronously execute a DDCB.
485 * Return: 0 on success or negative error code.
486 * -EINVAL: Invalid parameters (ASIV_LEN, ASV_LEN, illegal fixups
487 * no mappings found/could not create mappings
488 * -EFAULT: illegal addresses in fixups, purging failed
489 * -EBADMSG: enqueing failed, retc != DDCB_RETC_COMPLETE
491 #define GENWQE_EXECUTE_DDCB \
492 _IOWR(GENWQE_IOC_CODE, 50, struct genwqe_ddcb_cmd)
494 #define GENWQE_EXECUTE_RAW_DDCB \
495 _IOWR(GENWQE_IOC_CODE, 51, struct genwqe_ddcb_cmd)
497 /* Service Layer functions (PF only) */
498 #define GENWQE_SLU_UPDATE _IOWR(GENWQE_IOC_CODE, 80, struct genwqe_bitstream)
499 #define GENWQE_SLU_READ _IOWR(GENWQE_IOC_CODE, 81, struct genwqe_bitstream)
501 #endif /* __GENWQE_CARD_H__ */