1 /***********************license start***************
2 * Author: Cavium Networks
4 * Contact: support@caviumnetworks.com
5 * This file is part of the OCTEON SDK
7 * Copyright (c) 2003-2008 Cavium Networks
9 * This file is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License, Version 2, as
11 * published by the Free Software Foundation.
13 * This file is distributed in the hope that it will be useful, but
14 * AS-IS and WITHOUT ANY WARRANTY; without even the implied warranty
15 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, TITLE, or
16 * NONINFRINGEMENT. See the GNU General Public License for more
19 * You should have received a copy of the GNU General Public License
20 * along with this file; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
22 * or visit http://www.gnu.org/licenses/.
24 * This file may also be available under a different license from Cavium.
25 * Contact Cavium Networks for more information
26 ***********************license end**************************************/
30 * Interface to the hardware Packet Output unit.
32 * Starting with SDK 1.7.0, the PKO output functions now support
33 * two types of locking. CVMX_PKO_LOCK_ATOMIC_TAG continues to
34 * function similarly to previous SDKs by using POW atomic tags
35 * to preserve ordering and exclusivity. As a new option, you
36 * can now pass CVMX_PKO_LOCK_CMD_QUEUE which uses a ll/sc
37 * memory based locking instead. This locking has the advantage
38 * of not affecting the tag state but doesn't preserve packet
39 * ordering. CVMX_PKO_LOCK_CMD_QUEUE is appropriate in most
40 * generic code while CVMX_PKO_LOCK_CMD_QUEUE should be used
41 * with hand tuned fast path code.
43 * Some of other SDK differences visible to the command command
45 * - PKO indexes are no longer stored in the FAU. A large
46 * percentage of the FAU register block used to be tied up
47 * maintaining PKO queue pointers. These are now stored in a
49 * - The PKO <b>use_locking</b> parameter can now have a global
50 * effect. Since all application use the same named block,
51 * queue locking correctly applies across all operating
52 * systems when using CVMX_PKO_LOCK_CMD_QUEUE.
53 * - PKO 3 word commands are now supported. Use
54 * cvmx_pko_send_packet_finish3().
58 #ifndef __CVMX_PKO_H__
59 #define __CVMX_PKO_H__
61 #include <asm/octeon/cvmx-fpa.h>
62 #include <asm/octeon/cvmx-pow.h>
63 #include <asm/octeon/cvmx-cmd-queue.h>
64 #include <asm/octeon/cvmx-pko-defs.h>
66 /* Adjust the command buffer size by 1 word so that in the case of using only
67 * two word PKO commands no command words stradle buffers. The useful values
68 * for this are 0 and 1. */
69 #define CVMX_PKO_COMMAND_BUFFER_SIZE_ADJUST (1)
71 #define CVMX_PKO_MAX_OUTPUT_QUEUES_STATIC 256
72 #define CVMX_PKO_MAX_OUTPUT_QUEUES ((OCTEON_IS_MODEL(OCTEON_CN31XX) || \
73 OCTEON_IS_MODEL(OCTEON_CN3010) || OCTEON_IS_MODEL(OCTEON_CN3005) || \
74 OCTEON_IS_MODEL(OCTEON_CN50XX)) ? 32 : \
75 (OCTEON_IS_MODEL(OCTEON_CN58XX) || \
76 OCTEON_IS_MODEL(OCTEON_CN56XX)) ? 256 : 128)
77 #define CVMX_PKO_NUM_OUTPUT_PORTS 40
78 /* use this for queues that are not used */
79 #define CVMX_PKO_MEM_QUEUE_PTRS_ILLEGAL_PID 63
80 #define CVMX_PKO_QUEUE_STATIC_PRIORITY 9
81 #define CVMX_PKO_ILLEGAL_QUEUE 0xFFFF
82 #define CVMX_PKO_MAX_QUEUE_DEPTH 0
86 CVMX_PKO_INVALID_PORT
,
87 CVMX_PKO_INVALID_QUEUE
,
88 CVMX_PKO_INVALID_PRIORITY
,
90 CVMX_PKO_PORT_ALREADY_SETUP
,
91 CVMX_PKO_CMD_QUEUE_INIT_ERROR
95 * This enumeration represents the differnet locking modes supported by PKO.
99 * PKO doesn't do any locking. It is the responsibility of the
100 * application to make sure that no other core is accessing
101 * the same queue at the same time
103 CVMX_PKO_LOCK_NONE
= 0,
105 * PKO performs an atomic tagswitch to insure exclusive access
106 * to the output queue. This will maintain packet ordering on
109 CVMX_PKO_LOCK_ATOMIC_TAG
= 1,
111 * PKO uses the common command queue locks to insure exclusive
112 * access to the output queue. This is a memory based
113 * ll/sc. This is the most portable locking mechanism.
115 CVMX_PKO_LOCK_CMD_QUEUE
= 2,
122 } cvmx_pko_port_status_t
;
125 * This structure defines the address to use on a packet enqueue
130 /* Must CVMX_IO_SEG */
131 uint64_t mem_space
:2;
133 uint64_t reserved
:13;
136 /* The ID of the device on the non-coherent bus */
139 uint64_t reserved2
:4;
141 uint64_t reserved3
:18;
143 * The hardware likes to have the output port in
144 * addition to the output queue,
148 * The output queue to send the packet to (0-127 are
153 uint64_t reserved4
:3;
155 } cvmx_pko_doorbell_address_t
;
158 * Structure of the first packet output command word.
164 * The size of the reg1 operation - could be 8, 16,
169 * The size of the reg0 operation - could be 8, 16,
174 * If set, subtract 1, if clear, subtract packet
179 * The register, subtract will be done if reg1 is
183 /* If set, subtract 1, if clear, subtract packet size */
185 /* The register, subtract will be done if reg0 is non-zero */
188 * When set, interpret segment pointer and segment
189 * bytes in little endian order.
193 * When set, packet data not allocated in L2 cache by
198 * If set and rsp is set, word3 contains a pointer to
199 * a work queue entry.
202 /* If set, the hardware will send a response when done */
205 * If set, the supplied pkt_ptr is really a pointer to
206 * a list of pkt_ptr's.
210 * If ipoffp1 is non zero, (ipoffp1-1) is the number
211 * of bytes to IP header, and the hardware will
212 * calculate and insert the UDP/TCP checksum.
216 * If set, ignore the I bit (force to zero) from all
217 * pointer structures.
221 * If clear, the hardware will attempt to free the
222 * buffers containing the packet.
226 * The total number of segs in the packet, if gather
227 * set, also gather list length.
230 /* Including L2, but no trailing CRC */
231 uint64_t total_bytes
:16;
233 } cvmx_pko_command_word0_t
;
235 /* CSR typedefs have been moved to cvmx-csr-*.h */
238 * Definition of internal state for Packet output processing
241 /* ptr to start of buffer, offset kept in FAU reg */
243 } cvmx_pko_state_elem_t
;
246 * Call before any other calls to initialize the packet
249 extern void cvmx_pko_initialize_global(void);
250 extern int cvmx_pko_initialize_local(void);
253 * Enables the packet output hardware. It must already be
256 extern void cvmx_pko_enable(void);
259 * Disables the packet output. Does not affect any configuration.
261 extern void cvmx_pko_disable(void);
264 * Shutdown and free resources required by packet output.
267 extern void cvmx_pko_shutdown(void);
270 * Configure a output port and the associated queues for use.
272 * @port: Port to configure.
273 * @base_queue: First queue number to associate with this port.
274 * @num_queues: Number of queues t oassociate with this port
275 * @priority: Array of priority levels for each queue. Values are
276 * allowed to be 1-8. A value of 8 get 8 times the traffic
277 * of a value of 1. There must be num_queues elements in the
280 extern cvmx_pko_status_t
cvmx_pko_config_port(uint64_t port
,
283 const uint64_t priority
[]);
286 * Ring the packet output doorbell. This tells the packet
287 * output hardware that "len" command words have been added
288 * to its pending list. This command includes the required
289 * CVMX_SYNCWS before the doorbell ring.
291 * @port: Port the packet is for
292 * @queue: Queue the packet is for
293 * @len: Length of the command in 64 bit words
295 static inline void cvmx_pko_doorbell(uint64_t port
, uint64_t queue
,
298 cvmx_pko_doorbell_address_t ptr
;
301 ptr
.s
.mem_space
= CVMX_IO_SEG
;
302 ptr
.s
.did
= CVMX_OCT_DID_PKT_SEND
;
307 * Need to make sure output queue data is in DRAM before
311 cvmx_write_io(ptr
.u64
, len
);
315 * Prepare to send a packet. This may initiate a tag switch to
316 * get exclusive access to the output queue structure, and
317 * performs other prep work for the packet send operation.
319 * cvmx_pko_send_packet_finish() MUST be called after this function is called,
320 * and must be called with the same port/queue/use_locking arguments.
322 * The use_locking parameter allows the caller to use three
323 * possible locking modes.
324 * - CVMX_PKO_LOCK_NONE
325 * - PKO doesn't do any locking. It is the responsibility
326 * of the application to make sure that no other core
327 * is accessing the same queue at the same time.
328 * - CVMX_PKO_LOCK_ATOMIC_TAG
329 * - PKO performs an atomic tagswitch to insure exclusive
330 * access to the output queue. This will maintain
331 * packet ordering on output.
332 * - CVMX_PKO_LOCK_CMD_QUEUE
333 * - PKO uses the common command queue locks to insure
334 * exclusive access to the output queue. This is a
335 * memory based ll/sc. This is the most portable
338 * NOTE: If atomic locking is used, the POW entry CANNOT be
339 * descheduled, as it does not contain a valid WQE pointer.
341 * @port: Port to send it on
342 * @queue: Queue to use
343 * @use_locking: CVMX_PKO_LOCK_NONE, CVMX_PKO_LOCK_ATOMIC_TAG, or
344 * CVMX_PKO_LOCK_CMD_QUEUE
347 static inline void cvmx_pko_send_packet_prepare(uint64_t port
, uint64_t queue
,
348 cvmx_pko_lock_t use_locking
)
350 if (use_locking
== CVMX_PKO_LOCK_ATOMIC_TAG
) {
352 * Must do a full switch here to handle all cases. We
353 * use a fake WQE pointer, as the POW does not access
354 * this memory. The WQE pointer and group are only
355 * used if this work is descheduled, which is not
357 * cvmx_pko_send_packet_prepare/cvmx_pko_send_packet_finish
358 * combination. Note that this is a special case in
359 * which these fake values can be used - this is not a
363 CVMX_TAG_SW_BITS_INTERNAL
<< CVMX_TAG_SW_SHIFT
|
364 CVMX_TAG_SUBGROUP_PKO
<< CVMX_TAG_SUBGROUP_SHIFT
|
365 (CVMX_TAG_SUBGROUP_MASK
& queue
);
366 cvmx_pow_tag_sw_full((cvmx_wqe_t
*) cvmx_phys_to_ptr(0x80), tag
,
367 CVMX_POW_TAG_TYPE_ATOMIC
, 0);
372 * Complete packet output. cvmx_pko_send_packet_prepare() must be
373 * called exactly once before this, and the same parameters must be
374 * passed to both cvmx_pko_send_packet_prepare() and
375 * cvmx_pko_send_packet_finish().
377 * @port: Port to send it on
378 * @queue: Queue to use
380 * PKO HW command word
381 * @packet: Packet to send
382 * @use_locking: CVMX_PKO_LOCK_NONE, CVMX_PKO_LOCK_ATOMIC_TAG, or
383 * CVMX_PKO_LOCK_CMD_QUEUE
385 * Returns returns CVMX_PKO_SUCCESS on success, or error code on
388 static inline cvmx_pko_status_t
cvmx_pko_send_packet_finish(
391 cvmx_pko_command_word0_t pko_command
,
392 union cvmx_buf_ptr packet
,
393 cvmx_pko_lock_t use_locking
)
395 cvmx_cmd_queue_result_t result
;
396 if (use_locking
== CVMX_PKO_LOCK_ATOMIC_TAG
)
397 cvmx_pow_tag_sw_wait();
398 result
= cvmx_cmd_queue_write2(CVMX_CMD_QUEUE_PKO(queue
),
399 (use_locking
== CVMX_PKO_LOCK_CMD_QUEUE
),
400 pko_command
.u64
, packet
.u64
);
401 if (likely(result
== CVMX_CMD_QUEUE_SUCCESS
)) {
402 cvmx_pko_doorbell(port
, queue
, 2);
403 return CVMX_PKO_SUCCESS
;
404 } else if ((result
== CVMX_CMD_QUEUE_NO_MEMORY
)
405 || (result
== CVMX_CMD_QUEUE_FULL
)) {
406 return CVMX_PKO_NO_MEMORY
;
408 return CVMX_PKO_INVALID_QUEUE
;
413 * Complete packet output. cvmx_pko_send_packet_prepare() must be
414 * called exactly once before this, and the same parameters must be
415 * passed to both cvmx_pko_send_packet_prepare() and
416 * cvmx_pko_send_packet_finish().
418 * @port: Port to send it on
419 * @queue: Queue to use
421 * PKO HW command word
422 * @packet: Packet to send
423 * @addr: Plysical address of a work queue entry or physical address
424 * to zero on complete.
425 * @use_locking: CVMX_PKO_LOCK_NONE, CVMX_PKO_LOCK_ATOMIC_TAG, or
426 * CVMX_PKO_LOCK_CMD_QUEUE
428 * Returns returns CVMX_PKO_SUCCESS on success, or error code on
431 static inline cvmx_pko_status_t
cvmx_pko_send_packet_finish3(
434 cvmx_pko_command_word0_t pko_command
,
435 union cvmx_buf_ptr packet
,
437 cvmx_pko_lock_t use_locking
)
439 cvmx_cmd_queue_result_t result
;
440 if (use_locking
== CVMX_PKO_LOCK_ATOMIC_TAG
)
441 cvmx_pow_tag_sw_wait();
442 result
= cvmx_cmd_queue_write3(CVMX_CMD_QUEUE_PKO(queue
),
443 (use_locking
== CVMX_PKO_LOCK_CMD_QUEUE
),
444 pko_command
.u64
, packet
.u64
, addr
);
445 if (likely(result
== CVMX_CMD_QUEUE_SUCCESS
)) {
446 cvmx_pko_doorbell(port
, queue
, 3);
447 return CVMX_PKO_SUCCESS
;
448 } else if ((result
== CVMX_CMD_QUEUE_NO_MEMORY
)
449 || (result
== CVMX_CMD_QUEUE_FULL
)) {
450 return CVMX_PKO_NO_MEMORY
;
452 return CVMX_PKO_INVALID_QUEUE
;
457 * Return the pko output queue associated with a port and a specific core.
458 * In normal mode (PKO lockless operation is disabled), the value returned
462 * @core: Core to get queue for
464 * Returns Core-specific output queue
466 static inline int cvmx_pko_get_base_queue_per_core(int port
, int core
)
468 #ifndef CVMX_HELPER_PKO_MAX_PORTS_INTERFACE0
469 #define CVMX_HELPER_PKO_MAX_PORTS_INTERFACE0 16
471 #ifndef CVMX_HELPER_PKO_MAX_PORTS_INTERFACE1
472 #define CVMX_HELPER_PKO_MAX_PORTS_INTERFACE1 16
475 if (port
< CVMX_PKO_MAX_PORTS_INTERFACE0
)
476 return port
* CVMX_PKO_QUEUES_PER_PORT_INTERFACE0
+ core
;
477 else if (port
>= 16 && port
< 16 + CVMX_PKO_MAX_PORTS_INTERFACE1
)
478 return CVMX_PKO_MAX_PORTS_INTERFACE0
*
479 CVMX_PKO_QUEUES_PER_PORT_INTERFACE0
+ (port
-
481 CVMX_PKO_QUEUES_PER_PORT_INTERFACE1
+ core
;
482 else if ((port
>= 32) && (port
< 36))
483 return CVMX_PKO_MAX_PORTS_INTERFACE0
*
484 CVMX_PKO_QUEUES_PER_PORT_INTERFACE0
+
485 CVMX_PKO_MAX_PORTS_INTERFACE1
*
486 CVMX_PKO_QUEUES_PER_PORT_INTERFACE1
+ (port
-
488 CVMX_PKO_QUEUES_PER_PORT_PCI
;
489 else if ((port
>= 36) && (port
< 40))
490 return CVMX_PKO_MAX_PORTS_INTERFACE0
*
491 CVMX_PKO_QUEUES_PER_PORT_INTERFACE0
+
492 CVMX_PKO_MAX_PORTS_INTERFACE1
*
493 CVMX_PKO_QUEUES_PER_PORT_INTERFACE1
+
494 4 * CVMX_PKO_QUEUES_PER_PORT_PCI
+ (port
-
496 CVMX_PKO_QUEUES_PER_PORT_LOOP
;
498 /* Given the limit on the number of ports we can map to
499 * CVMX_MAX_OUTPUT_QUEUES_STATIC queues (currently 256,
500 * divided among all cores), the remaining unmapped ports
501 * are assigned an illegal queue number */
502 return CVMX_PKO_ILLEGAL_QUEUE
;
506 * For a given port number, return the base pko output queue
510 * Returns Base output queue
512 static inline int cvmx_pko_get_base_queue(int port
)
514 return cvmx_pko_get_base_queue_per_core(port
, 0);
518 * For a given port number, return the number of pko output queues.
521 * Returns Number of output queues
523 static inline int cvmx_pko_get_num_queues(int port
)
526 return CVMX_PKO_QUEUES_PER_PORT_INTERFACE0
;
528 return CVMX_PKO_QUEUES_PER_PORT_INTERFACE1
;
530 return CVMX_PKO_QUEUES_PER_PORT_PCI
;
532 return CVMX_PKO_QUEUES_PER_PORT_LOOP
;
538 * Get the status counters for a port.
540 * @port_num: Port number to get statistics for.
541 * @clear: Set to 1 to clear the counters after they are read
542 * @status: Where to put the results.
544 static inline void cvmx_pko_get_port_status(uint64_t port_num
, uint64_t clear
,
545 cvmx_pko_port_status_t
*status
)
547 union cvmx_pko_reg_read_idx pko_reg_read_idx
;
548 union cvmx_pko_mem_count0 pko_mem_count0
;
549 union cvmx_pko_mem_count1 pko_mem_count1
;
551 pko_reg_read_idx
.u64
= 0;
552 pko_reg_read_idx
.s
.index
= port_num
;
553 cvmx_write_csr(CVMX_PKO_REG_READ_IDX
, pko_reg_read_idx
.u64
);
555 pko_mem_count0
.u64
= cvmx_read_csr(CVMX_PKO_MEM_COUNT0
);
556 status
->packets
= pko_mem_count0
.s
.count
;
558 pko_mem_count0
.s
.count
= port_num
;
559 cvmx_write_csr(CVMX_PKO_MEM_COUNT0
, pko_mem_count0
.u64
);
562 pko_mem_count1
.u64
= cvmx_read_csr(CVMX_PKO_MEM_COUNT1
);
563 status
->octets
= pko_mem_count1
.s
.count
;
565 pko_mem_count1
.s
.count
= port_num
;
566 cvmx_write_csr(CVMX_PKO_MEM_COUNT1
, pko_mem_count1
.u64
);
569 if (OCTEON_IS_MODEL(OCTEON_CN3XXX
)) {
570 union cvmx_pko_mem_debug9 debug9
;
571 pko_reg_read_idx
.s
.index
= cvmx_pko_get_base_queue(port_num
);
572 cvmx_write_csr(CVMX_PKO_REG_READ_IDX
, pko_reg_read_idx
.u64
);
573 debug9
.u64
= cvmx_read_csr(CVMX_PKO_MEM_DEBUG9
);
574 status
->doorbell
= debug9
.cn38xx
.doorbell
;
576 union cvmx_pko_mem_debug8 debug8
;
577 pko_reg_read_idx
.s
.index
= cvmx_pko_get_base_queue(port_num
);
578 cvmx_write_csr(CVMX_PKO_REG_READ_IDX
, pko_reg_read_idx
.u64
);
579 debug8
.u64
= cvmx_read_csr(CVMX_PKO_MEM_DEBUG8
);
580 status
->doorbell
= debug8
.cn58xx
.doorbell
;
585 * Rate limit a PKO port to a max packets/sec. This function is only
586 * supported on CN57XX, CN56XX, CN55XX, and CN54XX.
588 * @port: Port to rate limit
589 * @packets_s: Maximum packet/sec
590 * @burst: Maximum number of packets to burst in a row before rate
593 * Returns Zero on success, negative on failure
595 extern int cvmx_pko_rate_limit_packets(int port
, int packets_s
, int burst
);
598 * Rate limit a PKO port to a max bits/sec. This function is only
599 * supported on CN57XX, CN56XX, CN55XX, and CN54XX.
601 * @port: Port to rate limit
602 * @bits_s: PKO rate limit in bits/sec
603 * @burst: Maximum number of bits to burst before rate
606 * Returns Zero on success, negative on failure
608 extern int cvmx_pko_rate_limit_bits(int port
, uint64_t bits_s
, int burst
);
610 #endif /* __CVMX_PKO_H__ */