1 // SPDX-License-Identifier: (GPL-2.0-only OR BSD-3-Clause)
2 /* QLogic qed NIC Driver
3 * Copyright (c) 2015-2017 QLogic Corporation
4 * Copyright (c) 2019-2020 Marvell International Ltd.
7 #include <linux/if_ether.h>
8 #include <linux/if_vlan.h>
10 #include <linux/ipv6.h>
11 #include <linux/spinlock.h>
12 #include <linux/tcp.h>
17 #include "qed_reg_addr.h"
21 #define QED_IWARP_ORD_DEFAULT 32
22 #define QED_IWARP_IRD_DEFAULT 32
23 #define QED_IWARP_MAX_FW_MSS 4120
25 #define QED_EP_SIG 0xecabcdef
32 #define MPA_V2_PEER2PEER_MODEL 0x8000
33 #define MPA_V2_SEND_RTR 0x4000 /* on ird */
34 #define MPA_V2_READ_RTR 0x4000 /* on ord */
35 #define MPA_V2_WRITE_RTR 0x8000
36 #define MPA_V2_IRD_ORD_MASK 0x3FFF
38 #define MPA_REV2(_mpa_rev) ((_mpa_rev) == MPA_NEGOTIATION_TYPE_ENHANCED)
40 #define QED_IWARP_INVALID_TCP_CID 0xffffffff
42 #define QED_IWARP_RCV_WND_SIZE_DEF_BB_2P (200 * 1024)
43 #define QED_IWARP_RCV_WND_SIZE_DEF_BB_4P (100 * 1024)
44 #define QED_IWARP_RCV_WND_SIZE_DEF_AH_2P (150 * 1024)
45 #define QED_IWARP_RCV_WND_SIZE_DEF_AH_4P (90 * 1024)
47 #define QED_IWARP_RCV_WND_SIZE_MIN (0xffff)
48 #define TIMESTAMP_HEADER_SIZE (12)
49 #define QED_IWARP_MAX_FIN_RT_DEFAULT (2)
51 #define QED_IWARP_TS_EN BIT(0)
52 #define QED_IWARP_DA_EN BIT(1)
53 #define QED_IWARP_PARAM_CRC_NEEDED (1)
54 #define QED_IWARP_PARAM_P2P (1)
56 #define QED_IWARP_DEF_MAX_RT_TIME (0)
57 #define QED_IWARP_DEF_CWND_FACTOR (4)
58 #define QED_IWARP_DEF_KA_MAX_PROBE_CNT (5)
59 #define QED_IWARP_DEF_KA_TIMEOUT (1200000) /* 20 min */
60 #define QED_IWARP_DEF_KA_INTERVAL (1000) /* 1 sec */
62 static int qed_iwarp_async_event(struct qed_hwfn
*p_hwfn
, u8 fw_event_code
,
63 __le16 echo
, union event_ring_data
*data
,
66 /* Override devinfo with iWARP specific values */
67 void qed_iwarp_init_devinfo(struct qed_hwfn
*p_hwfn
)
69 struct qed_rdma_device
*dev
= p_hwfn
->p_rdma_info
->dev
;
71 dev
->max_inline
= IWARP_REQ_MAX_INLINE_DATA_SIZE
;
72 dev
->max_qp
= min_t(u32
,
74 p_hwfn
->p_rdma_info
->num_qps
) -
75 QED_IWARP_PREALLOC_CNT
;
77 dev
->max_cq
= dev
->max_qp
;
79 dev
->max_qp_resp_rd_atomic_resc
= QED_IWARP_IRD_DEFAULT
;
80 dev
->max_qp_req_rd_atomic_resc
= QED_IWARP_ORD_DEFAULT
;
83 void qed_iwarp_init_hw(struct qed_hwfn
*p_hwfn
, struct qed_ptt
*p_ptt
)
85 p_hwfn
->rdma_prs_search_reg
= PRS_REG_SEARCH_TCP
;
86 qed_wr(p_hwfn
, p_ptt
, p_hwfn
->rdma_prs_search_reg
, 1);
87 p_hwfn
->b_rdma_enabled_in_prs
= true;
90 /* We have two cid maps, one for tcp which should be used only from passive
91 * syn processing and replacing a pre-allocated ep in the list. The second
92 * for active tcp and for QPs.
94 static void qed_iwarp_cid_cleaned(struct qed_hwfn
*p_hwfn
, u32 cid
)
96 cid
-= qed_cxt_get_proto_cid_start(p_hwfn
, p_hwfn
->p_rdma_info
->proto
);
98 spin_lock_bh(&p_hwfn
->p_rdma_info
->lock
);
100 if (cid
< QED_IWARP_PREALLOC_CNT
)
101 qed_bmap_release_id(p_hwfn
, &p_hwfn
->p_rdma_info
->tcp_cid_map
,
104 qed_bmap_release_id(p_hwfn
, &p_hwfn
->p_rdma_info
->cid_map
, cid
);
106 spin_unlock_bh(&p_hwfn
->p_rdma_info
->lock
);
110 qed_iwarp_init_fw_ramrod(struct qed_hwfn
*p_hwfn
,
111 struct iwarp_init_func_ramrod_data
*p_ramrod
)
113 p_ramrod
->iwarp
.ll2_ooo_q_index
=
114 RESC_START(p_hwfn
, QED_LL2_RAM_QUEUE
) +
115 p_hwfn
->p_rdma_info
->iwarp
.ll2_ooo_handle
;
117 p_ramrod
->tcp
.max_fin_rt
= QED_IWARP_MAX_FIN_RT_DEFAULT
;
122 static int qed_iwarp_alloc_cid(struct qed_hwfn
*p_hwfn
, u32
*cid
)
126 spin_lock_bh(&p_hwfn
->p_rdma_info
->lock
);
127 rc
= qed_rdma_bmap_alloc_id(p_hwfn
, &p_hwfn
->p_rdma_info
->cid_map
, cid
);
128 spin_unlock_bh(&p_hwfn
->p_rdma_info
->lock
);
130 DP_NOTICE(p_hwfn
, "Failed in allocating iwarp cid\n");
133 *cid
+= qed_cxt_get_proto_cid_start(p_hwfn
, p_hwfn
->p_rdma_info
->proto
);
135 rc
= qed_cxt_dynamic_ilt_alloc(p_hwfn
, QED_ELEM_CXT
, *cid
);
137 qed_iwarp_cid_cleaned(p_hwfn
, *cid
);
142 static void qed_iwarp_set_tcp_cid(struct qed_hwfn
*p_hwfn
, u32 cid
)
144 cid
-= qed_cxt_get_proto_cid_start(p_hwfn
, p_hwfn
->p_rdma_info
->proto
);
146 spin_lock_bh(&p_hwfn
->p_rdma_info
->lock
);
147 qed_bmap_set_id(p_hwfn
, &p_hwfn
->p_rdma_info
->tcp_cid_map
, cid
);
148 spin_unlock_bh(&p_hwfn
->p_rdma_info
->lock
);
151 /* This function allocates a cid for passive tcp (called from syn receive)
152 * the reason it's separate from the regular cid allocation is because it
153 * is assured that these cids already have ilt allocated. They are preallocated
154 * to ensure that we won't need to allocate memory during syn processing
156 static int qed_iwarp_alloc_tcp_cid(struct qed_hwfn
*p_hwfn
, u32
*cid
)
160 spin_lock_bh(&p_hwfn
->p_rdma_info
->lock
);
162 rc
= qed_rdma_bmap_alloc_id(p_hwfn
,
163 &p_hwfn
->p_rdma_info
->tcp_cid_map
, cid
);
165 spin_unlock_bh(&p_hwfn
->p_rdma_info
->lock
);
168 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
169 "can't allocate iwarp tcp cid max-count=%d\n",
170 p_hwfn
->p_rdma_info
->tcp_cid_map
.max_count
);
172 *cid
= QED_IWARP_INVALID_TCP_CID
;
176 *cid
+= qed_cxt_get_proto_cid_start(p_hwfn
,
177 p_hwfn
->p_rdma_info
->proto
);
181 int qed_iwarp_create_qp(struct qed_hwfn
*p_hwfn
,
182 struct qed_rdma_qp
*qp
,
183 struct qed_rdma_create_qp_out_params
*out_params
)
185 struct iwarp_create_qp_ramrod_data
*p_ramrod
;
186 struct qed_sp_init_data init_data
;
187 struct qed_spq_entry
*p_ent
;
192 qp
->shared_queue
= dma_alloc_coherent(&p_hwfn
->cdev
->pdev
->dev
,
193 IWARP_SHARED_QUEUE_PAGE_SIZE
,
194 &qp
->shared_queue_phys_addr
,
196 if (!qp
->shared_queue
)
199 out_params
->sq_pbl_virt
= (u8
*)qp
->shared_queue
+
200 IWARP_SHARED_QUEUE_PAGE_SQ_PBL_OFFSET
;
201 out_params
->sq_pbl_phys
= qp
->shared_queue_phys_addr
+
202 IWARP_SHARED_QUEUE_PAGE_SQ_PBL_OFFSET
;
203 out_params
->rq_pbl_virt
= (u8
*)qp
->shared_queue
+
204 IWARP_SHARED_QUEUE_PAGE_RQ_PBL_OFFSET
;
205 out_params
->rq_pbl_phys
= qp
->shared_queue_phys_addr
+
206 IWARP_SHARED_QUEUE_PAGE_RQ_PBL_OFFSET
;
208 rc
= qed_iwarp_alloc_cid(p_hwfn
, &cid
);
214 memset(&init_data
, 0, sizeof(init_data
));
215 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
216 init_data
.cid
= qp
->icid
;
217 init_data
.comp_mode
= QED_SPQ_MODE_EBLOCK
;
219 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
220 IWARP_RAMROD_CMD_ID_CREATE_QP
,
221 PROTOCOLID_IWARP
, &init_data
);
225 p_ramrod
= &p_ent
->ramrod
.iwarp_create_qp
;
227 SET_FIELD(p_ramrod
->flags
,
228 IWARP_CREATE_QP_RAMROD_DATA_FMR_AND_RESERVED_EN
,
229 qp
->fmr_and_reserved_lkey
);
231 SET_FIELD(p_ramrod
->flags
,
232 IWARP_CREATE_QP_RAMROD_DATA_SIGNALED_COMP
, qp
->signal_all
);
234 SET_FIELD(p_ramrod
->flags
,
235 IWARP_CREATE_QP_RAMROD_DATA_RDMA_RD_EN
,
236 qp
->incoming_rdma_read_en
);
238 SET_FIELD(p_ramrod
->flags
,
239 IWARP_CREATE_QP_RAMROD_DATA_RDMA_WR_EN
,
240 qp
->incoming_rdma_write_en
);
242 SET_FIELD(p_ramrod
->flags
,
243 IWARP_CREATE_QP_RAMROD_DATA_ATOMIC_EN
,
244 qp
->incoming_atomic_en
);
246 SET_FIELD(p_ramrod
->flags
,
247 IWARP_CREATE_QP_RAMROD_DATA_SRQ_FLG
, qp
->use_srq
);
249 p_ramrod
->pd
= cpu_to_le16(qp
->pd
);
250 p_ramrod
->sq_num_pages
= cpu_to_le16(qp
->sq_num_pages
);
251 p_ramrod
->rq_num_pages
= cpu_to_le16(qp
->rq_num_pages
);
253 p_ramrod
->srq_id
.srq_idx
= cpu_to_le16(qp
->srq_id
);
254 p_ramrod
->srq_id
.opaque_fid
= cpu_to_le16(p_hwfn
->hw_info
.opaque_fid
);
255 p_ramrod
->qp_handle_for_cqe
.hi
= qp
->qp_handle
.hi
;
256 p_ramrod
->qp_handle_for_cqe
.lo
= qp
->qp_handle
.lo
;
258 p_ramrod
->cq_cid_for_sq
=
259 cpu_to_le32((p_hwfn
->hw_info
.opaque_fid
<< 16) | qp
->sq_cq_id
);
260 p_ramrod
->cq_cid_for_rq
=
261 cpu_to_le32((p_hwfn
->hw_info
.opaque_fid
<< 16) | qp
->rq_cq_id
);
263 p_ramrod
->dpi
= cpu_to_le16(qp
->dpi
);
265 physical_queue
= qed_get_cm_pq_idx(p_hwfn
, PQ_FLAGS_OFLD
);
266 p_ramrod
->physical_q0
= cpu_to_le16(physical_queue
);
267 physical_queue
= qed_get_cm_pq_idx(p_hwfn
, PQ_FLAGS_ACK
);
268 p_ramrod
->physical_q1
= cpu_to_le16(physical_queue
);
270 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
277 qed_iwarp_cid_cleaned(p_hwfn
, cid
);
279 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
,
280 IWARP_SHARED_QUEUE_PAGE_SIZE
,
281 qp
->shared_queue
, qp
->shared_queue_phys_addr
);
286 static int qed_iwarp_modify_fw(struct qed_hwfn
*p_hwfn
, struct qed_rdma_qp
*qp
)
288 struct iwarp_modify_qp_ramrod_data
*p_ramrod
;
289 struct qed_sp_init_data init_data
;
290 struct qed_spq_entry
*p_ent
;
291 u16 flags
, trans_to_state
;
295 memset(&init_data
, 0, sizeof(init_data
));
296 init_data
.cid
= qp
->icid
;
297 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
298 init_data
.comp_mode
= QED_SPQ_MODE_EBLOCK
;
300 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
301 IWARP_RAMROD_CMD_ID_MODIFY_QP
,
302 p_hwfn
->p_rdma_info
->proto
, &init_data
);
306 p_ramrod
= &p_ent
->ramrod
.iwarp_modify_qp
;
308 flags
= le16_to_cpu(p_ramrod
->flags
);
309 SET_FIELD(flags
, IWARP_MODIFY_QP_RAMROD_DATA_STATE_TRANS_EN
, 0x1);
310 p_ramrod
->flags
= cpu_to_le16(flags
);
312 if (qp
->iwarp_state
== QED_IWARP_QP_STATE_CLOSING
)
313 trans_to_state
= IWARP_MODIFY_QP_STATE_CLOSING
;
315 trans_to_state
= IWARP_MODIFY_QP_STATE_ERROR
;
317 p_ramrod
->transition_to_state
= cpu_to_le16(trans_to_state
);
319 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
321 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x)rc=%d\n", qp
->icid
, rc
);
326 enum qed_iwarp_qp_state
qed_roce2iwarp_state(enum qed_roce_qp_state state
)
329 case QED_ROCE_QP_STATE_RESET
:
330 case QED_ROCE_QP_STATE_INIT
:
331 case QED_ROCE_QP_STATE_RTR
:
332 return QED_IWARP_QP_STATE_IDLE
;
333 case QED_ROCE_QP_STATE_RTS
:
334 return QED_IWARP_QP_STATE_RTS
;
335 case QED_ROCE_QP_STATE_SQD
:
336 return QED_IWARP_QP_STATE_CLOSING
;
337 case QED_ROCE_QP_STATE_ERR
:
338 return QED_IWARP_QP_STATE_ERROR
;
339 case QED_ROCE_QP_STATE_SQE
:
340 return QED_IWARP_QP_STATE_TERMINATE
;
342 return QED_IWARP_QP_STATE_ERROR
;
346 static enum qed_roce_qp_state
347 qed_iwarp2roce_state(enum qed_iwarp_qp_state state
)
350 case QED_IWARP_QP_STATE_IDLE
:
351 return QED_ROCE_QP_STATE_INIT
;
352 case QED_IWARP_QP_STATE_RTS
:
353 return QED_ROCE_QP_STATE_RTS
;
354 case QED_IWARP_QP_STATE_TERMINATE
:
355 return QED_ROCE_QP_STATE_SQE
;
356 case QED_IWARP_QP_STATE_CLOSING
:
357 return QED_ROCE_QP_STATE_SQD
;
358 case QED_IWARP_QP_STATE_ERROR
:
359 return QED_ROCE_QP_STATE_ERR
;
361 return QED_ROCE_QP_STATE_ERR
;
365 static const char * const iwarp_state_names
[] = {
374 qed_iwarp_modify_qp(struct qed_hwfn
*p_hwfn
,
375 struct qed_rdma_qp
*qp
,
376 enum qed_iwarp_qp_state new_state
, bool internal
)
378 enum qed_iwarp_qp_state prev_iw_state
;
379 bool modify_fw
= false;
382 /* modify QP can be called from upper-layer or as a result of async
383 * RST/FIN... therefore need to protect
385 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.qp_lock
);
386 prev_iw_state
= qp
->iwarp_state
;
388 if (prev_iw_state
== new_state
) {
389 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.qp_lock
);
393 switch (prev_iw_state
) {
394 case QED_IWARP_QP_STATE_IDLE
:
396 case QED_IWARP_QP_STATE_RTS
:
397 qp
->iwarp_state
= QED_IWARP_QP_STATE_RTS
;
399 case QED_IWARP_QP_STATE_ERROR
:
400 qp
->iwarp_state
= QED_IWARP_QP_STATE_ERROR
;
408 case QED_IWARP_QP_STATE_RTS
:
410 case QED_IWARP_QP_STATE_CLOSING
:
414 qp
->iwarp_state
= QED_IWARP_QP_STATE_CLOSING
;
416 case QED_IWARP_QP_STATE_ERROR
:
419 qp
->iwarp_state
= QED_IWARP_QP_STATE_ERROR
;
425 case QED_IWARP_QP_STATE_ERROR
:
427 case QED_IWARP_QP_STATE_IDLE
:
429 qp
->iwarp_state
= new_state
;
431 case QED_IWARP_QP_STATE_CLOSING
:
432 /* could happen due to race... do nothing.... */
438 case QED_IWARP_QP_STATE_TERMINATE
:
439 case QED_IWARP_QP_STATE_CLOSING
:
440 qp
->iwarp_state
= new_state
;
446 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x) %s --> %s%s\n",
448 iwarp_state_names
[prev_iw_state
],
449 iwarp_state_names
[qp
->iwarp_state
],
450 internal
? "internal" : "");
452 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.qp_lock
);
455 rc
= qed_iwarp_modify_fw(p_hwfn
, qp
);
460 int qed_iwarp_fw_destroy(struct qed_hwfn
*p_hwfn
, struct qed_rdma_qp
*qp
)
462 struct qed_sp_init_data init_data
;
463 struct qed_spq_entry
*p_ent
;
467 memset(&init_data
, 0, sizeof(init_data
));
468 init_data
.cid
= qp
->icid
;
469 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
470 init_data
.comp_mode
= QED_SPQ_MODE_EBLOCK
;
472 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
473 IWARP_RAMROD_CMD_ID_DESTROY_QP
,
474 p_hwfn
->p_rdma_info
->proto
, &init_data
);
478 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
480 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x) rc = %d\n", qp
->icid
, rc
);
485 static void qed_iwarp_destroy_ep(struct qed_hwfn
*p_hwfn
,
486 struct qed_iwarp_ep
*ep
,
487 bool remove_from_active_list
)
489 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
,
490 sizeof(*ep
->ep_buffer_virt
),
491 ep
->ep_buffer_virt
, ep
->ep_buffer_phys
);
493 if (remove_from_active_list
) {
494 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
495 list_del(&ep
->list_entry
);
496 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
505 int qed_iwarp_destroy_qp(struct qed_hwfn
*p_hwfn
, struct qed_rdma_qp
*qp
)
507 struct qed_iwarp_ep
*ep
= qp
->ep
;
511 if (qp
->iwarp_state
!= QED_IWARP_QP_STATE_ERROR
) {
512 rc
= qed_iwarp_modify_qp(p_hwfn
, qp
,
513 QED_IWARP_QP_STATE_ERROR
, false);
518 /* Make sure ep is closed before returning and freeing memory. */
520 while (READ_ONCE(ep
->state
) != QED_IWARP_EP_CLOSED
&&
524 if (ep
->state
!= QED_IWARP_EP_CLOSED
)
525 DP_NOTICE(p_hwfn
, "ep state close timeout state=%x\n",
528 qed_iwarp_destroy_ep(p_hwfn
, ep
, false);
531 rc
= qed_iwarp_fw_destroy(p_hwfn
, qp
);
533 if (qp
->shared_queue
)
534 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
,
535 IWARP_SHARED_QUEUE_PAGE_SIZE
,
536 qp
->shared_queue
, qp
->shared_queue_phys_addr
);
542 qed_iwarp_create_ep(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
**ep_out
)
544 struct qed_iwarp_ep
*ep
;
547 ep
= kzalloc(sizeof(*ep
), GFP_KERNEL
);
551 ep
->state
= QED_IWARP_EP_INIT
;
553 ep
->ep_buffer_virt
= dma_alloc_coherent(&p_hwfn
->cdev
->pdev
->dev
,
554 sizeof(*ep
->ep_buffer_virt
),
557 if (!ep
->ep_buffer_virt
) {
562 ep
->sig
= QED_EP_SIG
;
574 qed_iwarp_print_tcp_ramrod(struct qed_hwfn
*p_hwfn
,
575 struct iwarp_tcp_offload_ramrod_data
*p_tcp_ramrod
)
577 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "local_mac=%x %x %x, remote_mac=%x %x %x\n",
578 p_tcp_ramrod
->tcp
.local_mac_addr_lo
,
579 p_tcp_ramrod
->tcp
.local_mac_addr_mid
,
580 p_tcp_ramrod
->tcp
.local_mac_addr_hi
,
581 p_tcp_ramrod
->tcp
.remote_mac_addr_lo
,
582 p_tcp_ramrod
->tcp
.remote_mac_addr_mid
,
583 p_tcp_ramrod
->tcp
.remote_mac_addr_hi
);
585 if (p_tcp_ramrod
->tcp
.ip_version
== TCP_IPV4
) {
586 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
587 "local_ip=%pI4h:%x, remote_ip=%pI4h:%x, vlan=%x\n",
588 p_tcp_ramrod
->tcp
.local_ip
,
589 p_tcp_ramrod
->tcp
.local_port
,
590 p_tcp_ramrod
->tcp
.remote_ip
,
591 p_tcp_ramrod
->tcp
.remote_port
,
592 p_tcp_ramrod
->tcp
.vlan_id
);
594 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
595 "local_ip=%pI6:%x, remote_ip=%pI6:%x, vlan=%x\n",
596 p_tcp_ramrod
->tcp
.local_ip
,
597 p_tcp_ramrod
->tcp
.local_port
,
598 p_tcp_ramrod
->tcp
.remote_ip
,
599 p_tcp_ramrod
->tcp
.remote_port
,
600 p_tcp_ramrod
->tcp
.vlan_id
);
603 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
604 "flow_label=%x, ttl=%x, tos_or_tc=%x, mss=%x, rcv_wnd_scale=%x, connect_mode=%x, flags=%x\n",
605 p_tcp_ramrod
->tcp
.flow_label
,
606 p_tcp_ramrod
->tcp
.ttl
,
607 p_tcp_ramrod
->tcp
.tos_or_tc
,
608 p_tcp_ramrod
->tcp
.mss
,
609 p_tcp_ramrod
->tcp
.rcv_wnd_scale
,
610 p_tcp_ramrod
->tcp
.connect_mode
,
611 p_tcp_ramrod
->tcp
.flags
);
613 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "syn_ip_payload_length=%x, lo=%x, hi=%x\n",
614 p_tcp_ramrod
->tcp
.syn_ip_payload_length
,
615 p_tcp_ramrod
->tcp
.syn_phy_addr_lo
,
616 p_tcp_ramrod
->tcp
.syn_phy_addr_hi
);
620 qed_iwarp_tcp_offload(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
622 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
623 struct iwarp_tcp_offload_ramrod_data
*p_tcp_ramrod
;
624 struct tcp_offload_params_opt2
*tcp
;
625 struct qed_sp_init_data init_data
;
626 struct qed_spq_entry
*p_ent
;
627 dma_addr_t async_output_phys
;
628 dma_addr_t in_pdata_phys
;
635 memset(&init_data
, 0, sizeof(init_data
));
636 init_data
.cid
= ep
->tcp_cid
;
637 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
638 if (ep
->connect_mode
== TCP_CONNECT_PASSIVE
)
639 init_data
.comp_mode
= QED_SPQ_MODE_CB
;
641 init_data
.comp_mode
= QED_SPQ_MODE_EBLOCK
;
643 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
644 IWARP_RAMROD_CMD_ID_TCP_OFFLOAD
,
645 PROTOCOLID_IWARP
, &init_data
);
649 p_tcp_ramrod
= &p_ent
->ramrod
.iwarp_tcp_offload
;
651 in_pdata_phys
= ep
->ep_buffer_phys
+
652 offsetof(struct qed_iwarp_ep_memory
, in_pdata
);
653 DMA_REGPAIR_LE(p_tcp_ramrod
->iwarp
.incoming_ulp_buffer
.addr
,
656 p_tcp_ramrod
->iwarp
.incoming_ulp_buffer
.len
=
657 cpu_to_le16(sizeof(ep
->ep_buffer_virt
->in_pdata
));
659 async_output_phys
= ep
->ep_buffer_phys
+
660 offsetof(struct qed_iwarp_ep_memory
, async_output
);
661 DMA_REGPAIR_LE(p_tcp_ramrod
->iwarp
.async_eqe_output_buf
,
664 p_tcp_ramrod
->iwarp
.handle_for_async
.hi
= cpu_to_le32(PTR_HI(ep
));
665 p_tcp_ramrod
->iwarp
.handle_for_async
.lo
= cpu_to_le32(PTR_LO(ep
));
667 physical_q
= qed_get_cm_pq_idx(p_hwfn
, PQ_FLAGS_OFLD
);
668 p_tcp_ramrod
->iwarp
.physical_q0
= cpu_to_le16(physical_q
);
669 physical_q
= qed_get_cm_pq_idx(p_hwfn
, PQ_FLAGS_ACK
);
670 p_tcp_ramrod
->iwarp
.physical_q1
= cpu_to_le16(physical_q
);
671 p_tcp_ramrod
->iwarp
.mpa_mode
= iwarp_info
->mpa_rev
;
673 tcp
= &p_tcp_ramrod
->tcp
;
674 qed_set_fw_mac_addr(&tcp
->remote_mac_addr_hi
,
675 &tcp
->remote_mac_addr_mid
,
676 &tcp
->remote_mac_addr_lo
, ep
->remote_mac_addr
);
677 qed_set_fw_mac_addr(&tcp
->local_mac_addr_hi
, &tcp
->local_mac_addr_mid
,
678 &tcp
->local_mac_addr_lo
, ep
->local_mac_addr
);
680 tcp
->vlan_id
= cpu_to_le16(ep
->cm_info
.vlan
);
682 tcp_flags
= p_hwfn
->p_rdma_info
->iwarp
.tcp_flags
;
684 SET_FIELD(flags
, TCP_OFFLOAD_PARAMS_OPT2_TS_EN
,
685 !!(tcp_flags
& QED_IWARP_TS_EN
));
687 SET_FIELD(flags
, TCP_OFFLOAD_PARAMS_OPT2_DA_EN
,
688 !!(tcp_flags
& QED_IWARP_DA_EN
));
690 tcp
->flags
= cpu_to_le16(flags
);
691 tcp
->ip_version
= ep
->cm_info
.ip_version
;
693 for (i
= 0; i
< 4; i
++) {
694 tcp
->remote_ip
[i
] = cpu_to_le32(ep
->cm_info
.remote_ip
[i
]);
695 tcp
->local_ip
[i
] = cpu_to_le32(ep
->cm_info
.local_ip
[i
]);
698 tcp
->remote_port
= cpu_to_le16(ep
->cm_info
.remote_port
);
699 tcp
->local_port
= cpu_to_le16(ep
->cm_info
.local_port
);
700 tcp
->mss
= cpu_to_le16(ep
->mss
);
705 tcp
->max_rt_time
= QED_IWARP_DEF_MAX_RT_TIME
;
706 tcp
->cwnd
= cpu_to_le32(QED_IWARP_DEF_CWND_FACTOR
* ep
->mss
);
707 tcp
->ka_max_probe_cnt
= QED_IWARP_DEF_KA_MAX_PROBE_CNT
;
708 tcp
->ka_timeout
= cpu_to_le32(QED_IWARP_DEF_KA_TIMEOUT
);
709 tcp
->ka_interval
= cpu_to_le32(QED_IWARP_DEF_KA_INTERVAL
);
711 tcp
->rcv_wnd_scale
= (u8
)p_hwfn
->p_rdma_info
->iwarp
.rcv_wnd_scale
;
712 tcp
->connect_mode
= ep
->connect_mode
;
714 if (ep
->connect_mode
== TCP_CONNECT_PASSIVE
) {
715 tcp
->syn_ip_payload_length
=
716 cpu_to_le16(ep
->syn_ip_payload_length
);
717 tcp
->syn_phy_addr_hi
= DMA_HI_LE(ep
->syn_phy_addr
);
718 tcp
->syn_phy_addr_lo
= DMA_LO_LE(ep
->syn_phy_addr
);
721 qed_iwarp_print_tcp_ramrod(p_hwfn
, p_tcp_ramrod
);
723 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
725 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
726 "EP(0x%x) Offload completed rc=%d\n", ep
->tcp_cid
, rc
);
732 qed_iwarp_mpa_received(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
734 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
735 struct qed_iwarp_cm_event_params params
;
736 struct mpa_v2_hdr
*mpa_v2
;
737 union async_output
*async_data
;
738 u16 mpa_ord
, mpa_ird
;
743 async_data
= &ep
->ep_buffer_virt
->async_output
;
745 mpa_rev
= async_data
->mpa_request
.mpa_handshake_mode
;
746 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
747 "private_data_len=%x handshake_mode=%x private_data=(%x)\n",
748 async_data
->mpa_request
.ulp_data_len
,
749 mpa_rev
, *((u32
*)(ep
->ep_buffer_virt
->in_pdata
)));
751 if (mpa_rev
== MPA_NEGOTIATION_TYPE_ENHANCED
) {
752 /* Read ord/ird values from private data buffer */
753 mpa_v2
= (struct mpa_v2_hdr
*)ep
->ep_buffer_virt
->in_pdata
;
754 mpa_hdr_size
= sizeof(*mpa_v2
);
756 mpa_ord
= ntohs(mpa_v2
->ord
);
757 mpa_ird
= ntohs(mpa_v2
->ird
);
759 /* Temprary store in cm_info incoming ord/ird requested, later
760 * replace with negotiated value during accept
762 ep
->cm_info
.ord
= (u8
)min_t(u16
,
763 (mpa_ord
& MPA_V2_IRD_ORD_MASK
),
764 QED_IWARP_ORD_DEFAULT
);
766 ep
->cm_info
.ird
= (u8
)min_t(u16
,
767 (mpa_ird
& MPA_V2_IRD_ORD_MASK
),
768 QED_IWARP_IRD_DEFAULT
);
770 /* Peer2Peer negotiation */
771 ep
->rtr_type
= MPA_RTR_TYPE_NONE
;
772 if (mpa_ird
& MPA_V2_PEER2PEER_MODEL
) {
773 if (mpa_ord
& MPA_V2_WRITE_RTR
)
774 ep
->rtr_type
|= MPA_RTR_TYPE_ZERO_WRITE
;
776 if (mpa_ord
& MPA_V2_READ_RTR
)
777 ep
->rtr_type
|= MPA_RTR_TYPE_ZERO_READ
;
779 if (mpa_ird
& MPA_V2_SEND_RTR
)
780 ep
->rtr_type
|= MPA_RTR_TYPE_ZERO_SEND
;
782 ep
->rtr_type
&= iwarp_info
->rtr_type
;
784 /* if we're left with no match send our capabilities */
785 if (ep
->rtr_type
== MPA_RTR_TYPE_NONE
)
786 ep
->rtr_type
= iwarp_info
->rtr_type
;
789 ep
->mpa_rev
= MPA_NEGOTIATION_TYPE_ENHANCED
;
791 ep
->cm_info
.ord
= QED_IWARP_ORD_DEFAULT
;
792 ep
->cm_info
.ird
= QED_IWARP_IRD_DEFAULT
;
793 ep
->mpa_rev
= MPA_NEGOTIATION_TYPE_BASIC
;
796 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
797 "MPA_NEGOTIATE (v%d): ORD: 0x%x IRD: 0x%x rtr:0x%x ulp_data_len = %x mpa_hdr_size = %x\n",
798 mpa_rev
, ep
->cm_info
.ord
, ep
->cm_info
.ird
, ep
->rtr_type
,
799 async_data
->mpa_request
.ulp_data_len
, mpa_hdr_size
);
801 /* Strip mpa v2 hdr from private data before sending to upper layer */
802 ep
->cm_info
.private_data
= ep
->ep_buffer_virt
->in_pdata
+ mpa_hdr_size
;
804 ulp_data_len
= le16_to_cpu(async_data
->mpa_request
.ulp_data_len
);
805 ep
->cm_info
.private_data_len
= ulp_data_len
- mpa_hdr_size
;
807 params
.event
= QED_IWARP_EVENT_MPA_REQUEST
;
808 params
.cm_info
= &ep
->cm_info
;
809 params
.ep_context
= ep
;
812 ep
->state
= QED_IWARP_EP_MPA_REQ_RCVD
;
813 ep
->event_cb(ep
->cb_context
, ¶ms
);
817 qed_iwarp_mpa_offload(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
819 struct iwarp_mpa_offload_ramrod_data
*p_mpa_ramrod
;
820 struct mpa_outgoing_params
*common
;
821 struct qed_iwarp_info
*iwarp_info
;
822 struct qed_sp_init_data init_data
;
823 dma_addr_t async_output_phys
;
824 struct qed_spq_entry
*p_ent
;
825 dma_addr_t out_pdata_phys
;
826 dma_addr_t in_pdata_phys
;
827 struct qed_rdma_qp
*qp
;
838 memset(&init_data
, 0, sizeof(init_data
));
839 init_data
.cid
= reject
? ep
->tcp_cid
: qp
->icid
;
840 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
842 if (ep
->connect_mode
== TCP_CONNECT_ACTIVE
)
843 init_data
.comp_mode
= QED_SPQ_MODE_CB
;
845 init_data
.comp_mode
= QED_SPQ_MODE_EBLOCK
;
847 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
848 IWARP_RAMROD_CMD_ID_MPA_OFFLOAD
,
849 PROTOCOLID_IWARP
, &init_data
);
853 p_mpa_ramrod
= &p_ent
->ramrod
.iwarp_mpa_offload
;
854 common
= &p_mpa_ramrod
->common
;
856 out_pdata_phys
= ep
->ep_buffer_phys
+
857 offsetof(struct qed_iwarp_ep_memory
, out_pdata
);
858 DMA_REGPAIR_LE(common
->outgoing_ulp_buffer
.addr
, out_pdata_phys
);
860 val
= ep
->cm_info
.private_data_len
;
861 common
->outgoing_ulp_buffer
.len
= cpu_to_le16(val
);
862 common
->crc_needed
= p_hwfn
->p_rdma_info
->iwarp
.crc_needed
;
864 common
->out_rq
.ord
= cpu_to_le32(ep
->cm_info
.ord
);
865 common
->out_rq
.ird
= cpu_to_le32(ep
->cm_info
.ird
);
867 val
= p_hwfn
->hw_info
.opaque_fid
<< 16 | ep
->tcp_cid
;
868 p_mpa_ramrod
->tcp_cid
= cpu_to_le32(val
);
870 in_pdata_phys
= ep
->ep_buffer_phys
+
871 offsetof(struct qed_iwarp_ep_memory
, in_pdata
);
872 p_mpa_ramrod
->tcp_connect_side
= ep
->connect_mode
;
873 DMA_REGPAIR_LE(p_mpa_ramrod
->incoming_ulp_buffer
.addr
,
875 p_mpa_ramrod
->incoming_ulp_buffer
.len
=
876 cpu_to_le16(sizeof(ep
->ep_buffer_virt
->in_pdata
));
877 async_output_phys
= ep
->ep_buffer_phys
+
878 offsetof(struct qed_iwarp_ep_memory
, async_output
);
879 DMA_REGPAIR_LE(p_mpa_ramrod
->async_eqe_output_buf
,
881 p_mpa_ramrod
->handle_for_async
.hi
= cpu_to_le32(PTR_HI(ep
));
882 p_mpa_ramrod
->handle_for_async
.lo
= cpu_to_le32(PTR_LO(ep
));
885 DMA_REGPAIR_LE(p_mpa_ramrod
->shared_queue_addr
,
886 qp
->shared_queue_phys_addr
);
887 p_mpa_ramrod
->stats_counter_id
=
888 RESC_START(p_hwfn
, QED_RDMA_STATS_QUEUE
) + qp
->stats_queue
;
893 iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
894 p_mpa_ramrod
->rcv_wnd
= cpu_to_le16(iwarp_info
->rcv_wnd_size
);
895 p_mpa_ramrod
->mode
= ep
->mpa_rev
;
896 SET_FIELD(p_mpa_ramrod
->rtr_pref
,
897 IWARP_MPA_OFFLOAD_RAMROD_DATA_RTR_SUPPORTED
, ep
->rtr_type
);
899 ep
->state
= QED_IWARP_EP_MPA_OFFLOADED
;
900 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
902 ep
->cid
= qp
->icid
; /* Now they're migrated. */
906 "QP(0x%x) EP(0x%x) MPA Offload rc = %d IRD=0x%x ORD=0x%x rtr_type=%d mpa_rev=%d reject=%d\n",
907 reject
? 0xffff : qp
->icid
,
911 ep
->cm_info
.ord
, ep
->rtr_type
, ep
->mpa_rev
, reject
);
916 qed_iwarp_return_ep(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
918 ep
->state
= QED_IWARP_EP_INIT
;
922 memset(&ep
->cm_info
, 0, sizeof(ep
->cm_info
));
924 if (ep
->tcp_cid
== QED_IWARP_INVALID_TCP_CID
) {
925 /* We don't care about the return code, it's ok if tcp_cid
926 * remains invalid...in this case we'll defer allocation
928 qed_iwarp_alloc_tcp_cid(p_hwfn
, &ep
->tcp_cid
);
930 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
932 list_move_tail(&ep
->list_entry
,
933 &p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
);
935 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
939 qed_iwarp_parse_private_data(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
941 struct mpa_v2_hdr
*mpa_v2_params
;
942 union async_output
*async_data
;
943 u16 mpa_ird
, mpa_ord
;
944 u8 mpa_data_size
= 0;
947 if (MPA_REV2(p_hwfn
->p_rdma_info
->iwarp
.mpa_rev
)) {
949 (struct mpa_v2_hdr
*)(ep
->ep_buffer_virt
->in_pdata
);
950 mpa_data_size
= sizeof(*mpa_v2_params
);
951 mpa_ird
= ntohs(mpa_v2_params
->ird
);
952 mpa_ord
= ntohs(mpa_v2_params
->ord
);
954 ep
->cm_info
.ird
= (u8
)(mpa_ord
& MPA_V2_IRD_ORD_MASK
);
955 ep
->cm_info
.ord
= (u8
)(mpa_ird
& MPA_V2_IRD_ORD_MASK
);
958 async_data
= &ep
->ep_buffer_virt
->async_output
;
959 ep
->cm_info
.private_data
= ep
->ep_buffer_virt
->in_pdata
+ mpa_data_size
;
961 ulp_data_len
= le16_to_cpu(async_data
->mpa_response
.ulp_data_len
);
962 ep
->cm_info
.private_data_len
= ulp_data_len
- mpa_data_size
;
966 qed_iwarp_mpa_reply_arrived(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
968 struct qed_iwarp_cm_event_params params
;
970 if (ep
->connect_mode
== TCP_CONNECT_PASSIVE
) {
972 "MPA reply event not expected on passive side!\n");
976 params
.event
= QED_IWARP_EVENT_ACTIVE_MPA_REPLY
;
978 qed_iwarp_parse_private_data(p_hwfn
, ep
);
980 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
981 "MPA_NEGOTIATE (v%d): ORD: 0x%x IRD: 0x%x\n",
982 ep
->mpa_rev
, ep
->cm_info
.ord
, ep
->cm_info
.ird
);
984 params
.cm_info
= &ep
->cm_info
;
985 params
.ep_context
= ep
;
988 ep
->mpa_reply_processed
= true;
990 ep
->event_cb(ep
->cb_context
, ¶ms
);
993 #define QED_IWARP_CONNECT_MODE_STRING(ep) \
994 ((ep)->connect_mode == TCP_CONNECT_PASSIVE) ? "Passive" : "Active"
996 /* Called as a result of the event:
997 * IWARP_EVENT_TYPE_ASYNC_MPA_HANDSHAKE_COMPLETE
1000 qed_iwarp_mpa_complete(struct qed_hwfn
*p_hwfn
,
1001 struct qed_iwarp_ep
*ep
, u8 fw_return_code
)
1003 struct qed_iwarp_cm_event_params params
;
1005 if (ep
->connect_mode
== TCP_CONNECT_ACTIVE
)
1006 params
.event
= QED_IWARP_EVENT_ACTIVE_COMPLETE
;
1008 params
.event
= QED_IWARP_EVENT_PASSIVE_COMPLETE
;
1010 if (ep
->connect_mode
== TCP_CONNECT_ACTIVE
&& !ep
->mpa_reply_processed
)
1011 qed_iwarp_parse_private_data(p_hwfn
, ep
);
1013 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1014 "MPA_NEGOTIATE (v%d): ORD: 0x%x IRD: 0x%x\n",
1015 ep
->mpa_rev
, ep
->cm_info
.ord
, ep
->cm_info
.ird
);
1017 params
.cm_info
= &ep
->cm_info
;
1019 params
.ep_context
= ep
;
1021 switch (fw_return_code
) {
1022 case RDMA_RETURN_OK
:
1023 ep
->qp
->max_rd_atomic_req
= ep
->cm_info
.ord
;
1024 ep
->qp
->max_rd_atomic_resp
= ep
->cm_info
.ird
;
1025 qed_iwarp_modify_qp(p_hwfn
, ep
->qp
, QED_IWARP_QP_STATE_RTS
, 1);
1026 ep
->state
= QED_IWARP_EP_ESTABLISHED
;
1029 case IWARP_CONN_ERROR_MPA_TIMEOUT
:
1030 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA timeout\n",
1031 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1032 params
.status
= -EBUSY
;
1034 case IWARP_CONN_ERROR_MPA_ERROR_REJECT
:
1035 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA Reject\n",
1036 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1037 params
.status
= -ECONNREFUSED
;
1039 case IWARP_CONN_ERROR_MPA_RST
:
1040 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA reset(tcp cid: 0x%x)\n",
1041 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
,
1043 params
.status
= -ECONNRESET
;
1045 case IWARP_CONN_ERROR_MPA_FIN
:
1046 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA received FIN\n",
1047 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1048 params
.status
= -ECONNREFUSED
;
1050 case IWARP_CONN_ERROR_MPA_INSUF_IRD
:
1051 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA insufficient ird\n",
1052 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1053 params
.status
= -ECONNREFUSED
;
1055 case IWARP_CONN_ERROR_MPA_RTR_MISMATCH
:
1056 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA RTR MISMATCH\n",
1057 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1058 params
.status
= -ECONNREFUSED
;
1060 case IWARP_CONN_ERROR_MPA_INVALID_PACKET
:
1061 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA Invalid Packet\n",
1062 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1063 params
.status
= -ECONNREFUSED
;
1065 case IWARP_CONN_ERROR_MPA_LOCAL_ERROR
:
1066 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA Local Error\n",
1067 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1068 params
.status
= -ECONNREFUSED
;
1070 case IWARP_CONN_ERROR_MPA_TERMINATE
:
1071 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA TERMINATE\n",
1072 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->cid
);
1073 params
.status
= -ECONNREFUSED
;
1076 params
.status
= -ECONNRESET
;
1080 if (fw_return_code
!= RDMA_RETURN_OK
)
1081 /* paired with READ_ONCE in destroy_qp */
1082 smp_store_release(&ep
->state
, QED_IWARP_EP_CLOSED
);
1084 ep
->event_cb(ep
->cb_context
, ¶ms
);
1086 /* on passive side, if there is no associated QP (REJECT) we need to
1087 * return the ep to the pool, (in the regular case we add an element
1088 * in accept instead of this one.
1089 * In both cases we need to remove it from the ep_list.
1091 if (fw_return_code
!= RDMA_RETURN_OK
) {
1092 ep
->tcp_cid
= QED_IWARP_INVALID_TCP_CID
;
1093 if ((ep
->connect_mode
== TCP_CONNECT_PASSIVE
) &&
1094 (!ep
->qp
)) { /* Rejected */
1095 qed_iwarp_return_ep(p_hwfn
, ep
);
1097 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1098 list_del(&ep
->list_entry
);
1099 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1105 qed_iwarp_mpa_v2_set_private(struct qed_hwfn
*p_hwfn
,
1106 struct qed_iwarp_ep
*ep
, u8
*mpa_data_size
)
1108 struct mpa_v2_hdr
*mpa_v2_params
;
1109 u16 mpa_ird
, mpa_ord
;
1112 if (MPA_REV2(ep
->mpa_rev
)) {
1114 (struct mpa_v2_hdr
*)ep
->ep_buffer_virt
->out_pdata
;
1115 *mpa_data_size
= sizeof(*mpa_v2_params
);
1117 mpa_ird
= (u16
)ep
->cm_info
.ird
;
1118 mpa_ord
= (u16
)ep
->cm_info
.ord
;
1120 if (ep
->rtr_type
!= MPA_RTR_TYPE_NONE
) {
1121 mpa_ird
|= MPA_V2_PEER2PEER_MODEL
;
1123 if (ep
->rtr_type
& MPA_RTR_TYPE_ZERO_SEND
)
1124 mpa_ird
|= MPA_V2_SEND_RTR
;
1126 if (ep
->rtr_type
& MPA_RTR_TYPE_ZERO_WRITE
)
1127 mpa_ord
|= MPA_V2_WRITE_RTR
;
1129 if (ep
->rtr_type
& MPA_RTR_TYPE_ZERO_READ
)
1130 mpa_ord
|= MPA_V2_READ_RTR
;
1133 mpa_v2_params
->ird
= htons(mpa_ird
);
1134 mpa_v2_params
->ord
= htons(mpa_ord
);
1138 "MPA_NEGOTIATE Header: [%x ord:%x ird] %x ord:%x ird:%x peer2peer:%x rtr_send:%x rtr_write:%x rtr_read:%x\n",
1141 *((u32
*)mpa_v2_params
),
1142 mpa_ord
& MPA_V2_IRD_ORD_MASK
,
1143 mpa_ird
& MPA_V2_IRD_ORD_MASK
,
1144 !!(mpa_ird
& MPA_V2_PEER2PEER_MODEL
),
1145 !!(mpa_ird
& MPA_V2_SEND_RTR
),
1146 !!(mpa_ord
& MPA_V2_WRITE_RTR
),
1147 !!(mpa_ord
& MPA_V2_READ_RTR
));
1151 int qed_iwarp_connect(void *rdma_cxt
,
1152 struct qed_iwarp_connect_in
*iparams
,
1153 struct qed_iwarp_connect_out
*oparams
)
1155 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
1156 struct qed_iwarp_info
*iwarp_info
;
1157 struct qed_iwarp_ep
*ep
;
1158 u8 mpa_data_size
= 0;
1162 if ((iparams
->cm_info
.ord
> QED_IWARP_ORD_DEFAULT
) ||
1163 (iparams
->cm_info
.ird
> QED_IWARP_IRD_DEFAULT
)) {
1165 "QP(0x%x) ERROR: Invalid ord(0x%x)/ird(0x%x)\n",
1166 iparams
->qp
->icid
, iparams
->cm_info
.ord
,
1167 iparams
->cm_info
.ird
);
1172 iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
1174 /* Allocate ep object */
1175 rc
= qed_iwarp_alloc_cid(p_hwfn
, &cid
);
1179 rc
= qed_iwarp_create_ep(p_hwfn
, &ep
);
1185 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1186 list_add_tail(&ep
->list_entry
, &p_hwfn
->p_rdma_info
->iwarp
.ep_list
);
1187 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1189 ep
->qp
= iparams
->qp
;
1191 ether_addr_copy(ep
->remote_mac_addr
, iparams
->remote_mac_addr
);
1192 ether_addr_copy(ep
->local_mac_addr
, iparams
->local_mac_addr
);
1193 memcpy(&ep
->cm_info
, &iparams
->cm_info
, sizeof(ep
->cm_info
));
1195 ep
->cm_info
.ord
= iparams
->cm_info
.ord
;
1196 ep
->cm_info
.ird
= iparams
->cm_info
.ird
;
1198 ep
->rtr_type
= iwarp_info
->rtr_type
;
1199 if (!iwarp_info
->peer2peer
)
1200 ep
->rtr_type
= MPA_RTR_TYPE_NONE
;
1202 if ((ep
->rtr_type
& MPA_RTR_TYPE_ZERO_READ
) && (ep
->cm_info
.ord
== 0))
1203 ep
->cm_info
.ord
= 1;
1205 ep
->mpa_rev
= iwarp_info
->mpa_rev
;
1207 qed_iwarp_mpa_v2_set_private(p_hwfn
, ep
, &mpa_data_size
);
1209 ep
->cm_info
.private_data
= ep
->ep_buffer_virt
->out_pdata
;
1210 ep
->cm_info
.private_data_len
= iparams
->cm_info
.private_data_len
+
1213 memcpy((u8
*)ep
->ep_buffer_virt
->out_pdata
+ mpa_data_size
,
1214 iparams
->cm_info
.private_data
,
1215 iparams
->cm_info
.private_data_len
);
1217 ep
->mss
= iparams
->mss
;
1218 ep
->mss
= min_t(u16
, QED_IWARP_MAX_FW_MSS
, ep
->mss
);
1220 ep
->event_cb
= iparams
->event_cb
;
1221 ep
->cb_context
= iparams
->cb_context
;
1222 ep
->connect_mode
= TCP_CONNECT_ACTIVE
;
1224 oparams
->ep_context
= ep
;
1226 rc
= qed_iwarp_tcp_offload(p_hwfn
, ep
);
1228 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x) EP(0x%x) rc = %d\n",
1229 iparams
->qp
->icid
, ep
->tcp_cid
, rc
);
1232 qed_iwarp_destroy_ep(p_hwfn
, ep
, true);
1238 qed_iwarp_cid_cleaned(p_hwfn
, cid
);
1243 static struct qed_iwarp_ep
*qed_iwarp_get_free_ep(struct qed_hwfn
*p_hwfn
)
1245 struct qed_iwarp_ep
*ep
= NULL
;
1248 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1250 if (list_empty(&p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
)) {
1251 DP_ERR(p_hwfn
, "Ep list is empty\n");
1255 ep
= list_first_entry(&p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
,
1256 struct qed_iwarp_ep
, list_entry
);
1258 /* in some cases we could have failed allocating a tcp cid when added
1259 * from accept / failure... retry now..this is not the common case.
1261 if (ep
->tcp_cid
== QED_IWARP_INVALID_TCP_CID
) {
1262 rc
= qed_iwarp_alloc_tcp_cid(p_hwfn
, &ep
->tcp_cid
);
1264 /* if we fail we could look for another entry with a valid
1265 * tcp_cid, but since we don't expect to reach this anyway
1266 * it's not worth the handling
1269 ep
->tcp_cid
= QED_IWARP_INVALID_TCP_CID
;
1275 list_del(&ep
->list_entry
);
1278 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1282 #define QED_IWARP_MAX_CID_CLEAN_TIME 100
1283 #define QED_IWARP_MAX_NO_PROGRESS_CNT 5
1285 /* This function waits for all the bits of a bmap to be cleared, as long as
1286 * there is progress ( i.e. the number of bits left to be cleared decreases )
1287 * the function continues.
1290 qed_iwarp_wait_cid_map_cleared(struct qed_hwfn
*p_hwfn
, struct qed_bmap
*bmap
)
1292 int prev_weight
= 0;
1296 weight
= bitmap_weight(bmap
->bitmap
, bmap
->max_count
);
1297 prev_weight
= weight
;
1300 msleep(QED_IWARP_MAX_CID_CLEAN_TIME
);
1302 weight
= bitmap_weight(bmap
->bitmap
, bmap
->max_count
);
1304 if (prev_weight
== weight
) {
1307 prev_weight
= weight
;
1311 if (wait_count
> QED_IWARP_MAX_NO_PROGRESS_CNT
) {
1313 "%s bitmap wait timed out (%d cids pending)\n",
1314 bmap
->name
, weight
);
1321 static int qed_iwarp_wait_for_all_cids(struct qed_hwfn
*p_hwfn
)
1326 rc
= qed_iwarp_wait_cid_map_cleared(p_hwfn
,
1327 &p_hwfn
->p_rdma_info
->tcp_cid_map
);
1331 /* Now free the tcp cids from the main cid map */
1332 for (i
= 0; i
< QED_IWARP_PREALLOC_CNT
; i
++)
1333 qed_bmap_release_id(p_hwfn
, &p_hwfn
->p_rdma_info
->cid_map
, i
);
1335 /* Now wait for all cids to be completed */
1336 return qed_iwarp_wait_cid_map_cleared(p_hwfn
,
1337 &p_hwfn
->p_rdma_info
->cid_map
);
1340 static void qed_iwarp_free_prealloc_ep(struct qed_hwfn
*p_hwfn
)
1342 struct qed_iwarp_ep
*ep
;
1344 while (!list_empty(&p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
)) {
1345 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1347 ep
= list_first_entry(&p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
,
1348 struct qed_iwarp_ep
, list_entry
);
1351 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1354 list_del(&ep
->list_entry
);
1356 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1358 if (ep
->tcp_cid
!= QED_IWARP_INVALID_TCP_CID
)
1359 qed_iwarp_cid_cleaned(p_hwfn
, ep
->tcp_cid
);
1361 qed_iwarp_destroy_ep(p_hwfn
, ep
, false);
1365 static int qed_iwarp_prealloc_ep(struct qed_hwfn
*p_hwfn
, bool init
)
1367 struct qed_iwarp_ep
*ep
;
1373 count
= init
? QED_IWARP_PREALLOC_CNT
: 1;
1374 for (i
= 0; i
< count
; i
++) {
1375 rc
= qed_iwarp_create_ep(p_hwfn
, &ep
);
1379 /* During initialization we allocate from the main pool,
1380 * afterwards we allocate only from the tcp_cid.
1383 rc
= qed_iwarp_alloc_cid(p_hwfn
, &cid
);
1386 qed_iwarp_set_tcp_cid(p_hwfn
, cid
);
1388 /* We don't care about the return code, it's ok if
1389 * tcp_cid remains invalid...in this case we'll
1392 qed_iwarp_alloc_tcp_cid(p_hwfn
, &cid
);
1397 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1398 list_add_tail(&ep
->list_entry
,
1399 &p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
);
1400 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1406 qed_iwarp_destroy_ep(p_hwfn
, ep
, false);
1411 int qed_iwarp_alloc(struct qed_hwfn
*p_hwfn
)
1415 /* Allocate bitmap for tcp cid. These are used by passive side
1416 * to ensure it can allocate a tcp cid during dpc that was
1417 * pre-acquired and doesn't require dynamic allocation of ilt
1419 rc
= qed_rdma_bmap_alloc(p_hwfn
, &p_hwfn
->p_rdma_info
->tcp_cid_map
,
1420 QED_IWARP_PREALLOC_CNT
, "TCP_CID");
1422 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1423 "Failed to allocate tcp cid, rc = %d\n", rc
);
1427 INIT_LIST_HEAD(&p_hwfn
->p_rdma_info
->iwarp
.ep_free_list
);
1428 spin_lock_init(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
1430 rc
= qed_iwarp_prealloc_ep(p_hwfn
, true);
1434 return qed_ooo_alloc(p_hwfn
);
1437 void qed_iwarp_resc_free(struct qed_hwfn
*p_hwfn
)
1439 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
1441 qed_ooo_free(p_hwfn
);
1442 qed_rdma_bmap_free(p_hwfn
, &p_hwfn
->p_rdma_info
->tcp_cid_map
, 1);
1443 kfree(iwarp_info
->mpa_bufs
);
1444 kfree(iwarp_info
->partial_fpdus
);
1445 kfree(iwarp_info
->mpa_intermediate_buf
);
1448 int qed_iwarp_accept(void *rdma_cxt
, struct qed_iwarp_accept_in
*iparams
)
1450 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
1451 struct qed_iwarp_ep
*ep
;
1452 u8 mpa_data_size
= 0;
1455 ep
= iparams
->ep_context
;
1457 DP_ERR(p_hwfn
, "Ep Context receive in accept is NULL\n");
1461 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x) EP(0x%x)\n",
1462 iparams
->qp
->icid
, ep
->tcp_cid
);
1464 if ((iparams
->ord
> QED_IWARP_ORD_DEFAULT
) ||
1465 (iparams
->ird
> QED_IWARP_IRD_DEFAULT
)) {
1468 "QP(0x%x) EP(0x%x) ERROR: Invalid ord(0x%x)/ird(0x%x)\n",
1470 ep
->tcp_cid
, iparams
->ord
, iparams
->ord
);
1474 qed_iwarp_prealloc_ep(p_hwfn
, false);
1476 ep
->cb_context
= iparams
->cb_context
;
1477 ep
->qp
= iparams
->qp
;
1480 if (ep
->mpa_rev
== MPA_NEGOTIATION_TYPE_ENHANCED
) {
1481 /* Negotiate ord/ird: if upperlayer requested ord larger than
1482 * ird advertised by remote, we need to decrease our ord
1484 if (iparams
->ord
> ep
->cm_info
.ird
)
1485 iparams
->ord
= ep
->cm_info
.ird
;
1487 if ((ep
->rtr_type
& MPA_RTR_TYPE_ZERO_READ
) &&
1488 (iparams
->ird
== 0))
1492 /* Update cm_info ord/ird to be negotiated values */
1493 ep
->cm_info
.ord
= iparams
->ord
;
1494 ep
->cm_info
.ird
= iparams
->ird
;
1496 qed_iwarp_mpa_v2_set_private(p_hwfn
, ep
, &mpa_data_size
);
1498 ep
->cm_info
.private_data
= ep
->ep_buffer_virt
->out_pdata
;
1499 ep
->cm_info
.private_data_len
= iparams
->private_data_len
+
1502 memcpy((u8
*)ep
->ep_buffer_virt
->out_pdata
+ mpa_data_size
,
1503 iparams
->private_data
, iparams
->private_data_len
);
1505 rc
= qed_iwarp_mpa_offload(p_hwfn
, ep
);
1507 qed_iwarp_modify_qp(p_hwfn
,
1508 iparams
->qp
, QED_IWARP_QP_STATE_ERROR
, 1);
1513 int qed_iwarp_reject(void *rdma_cxt
, struct qed_iwarp_reject_in
*iparams
)
1515 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
1516 struct qed_iwarp_ep
*ep
;
1517 u8 mpa_data_size
= 0;
1519 ep
= iparams
->ep_context
;
1521 DP_ERR(p_hwfn
, "Ep Context receive in reject is NULL\n");
1525 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "EP(0x%x)\n", ep
->tcp_cid
);
1527 ep
->cb_context
= iparams
->cb_context
;
1530 qed_iwarp_mpa_v2_set_private(p_hwfn
, ep
, &mpa_data_size
);
1532 ep
->cm_info
.private_data
= ep
->ep_buffer_virt
->out_pdata
;
1533 ep
->cm_info
.private_data_len
= iparams
->private_data_len
+
1536 memcpy((u8
*)ep
->ep_buffer_virt
->out_pdata
+ mpa_data_size
,
1537 iparams
->private_data
, iparams
->private_data_len
);
1539 return qed_iwarp_mpa_offload(p_hwfn
, ep
);
1543 qed_iwarp_print_cm_info(struct qed_hwfn
*p_hwfn
,
1544 struct qed_iwarp_cm_info
*cm_info
)
1546 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "ip_version = %d\n",
1547 cm_info
->ip_version
);
1549 if (cm_info
->ip_version
== QED_TCP_IPV4
)
1550 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1551 "remote_ip %pI4h:%x, local_ip %pI4h:%x vlan=%x\n",
1552 cm_info
->remote_ip
, cm_info
->remote_port
,
1553 cm_info
->local_ip
, cm_info
->local_port
,
1556 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1557 "remote_ip %pI6:%x, local_ip %pI6:%x vlan=%x\n",
1558 cm_info
->remote_ip
, cm_info
->remote_port
,
1559 cm_info
->local_ip
, cm_info
->local_port
,
1562 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1563 "private_data_len = %x ord = %d, ird = %d\n",
1564 cm_info
->private_data_len
, cm_info
->ord
, cm_info
->ird
);
1568 qed_iwarp_ll2_post_rx(struct qed_hwfn
*p_hwfn
,
1569 struct qed_iwarp_ll2_buff
*buf
, u8 handle
)
1573 rc
= qed_ll2_post_rx_buffer(p_hwfn
, handle
, buf
->data_phys_addr
,
1574 (u16
)buf
->buff_size
, buf
, 1);
1577 "Failed to repost rx buffer to ll2 rc = %d, handle=%d\n",
1579 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
, buf
->buff_size
,
1580 buf
->data
, buf
->data_phys_addr
);
1588 qed_iwarp_ep_exists(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_cm_info
*cm_info
)
1590 struct qed_iwarp_ep
*ep
= NULL
;
1593 list_for_each_entry(ep
,
1594 &p_hwfn
->p_rdma_info
->iwarp
.ep_list
,
1596 if ((ep
->cm_info
.local_port
== cm_info
->local_port
) &&
1597 (ep
->cm_info
.remote_port
== cm_info
->remote_port
) &&
1598 (ep
->cm_info
.vlan
== cm_info
->vlan
) &&
1599 !memcmp(&ep
->cm_info
.local_ip
, cm_info
->local_ip
,
1600 sizeof(cm_info
->local_ip
)) &&
1601 !memcmp(&ep
->cm_info
.remote_ip
, cm_info
->remote_ip
,
1602 sizeof(cm_info
->remote_ip
))) {
1610 "SYN received on active connection - dropping\n");
1611 qed_iwarp_print_cm_info(p_hwfn
, cm_info
);
1619 static struct qed_iwarp_listener
*
1620 qed_iwarp_get_listener(struct qed_hwfn
*p_hwfn
,
1621 struct qed_iwarp_cm_info
*cm_info
)
1623 struct qed_iwarp_listener
*listener
= NULL
;
1624 static const u32 ip_zero
[4] = { 0, 0, 0, 0 };
1627 qed_iwarp_print_cm_info(p_hwfn
, cm_info
);
1629 list_for_each_entry(listener
,
1630 &p_hwfn
->p_rdma_info
->iwarp
.listen_list
,
1632 if (listener
->port
== cm_info
->local_port
) {
1633 if (!memcmp(listener
->ip_addr
,
1634 ip_zero
, sizeof(ip_zero
))) {
1639 if (!memcmp(listener
->ip_addr
,
1641 sizeof(cm_info
->local_ip
)) &&
1642 (listener
->vlan
== cm_info
->vlan
)) {
1650 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "listener found = %p\n",
1655 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "listener not found\n");
1660 qed_iwarp_parse_rx_pkt(struct qed_hwfn
*p_hwfn
,
1661 struct qed_iwarp_cm_info
*cm_info
,
1663 u8
*remote_mac_addr
,
1665 int *payload_len
, int *tcp_start_offset
)
1667 struct vlan_ethhdr
*vethh
;
1668 bool vlan_valid
= false;
1669 struct ipv6hdr
*ip6h
;
1670 struct ethhdr
*ethh
;
1671 struct tcphdr
*tcph
;
1679 eth_type
= ntohs(ethh
->h_proto
);
1680 if (eth_type
== ETH_P_8021Q
) {
1682 vethh
= (struct vlan_ethhdr
*)ethh
;
1683 cm_info
->vlan
= ntohs(vethh
->h_vlan_TCI
) & VLAN_VID_MASK
;
1684 eth_type
= ntohs(vethh
->h_vlan_encapsulated_proto
);
1687 eth_hlen
= ETH_HLEN
+ (vlan_valid
? sizeof(u32
) : 0);
1689 if (!ether_addr_equal(ethh
->h_dest
,
1690 p_hwfn
->p_rdma_info
->iwarp
.mac_addr
)) {
1693 "Got unexpected mac %pM instead of %pM\n",
1694 ethh
->h_dest
, p_hwfn
->p_rdma_info
->iwarp
.mac_addr
);
1698 ether_addr_copy(remote_mac_addr
, ethh
->h_source
);
1699 ether_addr_copy(local_mac_addr
, ethh
->h_dest
);
1701 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "eth_type =%d source mac: %pM\n",
1702 eth_type
, ethh
->h_source
);
1704 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "eth_hlen=%d destination mac: %pM\n",
1705 eth_hlen
, ethh
->h_dest
);
1707 iph
= (struct iphdr
*)((u8
*)(ethh
) + eth_hlen
);
1709 if (eth_type
== ETH_P_IP
) {
1710 if (iph
->protocol
!= IPPROTO_TCP
) {
1712 "Unexpected ip protocol on ll2 %x\n",
1717 cm_info
->local_ip
[0] = ntohl(iph
->daddr
);
1718 cm_info
->remote_ip
[0] = ntohl(iph
->saddr
);
1719 cm_info
->ip_version
= QED_TCP_IPV4
;
1721 ip_hlen
= (iph
->ihl
) * sizeof(u32
);
1722 *payload_len
= ntohs(iph
->tot_len
) - ip_hlen
;
1723 } else if (eth_type
== ETH_P_IPV6
) {
1724 ip6h
= (struct ipv6hdr
*)iph
;
1726 if (ip6h
->nexthdr
!= IPPROTO_TCP
) {
1728 "Unexpected ip protocol on ll2 %x\n",
1733 for (i
= 0; i
< 4; i
++) {
1734 cm_info
->local_ip
[i
] =
1735 ntohl(ip6h
->daddr
.in6_u
.u6_addr32
[i
]);
1736 cm_info
->remote_ip
[i
] =
1737 ntohl(ip6h
->saddr
.in6_u
.u6_addr32
[i
]);
1739 cm_info
->ip_version
= QED_TCP_IPV6
;
1741 ip_hlen
= sizeof(*ip6h
);
1742 *payload_len
= ntohs(ip6h
->payload_len
);
1744 DP_NOTICE(p_hwfn
, "Unexpected ethertype on ll2 %x\n", eth_type
);
1748 tcph
= (struct tcphdr
*)((u8
*)iph
+ ip_hlen
);
1752 "Only SYN type packet expected on this ll2 conn, iph->ihl=%d source=%d dest=%d\n",
1753 iph
->ihl
, tcph
->source
, tcph
->dest
);
1757 cm_info
->local_port
= ntohs(tcph
->dest
);
1758 cm_info
->remote_port
= ntohs(tcph
->source
);
1760 qed_iwarp_print_cm_info(p_hwfn
, cm_info
);
1762 *tcp_start_offset
= eth_hlen
+ ip_hlen
;
1767 static struct qed_iwarp_fpdu
*qed_iwarp_get_curr_fpdu(struct qed_hwfn
*p_hwfn
,
1770 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
1771 struct qed_iwarp_fpdu
*partial_fpdu
;
1774 idx
= cid
- qed_cxt_get_proto_cid_start(p_hwfn
, PROTOCOLID_IWARP
);
1775 if (idx
>= iwarp_info
->max_num_partial_fpdus
) {
1776 DP_ERR(p_hwfn
, "Invalid cid %x max_num_partial_fpdus=%x\n", cid
,
1777 iwarp_info
->max_num_partial_fpdus
);
1781 partial_fpdu
= &iwarp_info
->partial_fpdus
[idx
];
1783 return partial_fpdu
;
1786 enum qed_iwarp_mpa_pkt_type
{
1787 QED_IWARP_MPA_PKT_PACKED
,
1788 QED_IWARP_MPA_PKT_PARTIAL
,
1789 QED_IWARP_MPA_PKT_UNALIGNED
1792 #define QED_IWARP_INVALID_FPDU_LENGTH 0xffff
1793 #define QED_IWARP_MPA_FPDU_LENGTH_SIZE (2)
1794 #define QED_IWARP_MPA_CRC32_DIGEST_SIZE (4)
1796 /* Pad to multiple of 4 */
1797 #define QED_IWARP_PDU_DATA_LEN_WITH_PAD(data_len) ALIGN(data_len, 4)
1798 #define QED_IWARP_FPDU_LEN_WITH_PAD(_mpa_len) \
1799 (QED_IWARP_PDU_DATA_LEN_WITH_PAD((_mpa_len) + \
1800 QED_IWARP_MPA_FPDU_LENGTH_SIZE) + \
1801 QED_IWARP_MPA_CRC32_DIGEST_SIZE)
1803 /* fpdu can be fragmented over maximum 3 bds: header, partial mpa, unaligned */
1804 #define QED_IWARP_MAX_BDS_PER_FPDU 3
1806 static const char * const pkt_type_str
[] = {
1807 "QED_IWARP_MPA_PKT_PACKED",
1808 "QED_IWARP_MPA_PKT_PARTIAL",
1809 "QED_IWARP_MPA_PKT_UNALIGNED"
1813 qed_iwarp_recycle_pkt(struct qed_hwfn
*p_hwfn
,
1814 struct qed_iwarp_fpdu
*fpdu
,
1815 struct qed_iwarp_ll2_buff
*buf
);
1817 static enum qed_iwarp_mpa_pkt_type
1818 qed_iwarp_mpa_classify(struct qed_hwfn
*p_hwfn
,
1819 struct qed_iwarp_fpdu
*fpdu
,
1820 u16 tcp_payload_len
, u8
*mpa_data
)
1822 enum qed_iwarp_mpa_pkt_type pkt_type
;
1825 if (fpdu
->incomplete_bytes
) {
1826 pkt_type
= QED_IWARP_MPA_PKT_UNALIGNED
;
1830 /* special case of one byte remaining...
1831 * lower byte will be read next packet
1833 if (tcp_payload_len
== 1) {
1834 fpdu
->fpdu_length
= *mpa_data
<< BITS_PER_BYTE
;
1835 pkt_type
= QED_IWARP_MPA_PKT_PARTIAL
;
1839 mpa_len
= ntohs(*(__force __be16
*)mpa_data
);
1840 fpdu
->fpdu_length
= QED_IWARP_FPDU_LEN_WITH_PAD(mpa_len
);
1842 if (fpdu
->fpdu_length
<= tcp_payload_len
)
1843 pkt_type
= QED_IWARP_MPA_PKT_PACKED
;
1845 pkt_type
= QED_IWARP_MPA_PKT_PARTIAL
;
1848 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1849 "MPA_ALIGN: %s: fpdu_length=0x%x tcp_payload_len:0x%x\n",
1850 pkt_type_str
[pkt_type
], fpdu
->fpdu_length
, tcp_payload_len
);
1856 qed_iwarp_init_fpdu(struct qed_iwarp_ll2_buff
*buf
,
1857 struct qed_iwarp_fpdu
*fpdu
,
1858 struct unaligned_opaque_data
*pkt_data
,
1859 u16 tcp_payload_size
, u8 placement_offset
)
1861 u16 first_mpa_offset
= le16_to_cpu(pkt_data
->first_mpa_offset
);
1863 fpdu
->mpa_buf
= buf
;
1864 fpdu
->pkt_hdr
= buf
->data_phys_addr
+ placement_offset
;
1865 fpdu
->pkt_hdr_size
= pkt_data
->tcp_payload_offset
;
1866 fpdu
->mpa_frag
= buf
->data_phys_addr
+ first_mpa_offset
;
1867 fpdu
->mpa_frag_virt
= (u8
*)(buf
->data
) + first_mpa_offset
;
1869 if (tcp_payload_size
== 1)
1870 fpdu
->incomplete_bytes
= QED_IWARP_INVALID_FPDU_LENGTH
;
1871 else if (tcp_payload_size
< fpdu
->fpdu_length
)
1872 fpdu
->incomplete_bytes
= fpdu
->fpdu_length
- tcp_payload_size
;
1874 fpdu
->incomplete_bytes
= 0; /* complete fpdu */
1876 fpdu
->mpa_frag_len
= fpdu
->fpdu_length
- fpdu
->incomplete_bytes
;
1880 qed_iwarp_cp_pkt(struct qed_hwfn
*p_hwfn
,
1881 struct qed_iwarp_fpdu
*fpdu
,
1882 struct unaligned_opaque_data
*pkt_data
,
1883 struct qed_iwarp_ll2_buff
*buf
, u16 tcp_payload_size
)
1885 u16 first_mpa_offset
= le16_to_cpu(pkt_data
->first_mpa_offset
);
1886 u8
*tmp_buf
= p_hwfn
->p_rdma_info
->iwarp
.mpa_intermediate_buf
;
1889 /* need to copy the data from the partial packet stored in fpdu
1890 * to the new buf, for this we also need to move the data currently
1891 * placed on the buf. The assumption is that the buffer is big enough
1892 * since fpdu_length <= mss, we use an intermediate buffer since
1893 * we may need to copy the new data to an overlapping location
1895 if ((fpdu
->mpa_frag_len
+ tcp_payload_size
) > (u16
)buf
->buff_size
) {
1897 "MPA ALIGN: Unexpected: buffer is not large enough for split fpdu buff_size = %d mpa_frag_len = %d, tcp_payload_size = %d, incomplete_bytes = %d\n",
1898 buf
->buff_size
, fpdu
->mpa_frag_len
,
1899 tcp_payload_size
, fpdu
->incomplete_bytes
);
1903 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1904 "MPA ALIGN Copying fpdu: [%p, %d] [%p, %d]\n",
1905 fpdu
->mpa_frag_virt
, fpdu
->mpa_frag_len
,
1906 (u8
*)(buf
->data
) + first_mpa_offset
, tcp_payload_size
);
1908 memcpy(tmp_buf
, fpdu
->mpa_frag_virt
, fpdu
->mpa_frag_len
);
1909 memcpy(tmp_buf
+ fpdu
->mpa_frag_len
,
1910 (u8
*)(buf
->data
) + first_mpa_offset
, tcp_payload_size
);
1912 rc
= qed_iwarp_recycle_pkt(p_hwfn
, fpdu
, fpdu
->mpa_buf
);
1916 /* If we managed to post the buffer copy the data to the new buffer
1917 * o/w this will occur in the next round...
1919 memcpy((u8
*)(buf
->data
), tmp_buf
,
1920 fpdu
->mpa_frag_len
+ tcp_payload_size
);
1922 fpdu
->mpa_buf
= buf
;
1923 /* fpdu->pkt_hdr remains as is */
1924 /* fpdu->mpa_frag is overridden with new buf */
1925 fpdu
->mpa_frag
= buf
->data_phys_addr
;
1926 fpdu
->mpa_frag_virt
= buf
->data
;
1927 fpdu
->mpa_frag_len
+= tcp_payload_size
;
1929 fpdu
->incomplete_bytes
-= tcp_payload_size
;
1933 "MPA ALIGN: split fpdu buff_size = %d mpa_frag_len = %d, tcp_payload_size = %d, incomplete_bytes = %d\n",
1934 buf
->buff_size
, fpdu
->mpa_frag_len
, tcp_payload_size
,
1935 fpdu
->incomplete_bytes
);
1941 qed_iwarp_update_fpdu_length(struct qed_hwfn
*p_hwfn
,
1942 struct qed_iwarp_fpdu
*fpdu
, u8
*mpa_data
)
1946 /* Update incomplete packets if needed */
1947 if (fpdu
->incomplete_bytes
== QED_IWARP_INVALID_FPDU_LENGTH
) {
1948 /* Missing lower byte is now available */
1949 mpa_len
= fpdu
->fpdu_length
| *mpa_data
;
1950 fpdu
->fpdu_length
= QED_IWARP_FPDU_LEN_WITH_PAD(mpa_len
);
1951 /* one byte of hdr */
1952 fpdu
->mpa_frag_len
= 1;
1953 fpdu
->incomplete_bytes
= fpdu
->fpdu_length
- 1;
1956 "MPA_ALIGN: Partial header mpa_len=%x fpdu_length=%x incomplete_bytes=%x\n",
1957 mpa_len
, fpdu
->fpdu_length
, fpdu
->incomplete_bytes
);
1961 #define QED_IWARP_IS_RIGHT_EDGE(_curr_pkt) \
1962 (GET_FIELD((_curr_pkt)->flags, \
1963 UNALIGNED_OPAQUE_DATA_PKT_REACHED_WIN_RIGHT_EDGE))
1965 /* This function is used to recycle a buffer using the ll2 drop option. It
1966 * uses the mechanism to ensure that all buffers posted to tx before this one
1967 * were completed. The buffer sent here will be sent as a cookie in the tx
1968 * completion function and can then be reposted to rx chain when done. The flow
1969 * that requires this is the flow where a FPDU splits over more than 3 tcp
1970 * segments. In this case the driver needs to re-post a rx buffer instead of
1971 * the one received, but driver can't simply repost a buffer it copied from
1972 * as there is a case where the buffer was originally a packed FPDU, and is
1973 * partially posted to FW. Driver needs to ensure FW is done with it.
1976 qed_iwarp_recycle_pkt(struct qed_hwfn
*p_hwfn
,
1977 struct qed_iwarp_fpdu
*fpdu
,
1978 struct qed_iwarp_ll2_buff
*buf
)
1980 struct qed_ll2_tx_pkt_info tx_pkt
;
1984 memset(&tx_pkt
, 0, sizeof(tx_pkt
));
1985 tx_pkt
.num_of_bds
= 1;
1986 tx_pkt
.tx_dest
= QED_LL2_TX_DEST_DROP
;
1987 tx_pkt
.l4_hdr_offset_w
= fpdu
->pkt_hdr_size
>> 2;
1988 tx_pkt
.first_frag
= fpdu
->pkt_hdr
;
1989 tx_pkt
.first_frag_len
= fpdu
->pkt_hdr_size
;
1990 buf
->piggy_buf
= NULL
;
1991 tx_pkt
.cookie
= buf
;
1993 ll2_handle
= p_hwfn
->p_rdma_info
->iwarp
.ll2_mpa_handle
;
1995 rc
= qed_ll2_prepare_tx_packet(p_hwfn
, ll2_handle
, &tx_pkt
, true);
1997 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
1998 "Can't drop packet rc=%d\n", rc
);
2002 "MPA_ALIGN: send drop tx packet [%lx, 0x%x], buf=%p, rc=%d\n",
2003 (unsigned long int)tx_pkt
.first_frag
,
2004 tx_pkt
.first_frag_len
, buf
, rc
);
2010 qed_iwarp_win_right_edge(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_fpdu
*fpdu
)
2012 struct qed_ll2_tx_pkt_info tx_pkt
;
2016 memset(&tx_pkt
, 0, sizeof(tx_pkt
));
2017 tx_pkt
.num_of_bds
= 1;
2018 tx_pkt
.tx_dest
= QED_LL2_TX_DEST_LB
;
2019 tx_pkt
.l4_hdr_offset_w
= fpdu
->pkt_hdr_size
>> 2;
2021 tx_pkt
.first_frag
= fpdu
->pkt_hdr
;
2022 tx_pkt
.first_frag_len
= fpdu
->pkt_hdr_size
;
2023 tx_pkt
.enable_ip_cksum
= true;
2024 tx_pkt
.enable_l4_cksum
= true;
2025 tx_pkt
.calc_ip_len
= true;
2026 /* vlan overload with enum iwarp_ll2_tx_queues */
2027 tx_pkt
.vlan
= IWARP_LL2_ALIGNED_RIGHT_TRIMMED_TX_QUEUE
;
2029 ll2_handle
= p_hwfn
->p_rdma_info
->iwarp
.ll2_mpa_handle
;
2031 rc
= qed_ll2_prepare_tx_packet(p_hwfn
, ll2_handle
, &tx_pkt
, true);
2033 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2034 "Can't send right edge rc=%d\n", rc
);
2037 "MPA_ALIGN: Sent right edge FPDU num_bds=%d [%lx, 0x%x], rc=%d\n",
2039 (unsigned long int)tx_pkt
.first_frag
,
2040 tx_pkt
.first_frag_len
, rc
);
2046 qed_iwarp_send_fpdu(struct qed_hwfn
*p_hwfn
,
2047 struct qed_iwarp_fpdu
*fpdu
,
2048 struct unaligned_opaque_data
*curr_pkt
,
2049 struct qed_iwarp_ll2_buff
*buf
,
2050 u16 tcp_payload_size
, enum qed_iwarp_mpa_pkt_type pkt_type
)
2052 struct qed_ll2_tx_pkt_info tx_pkt
;
2053 u16 first_mpa_offset
;
2057 memset(&tx_pkt
, 0, sizeof(tx_pkt
));
2059 /* An unaligned packet means it's split over two tcp segments. So the
2060 * complete packet requires 3 bds, one for the header, one for the
2061 * part of the fpdu of the first tcp segment, and the last fragment
2062 * will point to the remainder of the fpdu. A packed pdu, requires only
2063 * two bds, one for the header and one for the data.
2065 tx_pkt
.num_of_bds
= (pkt_type
== QED_IWARP_MPA_PKT_UNALIGNED
) ? 3 : 2;
2066 tx_pkt
.tx_dest
= QED_LL2_TX_DEST_LB
;
2067 tx_pkt
.l4_hdr_offset_w
= fpdu
->pkt_hdr_size
>> 2; /* offset in words */
2069 /* Send the mpa_buf only with the last fpdu (in case of packed) */
2070 if (pkt_type
== QED_IWARP_MPA_PKT_UNALIGNED
||
2071 tcp_payload_size
<= fpdu
->fpdu_length
)
2072 tx_pkt
.cookie
= fpdu
->mpa_buf
;
2074 tx_pkt
.first_frag
= fpdu
->pkt_hdr
;
2075 tx_pkt
.first_frag_len
= fpdu
->pkt_hdr_size
;
2076 tx_pkt
.enable_ip_cksum
= true;
2077 tx_pkt
.enable_l4_cksum
= true;
2078 tx_pkt
.calc_ip_len
= true;
2079 /* vlan overload with enum iwarp_ll2_tx_queues */
2080 tx_pkt
.vlan
= IWARP_LL2_ALIGNED_TX_QUEUE
;
2082 /* special case of unaligned packet and not packed, need to send
2083 * both buffers as cookie to release.
2085 if (tcp_payload_size
== fpdu
->incomplete_bytes
)
2086 fpdu
->mpa_buf
->piggy_buf
= buf
;
2088 ll2_handle
= p_hwfn
->p_rdma_info
->iwarp
.ll2_mpa_handle
;
2090 /* Set first fragment to header */
2091 rc
= qed_ll2_prepare_tx_packet(p_hwfn
, ll2_handle
, &tx_pkt
, true);
2095 /* Set second fragment to first part of packet */
2096 rc
= qed_ll2_set_fragment_of_tx_packet(p_hwfn
, ll2_handle
,
2098 fpdu
->mpa_frag_len
);
2102 if (!fpdu
->incomplete_bytes
)
2105 first_mpa_offset
= le16_to_cpu(curr_pkt
->first_mpa_offset
);
2107 /* Set third fragment to second part of the packet */
2108 rc
= qed_ll2_set_fragment_of_tx_packet(p_hwfn
,
2110 buf
->data_phys_addr
+
2112 fpdu
->incomplete_bytes
);
2116 "MPA_ALIGN: Sent FPDU num_bds=%d first_frag_len=%x, mpa_frag_len=0x%x, incomplete_bytes:0x%x rc=%d\n",
2118 tx_pkt
.first_frag_len
,
2120 fpdu
->incomplete_bytes
, rc
);
2126 qed_iwarp_mpa_get_data(struct qed_hwfn
*p_hwfn
,
2127 struct unaligned_opaque_data
*curr_pkt
,
2128 u32 opaque_data0
, u32 opaque_data1
)
2132 opaque_data
= HILO_64(cpu_to_le32(opaque_data1
),
2133 cpu_to_le32(opaque_data0
));
2134 *curr_pkt
= *((struct unaligned_opaque_data
*)&opaque_data
);
2136 le16_add_cpu(&curr_pkt
->first_mpa_offset
,
2137 curr_pkt
->tcp_payload_offset
);
2140 /* This function is called when an unaligned or incomplete MPA packet arrives
2141 * driver needs to align the packet, perhaps using previous data and send
2142 * it down to FW once it is aligned.
2145 qed_iwarp_process_mpa_pkt(struct qed_hwfn
*p_hwfn
,
2146 struct qed_iwarp_ll2_mpa_buf
*mpa_buf
)
2148 struct unaligned_opaque_data
*curr_pkt
= &mpa_buf
->data
;
2149 struct qed_iwarp_ll2_buff
*buf
= mpa_buf
->ll2_buf
;
2150 enum qed_iwarp_mpa_pkt_type pkt_type
;
2151 struct qed_iwarp_fpdu
*fpdu
;
2152 u16 cid
, first_mpa_offset
;
2156 cid
= le32_to_cpu(curr_pkt
->cid
);
2158 fpdu
= qed_iwarp_get_curr_fpdu(p_hwfn
, (u16
)cid
);
2159 if (!fpdu
) { /* something corrupt with cid, post rx back */
2160 DP_ERR(p_hwfn
, "Invalid cid, drop and post back to rx cid=%x\n",
2166 first_mpa_offset
= le16_to_cpu(curr_pkt
->first_mpa_offset
);
2167 mpa_data
= ((u8
*)(buf
->data
) + first_mpa_offset
);
2169 pkt_type
= qed_iwarp_mpa_classify(p_hwfn
, fpdu
,
2170 mpa_buf
->tcp_payload_len
,
2174 case QED_IWARP_MPA_PKT_PARTIAL
:
2175 qed_iwarp_init_fpdu(buf
, fpdu
,
2177 mpa_buf
->tcp_payload_len
,
2178 mpa_buf
->placement_offset
);
2180 if (!QED_IWARP_IS_RIGHT_EDGE(curr_pkt
)) {
2181 mpa_buf
->tcp_payload_len
= 0;
2185 rc
= qed_iwarp_win_right_edge(p_hwfn
, fpdu
);
2188 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2189 "Can't send FPDU:reset rc=%d\n", rc
);
2190 memset(fpdu
, 0, sizeof(*fpdu
));
2194 mpa_buf
->tcp_payload_len
= 0;
2196 case QED_IWARP_MPA_PKT_PACKED
:
2197 qed_iwarp_init_fpdu(buf
, fpdu
,
2199 mpa_buf
->tcp_payload_len
,
2200 mpa_buf
->placement_offset
);
2202 rc
= qed_iwarp_send_fpdu(p_hwfn
, fpdu
, curr_pkt
, buf
,
2203 mpa_buf
->tcp_payload_len
,
2206 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2207 "Can't send FPDU:reset rc=%d\n", rc
);
2208 memset(fpdu
, 0, sizeof(*fpdu
));
2212 mpa_buf
->tcp_payload_len
-= fpdu
->fpdu_length
;
2213 le16_add_cpu(&curr_pkt
->first_mpa_offset
,
2216 case QED_IWARP_MPA_PKT_UNALIGNED
:
2217 qed_iwarp_update_fpdu_length(p_hwfn
, fpdu
, mpa_data
);
2218 if (mpa_buf
->tcp_payload_len
< fpdu
->incomplete_bytes
) {
2219 /* special handling of fpdu split over more
2222 if (QED_IWARP_IS_RIGHT_EDGE(curr_pkt
)) {
2223 rc
= qed_iwarp_win_right_edge(p_hwfn
,
2225 /* packet will be re-processed later */
2230 rc
= qed_iwarp_cp_pkt(p_hwfn
, fpdu
, curr_pkt
,
2232 mpa_buf
->tcp_payload_len
);
2233 if (rc
) /* packet will be re-processed later */
2236 mpa_buf
->tcp_payload_len
= 0;
2240 rc
= qed_iwarp_send_fpdu(p_hwfn
, fpdu
, curr_pkt
, buf
,
2241 mpa_buf
->tcp_payload_len
,
2244 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2245 "Can't send FPDU:delay rc=%d\n", rc
);
2246 /* don't reset fpdu -> we need it for next
2252 mpa_buf
->tcp_payload_len
-= fpdu
->incomplete_bytes
;
2253 le16_add_cpu(&curr_pkt
->first_mpa_offset
,
2254 fpdu
->incomplete_bytes
);
2256 /* The framed PDU was sent - no more incomplete bytes */
2257 fpdu
->incomplete_bytes
= 0;
2260 } while (mpa_buf
->tcp_payload_len
&& !rc
);
2265 qed_iwarp_ll2_post_rx(p_hwfn
,
2267 p_hwfn
->p_rdma_info
->iwarp
.ll2_mpa_handle
);
2271 static void qed_iwarp_process_pending_pkts(struct qed_hwfn
*p_hwfn
)
2273 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
2274 struct qed_iwarp_ll2_mpa_buf
*mpa_buf
= NULL
;
2277 while (!list_empty(&iwarp_info
->mpa_buf_pending_list
)) {
2278 mpa_buf
= list_first_entry(&iwarp_info
->mpa_buf_pending_list
,
2279 struct qed_iwarp_ll2_mpa_buf
,
2282 rc
= qed_iwarp_process_mpa_pkt(p_hwfn
, mpa_buf
);
2284 /* busy means break and continue processing later, don't
2285 * remove the buf from the pending list.
2290 list_move_tail(&mpa_buf
->list_entry
,
2291 &iwarp_info
->mpa_buf_list
);
2293 if (rc
) { /* different error, don't continue */
2294 DP_NOTICE(p_hwfn
, "process pkts failed rc=%d\n", rc
);
2301 qed_iwarp_ll2_comp_mpa_pkt(void *cxt
, struct qed_ll2_comp_rx_data
*data
)
2303 struct qed_iwarp_ll2_mpa_buf
*mpa_buf
;
2304 struct qed_iwarp_info
*iwarp_info
;
2305 struct qed_hwfn
*p_hwfn
= cxt
;
2306 u16 first_mpa_offset
;
2308 iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
2309 mpa_buf
= list_first_entry(&iwarp_info
->mpa_buf_list
,
2310 struct qed_iwarp_ll2_mpa_buf
, list_entry
);
2312 DP_ERR(p_hwfn
, "No free mpa buf\n");
2316 list_del(&mpa_buf
->list_entry
);
2317 qed_iwarp_mpa_get_data(p_hwfn
, &mpa_buf
->data
,
2318 data
->opaque_data_0
, data
->opaque_data_1
);
2320 first_mpa_offset
= le16_to_cpu(mpa_buf
->data
.first_mpa_offset
);
2324 "LL2 MPA CompRx payload_len:0x%x\tfirst_mpa_offset:0x%x\ttcp_payload_offset:0x%x\tflags:0x%x\tcid:0x%x\n",
2325 data
->length
.packet_length
, first_mpa_offset
,
2326 mpa_buf
->data
.tcp_payload_offset
, mpa_buf
->data
.flags
,
2329 mpa_buf
->ll2_buf
= data
->cookie
;
2330 mpa_buf
->tcp_payload_len
= data
->length
.packet_length
-
2333 first_mpa_offset
+= data
->u
.placement_offset
;
2334 mpa_buf
->data
.first_mpa_offset
= cpu_to_le16(first_mpa_offset
);
2335 mpa_buf
->placement_offset
= data
->u
.placement_offset
;
2337 list_add_tail(&mpa_buf
->list_entry
, &iwarp_info
->mpa_buf_pending_list
);
2339 qed_iwarp_process_pending_pkts(p_hwfn
);
2342 qed_iwarp_ll2_post_rx(p_hwfn
, data
->cookie
,
2343 iwarp_info
->ll2_mpa_handle
);
2347 qed_iwarp_ll2_comp_syn_pkt(void *cxt
, struct qed_ll2_comp_rx_data
*data
)
2349 struct qed_iwarp_ll2_buff
*buf
= data
->cookie
;
2350 struct qed_iwarp_listener
*listener
;
2351 struct qed_ll2_tx_pkt_info tx_pkt
;
2352 struct qed_iwarp_cm_info cm_info
;
2353 struct qed_hwfn
*p_hwfn
= cxt
;
2354 u8 remote_mac_addr
[ETH_ALEN
];
2355 u8 local_mac_addr
[ETH_ALEN
];
2356 struct qed_iwarp_ep
*ep
;
2357 int tcp_start_offset
;
2363 memset(&cm_info
, 0, sizeof(cm_info
));
2364 ll2_syn_handle
= p_hwfn
->p_rdma_info
->iwarp
.ll2_syn_handle
;
2366 /* Check if packet was received with errors... */
2367 if (data
->err_flags
) {
2368 DP_NOTICE(p_hwfn
, "Error received on SYN packet: 0x%x\n",
2373 if (GET_FIELD(data
->parse_flags
,
2374 PARSING_AND_ERR_FLAGS_L4CHKSMWASCALCULATED
) &&
2375 GET_FIELD(data
->parse_flags
, PARSING_AND_ERR_FLAGS_L4CHKSMERROR
)) {
2376 DP_NOTICE(p_hwfn
, "Syn packet received with checksum error\n");
2380 rc
= qed_iwarp_parse_rx_pkt(p_hwfn
, &cm_info
, (u8
*)(buf
->data
) +
2381 data
->u
.placement_offset
, remote_mac_addr
,
2382 local_mac_addr
, &payload_len
,
2387 /* Check if there is a listener for this 4-tuple+vlan */
2388 listener
= qed_iwarp_get_listener(p_hwfn
, &cm_info
);
2392 "SYN received on tuple not listened on parse_flags=%d packet len=%d\n",
2393 data
->parse_flags
, data
->length
.packet_length
);
2395 memset(&tx_pkt
, 0, sizeof(tx_pkt
));
2396 tx_pkt
.num_of_bds
= 1;
2397 tx_pkt
.l4_hdr_offset_w
= (data
->length
.packet_length
) >> 2;
2398 tx_pkt
.tx_dest
= QED_LL2_TX_DEST_LB
;
2399 tx_pkt
.first_frag
= buf
->data_phys_addr
+
2400 data
->u
.placement_offset
;
2401 tx_pkt
.first_frag_len
= data
->length
.packet_length
;
2402 tx_pkt
.cookie
= buf
;
2404 rc
= qed_ll2_prepare_tx_packet(p_hwfn
, ll2_syn_handle
,
2409 "Can't post SYN back to chip rc=%d\n", rc
);
2415 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "Received syn on listening port\n");
2416 /* There may be an open ep on this connection if this is a syn
2417 * retrasnmit... need to make sure there isn't...
2419 if (qed_iwarp_ep_exists(p_hwfn
, &cm_info
))
2422 ep
= qed_iwarp_get_free_ep(p_hwfn
);
2426 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
2427 list_add_tail(&ep
->list_entry
, &p_hwfn
->p_rdma_info
->iwarp
.ep_list
);
2428 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
2430 ether_addr_copy(ep
->remote_mac_addr
, remote_mac_addr
);
2431 ether_addr_copy(ep
->local_mac_addr
, local_mac_addr
);
2433 memcpy(&ep
->cm_info
, &cm_info
, sizeof(ep
->cm_info
));
2435 hdr_size
= ((cm_info
.ip_version
== QED_TCP_IPV4
) ? 40 : 60);
2436 ep
->mss
= p_hwfn
->p_rdma_info
->iwarp
.max_mtu
- hdr_size
;
2437 ep
->mss
= min_t(u16
, QED_IWARP_MAX_FW_MSS
, ep
->mss
);
2439 ep
->event_cb
= listener
->event_cb
;
2440 ep
->cb_context
= listener
->cb_context
;
2441 ep
->connect_mode
= TCP_CONNECT_PASSIVE
;
2444 ep
->syn_ip_payload_length
= (u16
)payload_len
;
2445 ep
->syn_phy_addr
= buf
->data_phys_addr
+ data
->u
.placement_offset
+
2448 rc
= qed_iwarp_tcp_offload(p_hwfn
, ep
);
2450 qed_iwarp_return_ep(p_hwfn
, ep
);
2456 qed_iwarp_ll2_post_rx(p_hwfn
, buf
, ll2_syn_handle
);
2459 static void qed_iwarp_ll2_rel_rx_pkt(void *cxt
, u8 connection_handle
,
2460 void *cookie
, dma_addr_t rx_buf_addr
,
2463 struct qed_iwarp_ll2_buff
*buffer
= cookie
;
2464 struct qed_hwfn
*p_hwfn
= cxt
;
2466 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
, buffer
->buff_size
,
2467 buffer
->data
, buffer
->data_phys_addr
);
2471 static void qed_iwarp_ll2_comp_tx_pkt(void *cxt
, u8 connection_handle
,
2472 void *cookie
, dma_addr_t first_frag_addr
,
2473 bool b_last_fragment
, bool b_last_packet
)
2475 struct qed_iwarp_ll2_buff
*buffer
= cookie
;
2476 struct qed_iwarp_ll2_buff
*piggy
;
2477 struct qed_hwfn
*p_hwfn
= cxt
;
2479 if (!buffer
) /* can happen in packed mpa unaligned... */
2482 /* this was originally an rx packet, post it back */
2483 piggy
= buffer
->piggy_buf
;
2485 buffer
->piggy_buf
= NULL
;
2486 qed_iwarp_ll2_post_rx(p_hwfn
, piggy
, connection_handle
);
2489 qed_iwarp_ll2_post_rx(p_hwfn
, buffer
, connection_handle
);
2491 if (connection_handle
== p_hwfn
->p_rdma_info
->iwarp
.ll2_mpa_handle
)
2492 qed_iwarp_process_pending_pkts(p_hwfn
);
2497 static void qed_iwarp_ll2_rel_tx_pkt(void *cxt
, u8 connection_handle
,
2498 void *cookie
, dma_addr_t first_frag_addr
,
2499 bool b_last_fragment
, bool b_last_packet
)
2501 struct qed_iwarp_ll2_buff
*buffer
= cookie
;
2502 struct qed_hwfn
*p_hwfn
= cxt
;
2507 if (buffer
->piggy_buf
) {
2508 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
,
2509 buffer
->piggy_buf
->buff_size
,
2510 buffer
->piggy_buf
->data
,
2511 buffer
->piggy_buf
->data_phys_addr
);
2513 kfree(buffer
->piggy_buf
);
2516 dma_free_coherent(&p_hwfn
->cdev
->pdev
->dev
, buffer
->buff_size
,
2517 buffer
->data
, buffer
->data_phys_addr
);
2522 /* The only slowpath for iwarp ll2 is unalign flush. When this completion
2523 * is received, need to reset the FPDU.
2526 qed_iwarp_ll2_slowpath(void *cxt
,
2527 u8 connection_handle
,
2528 u32 opaque_data_0
, u32 opaque_data_1
)
2530 struct unaligned_opaque_data unalign_data
;
2531 struct qed_hwfn
*p_hwfn
= cxt
;
2532 struct qed_iwarp_fpdu
*fpdu
;
2535 qed_iwarp_mpa_get_data(p_hwfn
, &unalign_data
,
2536 opaque_data_0
, opaque_data_1
);
2538 cid
= le32_to_cpu(unalign_data
.cid
);
2540 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "(0x%x) Flush fpdu\n", cid
);
2542 fpdu
= qed_iwarp_get_curr_fpdu(p_hwfn
, (u16
)cid
);
2544 memset(fpdu
, 0, sizeof(*fpdu
));
2547 static int qed_iwarp_ll2_stop(struct qed_hwfn
*p_hwfn
)
2549 struct qed_iwarp_info
*iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
2552 if (iwarp_info
->ll2_syn_handle
!= QED_IWARP_HANDLE_INVAL
) {
2553 rc
= qed_ll2_terminate_connection(p_hwfn
,
2554 iwarp_info
->ll2_syn_handle
);
2556 DP_INFO(p_hwfn
, "Failed to terminate syn connection\n");
2558 qed_ll2_release_connection(p_hwfn
, iwarp_info
->ll2_syn_handle
);
2559 iwarp_info
->ll2_syn_handle
= QED_IWARP_HANDLE_INVAL
;
2562 if (iwarp_info
->ll2_ooo_handle
!= QED_IWARP_HANDLE_INVAL
) {
2563 rc
= qed_ll2_terminate_connection(p_hwfn
,
2564 iwarp_info
->ll2_ooo_handle
);
2566 DP_INFO(p_hwfn
, "Failed to terminate ooo connection\n");
2568 qed_ll2_release_connection(p_hwfn
, iwarp_info
->ll2_ooo_handle
);
2569 iwarp_info
->ll2_ooo_handle
= QED_IWARP_HANDLE_INVAL
;
2572 if (iwarp_info
->ll2_mpa_handle
!= QED_IWARP_HANDLE_INVAL
) {
2573 rc
= qed_ll2_terminate_connection(p_hwfn
,
2574 iwarp_info
->ll2_mpa_handle
);
2576 DP_INFO(p_hwfn
, "Failed to terminate mpa connection\n");
2578 qed_ll2_release_connection(p_hwfn
, iwarp_info
->ll2_mpa_handle
);
2579 iwarp_info
->ll2_mpa_handle
= QED_IWARP_HANDLE_INVAL
;
2582 qed_llh_remove_mac_filter(p_hwfn
->cdev
, 0,
2583 p_hwfn
->p_rdma_info
->iwarp
.mac_addr
);
2589 qed_iwarp_ll2_alloc_buffers(struct qed_hwfn
*p_hwfn
,
2590 int num_rx_bufs
, int buff_size
, u8 ll2_handle
)
2592 struct qed_iwarp_ll2_buff
*buffer
;
2596 for (i
= 0; i
< num_rx_bufs
; i
++) {
2597 buffer
= kzalloc(sizeof(*buffer
), GFP_KERNEL
);
2603 buffer
->data
= dma_alloc_coherent(&p_hwfn
->cdev
->pdev
->dev
,
2605 &buffer
->data_phys_addr
,
2607 if (!buffer
->data
) {
2613 buffer
->buff_size
= buff_size
;
2614 rc
= qed_iwarp_ll2_post_rx(p_hwfn
, buffer
, ll2_handle
);
2616 /* buffers will be deallocated by qed_ll2 */
2622 #define QED_IWARP_MAX_BUF_SIZE(mtu) \
2623 ALIGN((mtu) + ETH_HLEN + 2 * VLAN_HLEN + 2 + ETH_CACHE_LINE_SIZE, \
2624 ETH_CACHE_LINE_SIZE)
2627 qed_iwarp_ll2_start(struct qed_hwfn
*p_hwfn
,
2628 struct qed_rdma_start_in_params
*params
,
2631 struct qed_iwarp_info
*iwarp_info
;
2632 struct qed_ll2_acquire_data data
;
2633 struct qed_ll2_cbs cbs
;
2639 iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
2640 iwarp_info
->ll2_syn_handle
= QED_IWARP_HANDLE_INVAL
;
2641 iwarp_info
->ll2_ooo_handle
= QED_IWARP_HANDLE_INVAL
;
2642 iwarp_info
->ll2_mpa_handle
= QED_IWARP_HANDLE_INVAL
;
2644 iwarp_info
->max_mtu
= params
->max_mtu
;
2646 ether_addr_copy(p_hwfn
->p_rdma_info
->iwarp
.mac_addr
, params
->mac_addr
);
2648 rc
= qed_llh_add_mac_filter(p_hwfn
->cdev
, 0, params
->mac_addr
);
2652 /* Start SYN connection */
2653 cbs
.rx_comp_cb
= qed_iwarp_ll2_comp_syn_pkt
;
2654 cbs
.rx_release_cb
= qed_iwarp_ll2_rel_rx_pkt
;
2655 cbs
.tx_comp_cb
= qed_iwarp_ll2_comp_tx_pkt
;
2656 cbs
.tx_release_cb
= qed_iwarp_ll2_rel_tx_pkt
;
2657 cbs
.slowpath_cb
= NULL
;
2658 cbs
.cookie
= p_hwfn
;
2660 memset(&data
, 0, sizeof(data
));
2661 data
.input
.conn_type
= QED_LL2_TYPE_IWARP
;
2662 /* SYN will use ctx based queues */
2663 data
.input
.rx_conn_type
= QED_LL2_RX_TYPE_CTX
;
2664 data
.input
.mtu
= params
->max_mtu
;
2665 data
.input
.rx_num_desc
= QED_IWARP_LL2_SYN_RX_SIZE
;
2666 data
.input
.tx_num_desc
= QED_IWARP_LL2_SYN_TX_SIZE
;
2667 data
.input
.tx_max_bds_per_packet
= 1; /* will never be fragmented */
2668 data
.input
.tx_tc
= PKT_LB_TC
;
2669 data
.input
.tx_dest
= QED_LL2_TX_DEST_LB
;
2670 data
.p_connection_handle
= &iwarp_info
->ll2_syn_handle
;
2673 rc
= qed_ll2_acquire_connection(p_hwfn
, &data
);
2675 DP_NOTICE(p_hwfn
, "Failed to acquire LL2 connection\n");
2676 qed_llh_remove_mac_filter(p_hwfn
->cdev
, 0, params
->mac_addr
);
2680 rc
= qed_ll2_establish_connection(p_hwfn
, iwarp_info
->ll2_syn_handle
);
2682 DP_NOTICE(p_hwfn
, "Failed to establish LL2 connection\n");
2686 buff_size
= QED_IWARP_MAX_BUF_SIZE(params
->max_mtu
);
2687 rc
= qed_iwarp_ll2_alloc_buffers(p_hwfn
,
2688 QED_IWARP_LL2_SYN_RX_SIZE
,
2690 iwarp_info
->ll2_syn_handle
);
2694 /* Start OOO connection */
2695 data
.input
.conn_type
= QED_LL2_TYPE_OOO
;
2696 /* OOO/unaligned will use legacy ll2 queues (ram based) */
2697 data
.input
.rx_conn_type
= QED_LL2_RX_TYPE_LEGACY
;
2698 data
.input
.mtu
= params
->max_mtu
;
2700 n_ooo_bufs
= (QED_IWARP_MAX_OOO
* rcv_wnd_size
) /
2701 iwarp_info
->max_mtu
;
2702 n_ooo_bufs
= min_t(u32
, n_ooo_bufs
, QED_IWARP_LL2_OOO_MAX_RX_SIZE
);
2704 data
.input
.rx_num_desc
= n_ooo_bufs
;
2705 data
.input
.rx_num_ooo_buffers
= n_ooo_bufs
;
2707 data
.input
.tx_max_bds_per_packet
= 1; /* will never be fragmented */
2708 data
.input
.tx_num_desc
= QED_IWARP_LL2_OOO_DEF_TX_SIZE
;
2709 data
.p_connection_handle
= &iwarp_info
->ll2_ooo_handle
;
2711 rc
= qed_ll2_acquire_connection(p_hwfn
, &data
);
2715 rc
= qed_ll2_establish_connection(p_hwfn
, iwarp_info
->ll2_ooo_handle
);
2719 /* Start Unaligned MPA connection */
2720 cbs
.rx_comp_cb
= qed_iwarp_ll2_comp_mpa_pkt
;
2721 cbs
.slowpath_cb
= qed_iwarp_ll2_slowpath
;
2723 memset(&data
, 0, sizeof(data
));
2724 data
.input
.conn_type
= QED_LL2_TYPE_IWARP
;
2725 data
.input
.mtu
= params
->max_mtu
;
2726 /* FW requires that once a packet arrives OOO, it must have at
2727 * least 2 rx buffers available on the unaligned connection
2728 * for handling the case that it is a partial fpdu.
2730 data
.input
.rx_num_desc
= n_ooo_bufs
* 2;
2731 data
.input
.tx_num_desc
= data
.input
.rx_num_desc
;
2732 data
.input
.tx_max_bds_per_packet
= QED_IWARP_MAX_BDS_PER_FPDU
;
2733 data
.input
.tx_tc
= PKT_LB_TC
;
2734 data
.input
.tx_dest
= QED_LL2_TX_DEST_LB
;
2735 data
.p_connection_handle
= &iwarp_info
->ll2_mpa_handle
;
2736 data
.input
.secondary_queue
= true;
2739 rc
= qed_ll2_acquire_connection(p_hwfn
, &data
);
2743 rc
= qed_ll2_establish_connection(p_hwfn
, iwarp_info
->ll2_mpa_handle
);
2747 rc
= qed_iwarp_ll2_alloc_buffers(p_hwfn
,
2748 data
.input
.rx_num_desc
,
2750 iwarp_info
->ll2_mpa_handle
);
2754 iwarp_info
->partial_fpdus
= kcalloc((u16
)p_hwfn
->p_rdma_info
->num_qps
,
2755 sizeof(*iwarp_info
->partial_fpdus
),
2757 if (!iwarp_info
->partial_fpdus
) {
2762 iwarp_info
->max_num_partial_fpdus
= (u16
)p_hwfn
->p_rdma_info
->num_qps
;
2764 iwarp_info
->mpa_intermediate_buf
= kzalloc(buff_size
, GFP_KERNEL
);
2765 if (!iwarp_info
->mpa_intermediate_buf
) {
2770 /* The mpa_bufs array serves for pending RX packets received on the
2771 * mpa ll2 that don't have place on the tx ring and require later
2772 * processing. We can't fail on allocation of such a struct therefore
2773 * we allocate enough to take care of all rx packets
2775 iwarp_info
->mpa_bufs
= kcalloc(data
.input
.rx_num_desc
,
2776 sizeof(*iwarp_info
->mpa_bufs
),
2778 if (!iwarp_info
->mpa_bufs
) {
2783 INIT_LIST_HEAD(&iwarp_info
->mpa_buf_pending_list
);
2784 INIT_LIST_HEAD(&iwarp_info
->mpa_buf_list
);
2785 for (i
= 0; i
< data
.input
.rx_num_desc
; i
++)
2786 list_add_tail(&iwarp_info
->mpa_bufs
[i
].list_entry
,
2787 &iwarp_info
->mpa_buf_list
);
2790 qed_iwarp_ll2_stop(p_hwfn
);
2798 } qed_iwarp_rcv_wnd_size
[MAX_CHIP_IDS
] = {
2799 {QED_IWARP_RCV_WND_SIZE_DEF_BB_2P
, QED_IWARP_RCV_WND_SIZE_DEF_BB_4P
},
2800 {QED_IWARP_RCV_WND_SIZE_DEF_AH_2P
, QED_IWARP_RCV_WND_SIZE_DEF_AH_4P
}
2803 int qed_iwarp_setup(struct qed_hwfn
*p_hwfn
,
2804 struct qed_rdma_start_in_params
*params
)
2806 struct qed_dev
*cdev
= p_hwfn
->cdev
;
2807 struct qed_iwarp_info
*iwarp_info
;
2808 enum chip_ids chip_id
;
2811 iwarp_info
= &p_hwfn
->p_rdma_info
->iwarp
;
2813 iwarp_info
->tcp_flags
= QED_IWARP_TS_EN
;
2815 chip_id
= QED_IS_BB(cdev
) ? CHIP_BB
: CHIP_K2
;
2816 rcv_wnd_size
= (qed_device_num_ports(cdev
) == 4) ?
2817 qed_iwarp_rcv_wnd_size
[chip_id
].four_ports
:
2818 qed_iwarp_rcv_wnd_size
[chip_id
].two_ports
;
2820 /* value 0 is used for ilog2(QED_IWARP_RCV_WND_SIZE_MIN) */
2821 iwarp_info
->rcv_wnd_scale
= ilog2(rcv_wnd_size
) -
2822 ilog2(QED_IWARP_RCV_WND_SIZE_MIN
);
2823 iwarp_info
->rcv_wnd_size
= rcv_wnd_size
>> iwarp_info
->rcv_wnd_scale
;
2824 iwarp_info
->crc_needed
= QED_IWARP_PARAM_CRC_NEEDED
;
2825 iwarp_info
->mpa_rev
= MPA_NEGOTIATION_TYPE_ENHANCED
;
2827 iwarp_info
->peer2peer
= QED_IWARP_PARAM_P2P
;
2829 iwarp_info
->rtr_type
= MPA_RTR_TYPE_ZERO_SEND
|
2830 MPA_RTR_TYPE_ZERO_WRITE
|
2831 MPA_RTR_TYPE_ZERO_READ
;
2833 spin_lock_init(&p_hwfn
->p_rdma_info
->iwarp
.qp_lock
);
2834 INIT_LIST_HEAD(&p_hwfn
->p_rdma_info
->iwarp
.ep_list
);
2835 INIT_LIST_HEAD(&p_hwfn
->p_rdma_info
->iwarp
.listen_list
);
2837 qed_spq_register_async_cb(p_hwfn
, PROTOCOLID_IWARP
,
2838 qed_iwarp_async_event
);
2839 qed_ooo_setup(p_hwfn
);
2841 return qed_iwarp_ll2_start(p_hwfn
, params
, rcv_wnd_size
);
2844 int qed_iwarp_stop(struct qed_hwfn
*p_hwfn
)
2848 qed_iwarp_free_prealloc_ep(p_hwfn
);
2849 rc
= qed_iwarp_wait_for_all_cids(p_hwfn
);
2853 return qed_iwarp_ll2_stop(p_hwfn
);
2856 static void qed_iwarp_qp_in_error(struct qed_hwfn
*p_hwfn
,
2857 struct qed_iwarp_ep
*ep
,
2860 struct qed_iwarp_cm_event_params params
;
2862 qed_iwarp_modify_qp(p_hwfn
, ep
->qp
, QED_IWARP_QP_STATE_ERROR
, true);
2864 params
.event
= QED_IWARP_EVENT_CLOSE
;
2865 params
.ep_context
= ep
;
2866 params
.cm_info
= &ep
->cm_info
;
2867 params
.status
= (fw_return_code
== IWARP_QP_IN_ERROR_GOOD_CLOSE
) ?
2870 /* paired with READ_ONCE in destroy_qp */
2871 smp_store_release(&ep
->state
, QED_IWARP_EP_CLOSED
);
2873 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
2874 list_del(&ep
->list_entry
);
2875 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
2877 ep
->event_cb(ep
->cb_context
, ¶ms
);
2880 static void qed_iwarp_exception_received(struct qed_hwfn
*p_hwfn
,
2881 struct qed_iwarp_ep
*ep
,
2884 struct qed_iwarp_cm_event_params params
;
2885 bool event_cb
= false;
2887 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "EP(0x%x) fw_ret_code=%d\n",
2888 ep
->cid
, fw_ret_code
);
2890 switch (fw_ret_code
) {
2891 case IWARP_EXCEPTION_DETECTED_LLP_CLOSED
:
2893 params
.event
= QED_IWARP_EVENT_DISCONNECT
;
2896 case IWARP_EXCEPTION_DETECTED_LLP_RESET
:
2897 params
.status
= -ECONNRESET
;
2898 params
.event
= QED_IWARP_EVENT_DISCONNECT
;
2901 case IWARP_EXCEPTION_DETECTED_RQ_EMPTY
:
2902 params
.event
= QED_IWARP_EVENT_RQ_EMPTY
;
2905 case IWARP_EXCEPTION_DETECTED_IRQ_FULL
:
2906 params
.event
= QED_IWARP_EVENT_IRQ_FULL
;
2909 case IWARP_EXCEPTION_DETECTED_LLP_TIMEOUT
:
2910 params
.event
= QED_IWARP_EVENT_LLP_TIMEOUT
;
2913 case IWARP_EXCEPTION_DETECTED_REMOTE_PROTECTION_ERROR
:
2914 params
.event
= QED_IWARP_EVENT_REMOTE_PROTECTION_ERROR
;
2917 case IWARP_EXCEPTION_DETECTED_CQ_OVERFLOW
:
2918 params
.event
= QED_IWARP_EVENT_CQ_OVERFLOW
;
2921 case IWARP_EXCEPTION_DETECTED_LOCAL_CATASTROPHIC
:
2922 params
.event
= QED_IWARP_EVENT_QP_CATASTROPHIC
;
2925 case IWARP_EXCEPTION_DETECTED_LOCAL_ACCESS_ERROR
:
2926 params
.event
= QED_IWARP_EVENT_LOCAL_ACCESS_ERROR
;
2929 case IWARP_EXCEPTION_DETECTED_REMOTE_OPERATION_ERROR
:
2930 params
.event
= QED_IWARP_EVENT_REMOTE_OPERATION_ERROR
;
2933 case IWARP_EXCEPTION_DETECTED_TERMINATE_RECEIVED
:
2934 params
.event
= QED_IWARP_EVENT_TERMINATE_RECEIVED
;
2938 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2939 "Unhandled exception received...fw_ret_code=%d\n",
2945 params
.ep_context
= ep
;
2946 params
.cm_info
= &ep
->cm_info
;
2947 ep
->event_cb(ep
->cb_context
, ¶ms
);
2952 qed_iwarp_tcp_connect_unsuccessful(struct qed_hwfn
*p_hwfn
,
2953 struct qed_iwarp_ep
*ep
, u8 fw_return_code
)
2955 struct qed_iwarp_cm_event_params params
;
2957 memset(¶ms
, 0, sizeof(params
));
2958 params
.event
= QED_IWARP_EVENT_ACTIVE_COMPLETE
;
2959 params
.ep_context
= ep
;
2960 params
.cm_info
= &ep
->cm_info
;
2961 /* paired with READ_ONCE in destroy_qp */
2962 smp_store_release(&ep
->state
, QED_IWARP_EP_CLOSED
);
2964 switch (fw_return_code
) {
2965 case IWARP_CONN_ERROR_TCP_CONNECT_INVALID_PACKET
:
2966 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2967 "%s(0x%x) TCP connect got invalid packet\n",
2968 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->tcp_cid
);
2969 params
.status
= -ECONNRESET
;
2971 case IWARP_CONN_ERROR_TCP_CONNECTION_RST
:
2972 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
2973 "%s(0x%x) TCP Connection Reset\n",
2974 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->tcp_cid
);
2975 params
.status
= -ECONNRESET
;
2977 case IWARP_CONN_ERROR_TCP_CONNECT_TIMEOUT
:
2978 DP_NOTICE(p_hwfn
, "%s(0x%x) TCP timeout\n",
2979 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->tcp_cid
);
2980 params
.status
= -EBUSY
;
2982 case IWARP_CONN_ERROR_MPA_NOT_SUPPORTED_VER
:
2983 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA not supported VER\n",
2984 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->tcp_cid
);
2985 params
.status
= -ECONNREFUSED
;
2987 case IWARP_CONN_ERROR_MPA_INVALID_PACKET
:
2988 DP_NOTICE(p_hwfn
, "%s(0x%x) MPA Invalid Packet\n",
2989 QED_IWARP_CONNECT_MODE_STRING(ep
), ep
->tcp_cid
);
2990 params
.status
= -ECONNRESET
;
2994 "%s(0x%x) Unexpected return code tcp connect: %d\n",
2995 QED_IWARP_CONNECT_MODE_STRING(ep
),
2996 ep
->tcp_cid
, fw_return_code
);
2997 params
.status
= -ECONNRESET
;
3001 if (ep
->connect_mode
== TCP_CONNECT_PASSIVE
) {
3002 ep
->tcp_cid
= QED_IWARP_INVALID_TCP_CID
;
3003 qed_iwarp_return_ep(p_hwfn
, ep
);
3005 ep
->event_cb(ep
->cb_context
, ¶ms
);
3006 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3007 list_del(&ep
->list_entry
);
3008 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3013 qed_iwarp_connect_complete(struct qed_hwfn
*p_hwfn
,
3014 struct qed_iwarp_ep
*ep
, u8 fw_return_code
)
3016 u8 ll2_syn_handle
= p_hwfn
->p_rdma_info
->iwarp
.ll2_syn_handle
;
3018 if (ep
->connect_mode
== TCP_CONNECT_PASSIVE
) {
3019 /* Done with the SYN packet, post back to ll2 rx */
3020 qed_iwarp_ll2_post_rx(p_hwfn
, ep
->syn
, ll2_syn_handle
);
3024 /* If connect failed - upper layer doesn't know about it */
3025 if (fw_return_code
== RDMA_RETURN_OK
)
3026 qed_iwarp_mpa_received(p_hwfn
, ep
);
3028 qed_iwarp_tcp_connect_unsuccessful(p_hwfn
, ep
,
3031 if (fw_return_code
== RDMA_RETURN_OK
)
3032 qed_iwarp_mpa_offload(p_hwfn
, ep
);
3034 qed_iwarp_tcp_connect_unsuccessful(p_hwfn
, ep
,
3040 qed_iwarp_check_ep_ok(struct qed_hwfn
*p_hwfn
, struct qed_iwarp_ep
*ep
)
3042 if (!ep
|| (ep
->sig
!= QED_EP_SIG
)) {
3043 DP_ERR(p_hwfn
, "ERROR ON ASYNC ep=%p\n", ep
);
3050 static int qed_iwarp_async_event(struct qed_hwfn
*p_hwfn
, u8 fw_event_code
,
3051 __le16 echo
, union event_ring_data
*data
,
3054 struct qed_rdma_events events
= p_hwfn
->p_rdma_info
->events
;
3055 struct regpair
*fw_handle
= &data
->rdma_data
.async_handle
;
3056 struct qed_iwarp_ep
*ep
= NULL
;
3061 ep
= (struct qed_iwarp_ep
*)(uintptr_t)HILO_64(fw_handle
->hi
,
3064 switch (fw_event_code
) {
3065 case IWARP_EVENT_TYPE_ASYNC_CONNECT_COMPLETE
:
3066 /* Async completion after TCP 3-way handshake */
3067 if (!qed_iwarp_check_ep_ok(p_hwfn
, ep
))
3071 "EP(0x%x) IWARP_EVENT_TYPE_ASYNC_CONNECT_COMPLETE fw_ret_code=%d\n",
3072 ep
->tcp_cid
, fw_return_code
);
3073 qed_iwarp_connect_complete(p_hwfn
, ep
, fw_return_code
);
3075 case IWARP_EVENT_TYPE_ASYNC_EXCEPTION_DETECTED
:
3076 if (!qed_iwarp_check_ep_ok(p_hwfn
, ep
))
3080 "QP(0x%x) IWARP_EVENT_TYPE_ASYNC_EXCEPTION_DETECTED fw_ret_code=%d\n",
3081 ep
->cid
, fw_return_code
);
3082 qed_iwarp_exception_received(p_hwfn
, ep
, fw_return_code
);
3084 case IWARP_EVENT_TYPE_ASYNC_QP_IN_ERROR_STATE
:
3085 /* Async completion for Close Connection ramrod */
3086 if (!qed_iwarp_check_ep_ok(p_hwfn
, ep
))
3090 "QP(0x%x) IWARP_EVENT_TYPE_ASYNC_QP_IN_ERROR_STATE fw_ret_code=%d\n",
3091 ep
->cid
, fw_return_code
);
3092 qed_iwarp_qp_in_error(p_hwfn
, ep
, fw_return_code
);
3094 case IWARP_EVENT_TYPE_ASYNC_ENHANCED_MPA_REPLY_ARRIVED
:
3095 /* Async event for active side only */
3096 if (!qed_iwarp_check_ep_ok(p_hwfn
, ep
))
3100 "QP(0x%x) IWARP_EVENT_TYPE_ASYNC_MPA_HANDSHAKE_MPA_REPLY_ARRIVED fw_ret_code=%d\n",
3101 ep
->cid
, fw_return_code
);
3102 qed_iwarp_mpa_reply_arrived(p_hwfn
, ep
);
3104 case IWARP_EVENT_TYPE_ASYNC_MPA_HANDSHAKE_COMPLETE
:
3105 if (!qed_iwarp_check_ep_ok(p_hwfn
, ep
))
3109 "QP(0x%x) IWARP_EVENT_TYPE_ASYNC_MPA_HANDSHAKE_COMPLETE fw_ret_code=%d\n",
3110 ep
->cid
, fw_return_code
);
3111 qed_iwarp_mpa_complete(p_hwfn
, ep
, fw_return_code
);
3113 case IWARP_EVENT_TYPE_ASYNC_CID_CLEANED
:
3114 cid
= (u16
)le32_to_cpu(fw_handle
->lo
);
3115 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
,
3116 "(0x%x)IWARP_EVENT_TYPE_ASYNC_CID_CLEANED\n", cid
);
3117 qed_iwarp_cid_cleaned(p_hwfn
, cid
);
3120 case IWARP_EVENT_TYPE_ASYNC_SRQ_EMPTY
:
3121 DP_NOTICE(p_hwfn
, "IWARP_EVENT_TYPE_ASYNC_SRQ_EMPTY\n");
3122 srq_offset
= p_hwfn
->p_rdma_info
->srq_id_offset
;
3123 /* FW assigns value that is no greater than u16 */
3124 srq_id
= ((u16
)le32_to_cpu(fw_handle
->lo
)) - srq_offset
;
3125 events
.affiliated_event(events
.context
,
3126 QED_IWARP_EVENT_SRQ_EMPTY
,
3129 case IWARP_EVENT_TYPE_ASYNC_SRQ_LIMIT
:
3130 DP_NOTICE(p_hwfn
, "IWARP_EVENT_TYPE_ASYNC_SRQ_LIMIT\n");
3131 srq_offset
= p_hwfn
->p_rdma_info
->srq_id_offset
;
3132 /* FW assigns value that is no greater than u16 */
3133 srq_id
= ((u16
)le32_to_cpu(fw_handle
->lo
)) - srq_offset
;
3134 events
.affiliated_event(events
.context
,
3135 QED_IWARP_EVENT_SRQ_LIMIT
,
3138 case IWARP_EVENT_TYPE_ASYNC_CQ_OVERFLOW
:
3139 DP_NOTICE(p_hwfn
, "IWARP_EVENT_TYPE_ASYNC_CQ_OVERFLOW\n");
3141 p_hwfn
->p_rdma_info
->events
.affiliated_event(
3142 p_hwfn
->p_rdma_info
->events
.context
,
3143 QED_IWARP_EVENT_CQ_OVERFLOW
,
3147 DP_ERR(p_hwfn
, "Received unexpected async iwarp event %d\n",
3155 qed_iwarp_create_listen(void *rdma_cxt
,
3156 struct qed_iwarp_listen_in
*iparams
,
3157 struct qed_iwarp_listen_out
*oparams
)
3159 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
3160 struct qed_iwarp_listener
*listener
;
3162 listener
= kzalloc(sizeof(*listener
), GFP_KERNEL
);
3166 listener
->ip_version
= iparams
->ip_version
;
3167 memcpy(listener
->ip_addr
, iparams
->ip_addr
, sizeof(listener
->ip_addr
));
3168 listener
->port
= iparams
->port
;
3169 listener
->vlan
= iparams
->vlan
;
3171 listener
->event_cb
= iparams
->event_cb
;
3172 listener
->cb_context
= iparams
->cb_context
;
3173 listener
->max_backlog
= iparams
->max_backlog
;
3174 oparams
->handle
= listener
;
3176 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3177 list_add_tail(&listener
->list_entry
,
3178 &p_hwfn
->p_rdma_info
->iwarp
.listen_list
);
3179 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3183 "callback=%p handle=%p ip=%x:%x:%x:%x port=0x%x vlan=0x%x\n",
3186 listener
->ip_addr
[0],
3187 listener
->ip_addr
[1],
3188 listener
->ip_addr
[2],
3189 listener
->ip_addr
[3], listener
->port
, listener
->vlan
);
3194 int qed_iwarp_destroy_listen(void *rdma_cxt
, void *handle
)
3196 struct qed_iwarp_listener
*listener
= handle
;
3197 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
3199 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "handle=%p\n", handle
);
3201 spin_lock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3202 list_del(&listener
->list_entry
);
3203 spin_unlock_bh(&p_hwfn
->p_rdma_info
->iwarp
.iw_lock
);
3210 int qed_iwarp_send_rtr(void *rdma_cxt
, struct qed_iwarp_send_rtr_in
*iparams
)
3212 struct qed_hwfn
*p_hwfn
= rdma_cxt
;
3213 struct qed_sp_init_data init_data
;
3214 struct qed_spq_entry
*p_ent
;
3215 struct qed_iwarp_ep
*ep
;
3216 struct qed_rdma_qp
*qp
;
3219 ep
= iparams
->ep_context
;
3221 DP_ERR(p_hwfn
, "Ep Context receive in send_rtr is NULL\n");
3227 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "QP(0x%x) EP(0x%x)\n",
3228 qp
->icid
, ep
->tcp_cid
);
3230 memset(&init_data
, 0, sizeof(init_data
));
3231 init_data
.cid
= qp
->icid
;
3232 init_data
.opaque_fid
= p_hwfn
->hw_info
.opaque_fid
;
3233 init_data
.comp_mode
= QED_SPQ_MODE_CB
;
3235 rc
= qed_sp_init_request(p_hwfn
, &p_ent
,
3236 IWARP_RAMROD_CMD_ID_MPA_OFFLOAD_SEND_RTR
,
3237 PROTOCOLID_IWARP
, &init_data
);
3242 rc
= qed_spq_post(p_hwfn
, p_ent
, NULL
);
3244 DP_VERBOSE(p_hwfn
, QED_MSG_RDMA
, "rc = 0x%x\n", rc
);
3250 qed_iwarp_query_qp(struct qed_rdma_qp
*qp
,
3251 struct qed_rdma_query_qp_out_params
*out_params
)
3253 out_params
->state
= qed_iwarp2roce_state(qp
->iwarp_state
);