2 * Copyright (c) 2006 - 2014 Intel Corporation. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
35 #define TCPOPT_TIMESTAMP 8
37 #include <linux/atomic.h>
38 #include <linux/skbuff.h>
40 #include <linux/tcp.h>
41 #include <linux/init.h>
42 #include <linux/if_arp.h>
43 #include <linux/if_vlan.h>
44 #include <linux/notifier.h>
45 #include <linux/net.h>
46 #include <linux/types.h>
47 #include <linux/timer.h>
48 #include <linux/time.h>
49 #include <linux/delay.h>
50 #include <linux/etherdevice.h>
51 #include <linux/netdevice.h>
52 #include <linux/random.h>
53 #include <linux/list.h>
54 #include <linux/threads.h>
55 #include <linux/highmem.h>
56 #include <linux/slab.h>
58 #include <net/neighbour.h>
59 #include <net/route.h>
60 #include <net/ip_fib.h>
62 #include <linux/fcntl.h>
67 u32 cm_packets_bounced
;
68 u32 cm_packets_dropped
;
69 u32 cm_packets_retrans
;
70 u32 cm_packets_created
;
71 u32 cm_packets_received
;
72 atomic_t cm_listens_created
;
73 atomic_t cm_listens_destroyed
;
75 atomic_t cm_loopbacks
;
76 atomic_t cm_nodes_created
;
77 atomic_t cm_nodes_destroyed
;
78 atomic_t cm_accel_dropped_pkts
;
79 atomic_t cm_resets_recvd
;
81 static inline int mini_cm_accelerated(struct nes_cm_core
*, struct nes_cm_node
*);
82 static struct nes_cm_listener
*mini_cm_listen(struct nes_cm_core
*, struct nes_vnic
*, struct nes_cm_info
*);
83 static int mini_cm_del_listen(struct nes_cm_core
*, struct nes_cm_listener
*);
84 static struct nes_cm_node
*mini_cm_connect(struct nes_cm_core
*, struct nes_vnic
*, u16
, void *, struct nes_cm_info
*);
85 static int mini_cm_close(struct nes_cm_core
*, struct nes_cm_node
*);
86 static int mini_cm_accept(struct nes_cm_core
*, struct nes_cm_node
*);
87 static int mini_cm_reject(struct nes_cm_core
*, struct nes_cm_node
*);
88 static int mini_cm_recv_pkt(struct nes_cm_core
*, struct nes_vnic
*, struct sk_buff
*);
89 static int mini_cm_dealloc_core(struct nes_cm_core
*);
90 static int mini_cm_get(struct nes_cm_core
*);
91 static int mini_cm_set(struct nes_cm_core
*, u32
, u32
);
93 static void form_cm_frame(struct sk_buff
*, struct nes_cm_node
*, void *, u32
, void *, u32
, u8
);
94 static int add_ref_cm_node(struct nes_cm_node
*);
95 static int rem_ref_cm_node(struct nes_cm_core
*, struct nes_cm_node
*);
97 static int nes_cm_disconn_true(struct nes_qp
*);
98 static int nes_cm_post_event(struct nes_cm_event
*event
);
99 static int nes_disconnect(struct nes_qp
*nesqp
, int abrupt
);
100 static void nes_disconnect_worker(struct work_struct
*work
);
102 static int send_mpa_request(struct nes_cm_node
*, struct sk_buff
*);
103 static int send_mpa_reject(struct nes_cm_node
*);
104 static int send_syn(struct nes_cm_node
*, u32
, struct sk_buff
*);
105 static int send_reset(struct nes_cm_node
*, struct sk_buff
*);
106 static int send_ack(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
);
107 static int send_fin(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
);
108 static void process_packet(struct nes_cm_node
*, struct sk_buff
*, struct nes_cm_core
*);
110 static void active_open_err(struct nes_cm_node
*, struct sk_buff
*, int);
111 static void passive_open_err(struct nes_cm_node
*, struct sk_buff
*, int);
112 static void cleanup_retrans_entry(struct nes_cm_node
*);
113 static void handle_rcv_mpa(struct nes_cm_node
*, struct sk_buff
*);
114 static void free_retrans_entry(struct nes_cm_node
*cm_node
);
115 static int handle_tcp_options(struct nes_cm_node
*cm_node
, struct tcphdr
*tcph
, struct sk_buff
*skb
, int optionsize
, int passive
);
117 /* CM event handler functions */
118 static void cm_event_connected(struct nes_cm_event
*);
119 static void cm_event_connect_error(struct nes_cm_event
*);
120 static void cm_event_reset(struct nes_cm_event
*);
121 static void cm_event_mpa_req(struct nes_cm_event
*);
122 static void cm_event_mpa_reject(struct nes_cm_event
*);
123 static void handle_recv_entry(struct nes_cm_node
*cm_node
, u32 rem_node
);
125 /* MPA build functions */
126 static int cm_build_mpa_frame(struct nes_cm_node
*, u8
**, u16
*, u8
*, u8
);
127 static void build_mpa_v2(struct nes_cm_node
*, void *, u8
);
128 static void build_mpa_v1(struct nes_cm_node
*, void *, u8
);
129 static void build_rdma0_msg(struct nes_cm_node
*, struct nes_qp
**);
131 static void print_core(struct nes_cm_core
*core
);
132 static void record_ird_ord(struct nes_cm_node
*, u16
, u16
);
134 /* External CM API Interface */
135 /* instance of function pointers for client API */
136 /* set address of this instance to cm_core->cm_ops at cm_core alloc */
137 static struct nes_cm_ops nes_cm_api
= {
146 mini_cm_dealloc_core
,
151 static struct nes_cm_core
*g_cm_core
;
153 atomic_t cm_connects
;
155 atomic_t cm_disconnects
;
157 atomic_t cm_connecteds
;
158 atomic_t cm_connect_reqs
;
/*
 * nes_add_ref_cm_node - non-static entry point for add_ref_cm_node()
 * @cm_node: connection node handed straight to add_ref_cm_node()
 *
 * Returns the value produced by add_ref_cm_node().
 */
int nes_add_ref_cm_node(struct nes_cm_node *cm_node)
{
	return add_ref_cm_node(cm_node);
}
166 int nes_rem_ref_cm_node(struct nes_cm_node
*cm_node
)
168 return rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
173 static struct nes_cm_event
*create_event(struct nes_cm_node
* cm_node
,
174 enum nes_cm_event_type type
)
176 struct nes_cm_event
*event
;
181 /* allocate an empty event */
182 event
= kzalloc(sizeof(*event
), GFP_ATOMIC
);
188 event
->cm_node
= cm_node
;
189 event
->cm_info
.rem_addr
= cm_node
->rem_addr
;
190 event
->cm_info
.loc_addr
= cm_node
->loc_addr
;
191 event
->cm_info
.rem_port
= cm_node
->rem_port
;
192 event
->cm_info
.loc_port
= cm_node
->loc_port
;
193 event
->cm_info
.cm_id
= cm_node
->cm_id
;
195 nes_debug(NES_DBG_CM
, "cm_node=%p Created event=%p, type=%u, "
196 "dst_addr=%08x[%x], src_addr=%08x[%x]\n",
197 cm_node
, event
, type
, event
->cm_info
.loc_addr
,
198 event
->cm_info
.loc_port
, event
->cm_info
.rem_addr
,
199 event
->cm_info
.rem_port
);
201 nes_cm_post_event(event
);
209 static int send_mpa_request(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
212 u8
*start_ptr
= &start_addr
;
213 u8
**start_buff
= &start_ptr
;
217 nes_debug(NES_DBG_CM
, "skb set to NULL\n");
221 /* send an MPA Request frame */
222 cm_build_mpa_frame(cm_node
, start_buff
, &buff_len
, NULL
, MPA_KEY_REQUEST
);
223 form_cm_frame(skb
, cm_node
, NULL
, 0, *start_buff
, buff_len
, SET_ACK
);
225 return schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 1, 0);
230 static int send_mpa_reject(struct nes_cm_node
*cm_node
)
232 struct sk_buff
*skb
= NULL
;
234 u8
*start_ptr
= &start_addr
;
235 u8
**start_buff
= &start_ptr
;
237 struct ietf_mpa_v1
*mpa_frame
;
239 skb
= dev_alloc_skb(MAX_CM_BUFFER
);
241 nes_debug(NES_DBG_CM
, "Failed to get a Free pkt\n");
245 /* send an MPA reject frame */
246 cm_build_mpa_frame(cm_node
, start_buff
, &buff_len
, NULL
, MPA_KEY_REPLY
);
247 mpa_frame
= (struct ietf_mpa_v1
*)*start_buff
;
248 mpa_frame
->flags
|= IETF_MPA_FLAGS_REJECT
;
249 form_cm_frame(skb
, cm_node
, NULL
, 0, *start_buff
, buff_len
, SET_ACK
| SET_FIN
);
251 cm_node
->state
= NES_CM_STATE_FIN_WAIT1
;
252 return schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 1, 0);
257 * parse_mpa - process a received TCP pkt, we are expecting an IETF MPA frame
260 static int parse_mpa(struct nes_cm_node
*cm_node
, u8
*buffer
, u32
*type
,
263 struct ietf_mpa_v1
*mpa_frame
;
264 struct ietf_mpa_v2
*mpa_v2_frame
;
265 struct ietf_rtr_msg
*rtr_msg
;
269 *type
= NES_MPA_REQUEST_ACCEPT
;
271 /* assume req frame is in tcp data payload */
272 if (len
< sizeof(struct ietf_mpa_v1
)) {
273 nes_debug(NES_DBG_CM
, "The received ietf buffer was too small (%x)\n", len
);
277 /* points to the beginning of the frame, which could be MPA V1 or V2 */
278 mpa_frame
= (struct ietf_mpa_v1
*)buffer
;
279 mpa_hdr_len
= sizeof(struct ietf_mpa_v1
);
280 priv_data_len
= ntohs(mpa_frame
->priv_data_len
);
282 /* make sure mpa private data len is less than 512 bytes */
283 if (priv_data_len
> IETF_MAX_PRIV_DATA_LEN
) {
284 nes_debug(NES_DBG_CM
, "The received Length of Private"
285 " Data field exceeds 512 octets\n");
289 * make sure MPA receiver interoperate with the
290 * received MPA version and MPA key information
293 if (mpa_frame
->rev
!= IETF_MPA_V1
&& mpa_frame
->rev
!= IETF_MPA_V2
) {
294 nes_debug(NES_DBG_CM
, "The received mpa version"
295 " is not supported\n");
299 * backwards compatibility only
301 if (mpa_frame
->rev
> cm_node
->mpa_frame_rev
) {
302 nes_debug(NES_DBG_CM
, "The received mpa version"
303 " can not be interoperated\n");
306 cm_node
->mpa_frame_rev
= mpa_frame
->rev
;
309 if (cm_node
->state
!= NES_CM_STATE_MPAREQ_SENT
) {
310 if (memcmp(mpa_frame
->key
, IEFT_MPA_KEY_REQ
, IETF_MPA_KEY_SIZE
)) {
311 nes_debug(NES_DBG_CM
, "Unexpected MPA Key received \n");
315 if (memcmp(mpa_frame
->key
, IEFT_MPA_KEY_REP
, IETF_MPA_KEY_SIZE
)) {
316 nes_debug(NES_DBG_CM
, "Unexpected MPA Key received \n");
321 if (priv_data_len
+ mpa_hdr_len
!= len
) {
322 nes_debug(NES_DBG_CM
, "The received ietf buffer was not right"
323 " complete (%x + %x != %x)\n",
324 priv_data_len
, mpa_hdr_len
, len
);
327 /* make sure it does not exceed the max size */
328 if (len
> MAX_CM_BUFFER
) {
329 nes_debug(NES_DBG_CM
, "The received ietf buffer was too large"
330 " (%x + %x != %x)\n",
331 priv_data_len
, mpa_hdr_len
, len
);
335 cm_node
->mpa_frame_size
= priv_data_len
;
337 switch (mpa_frame
->rev
) {
344 mpa_v2_frame
= (struct ietf_mpa_v2
*)buffer
;
345 mpa_hdr_len
+= IETF_RTR_MSG_SIZE
;
346 cm_node
->mpa_frame_size
-= IETF_RTR_MSG_SIZE
;
347 rtr_msg
= &mpa_v2_frame
->rtr_msg
;
349 /* parse rtr message */
350 rtr_ctrl_ird
= ntohs(rtr_msg
->ctrl_ird
);
351 rtr_ctrl_ord
= ntohs(rtr_msg
->ctrl_ord
);
352 ird_size
= rtr_ctrl_ird
& IETF_NO_IRD_ORD
;
353 ord_size
= rtr_ctrl_ord
& IETF_NO_IRD_ORD
;
355 if (!(rtr_ctrl_ird
& IETF_PEER_TO_PEER
)) {
359 if (ird_size
== IETF_NO_IRD_ORD
|| ord_size
== IETF_NO_IRD_ORD
)
360 cm_node
->mpav2_ird_ord
= IETF_NO_IRD_ORD
;
362 if (cm_node
->mpav2_ird_ord
!= IETF_NO_IRD_ORD
) {
364 if (cm_node
->state
!= NES_CM_STATE_MPAREQ_SENT
) {
365 /* we are still negotiating */
366 if (ord_size
> NES_MAX_IRD
) {
367 cm_node
->ird_size
= NES_MAX_IRD
;
369 cm_node
->ird_size
= ord_size
;
371 (rtr_ctrl_ord
& IETF_RDMA0_READ
)) {
372 cm_node
->ird_size
= 1;
373 nes_debug(NES_DBG_CM
,
374 "%s: Remote peer doesn't support RDMA0_READ (ord=%u)\n",
378 if (ird_size
> NES_MAX_ORD
)
379 cm_node
->ord_size
= NES_MAX_ORD
;
381 cm_node
->ord_size
= ird_size
;
382 } else { /* initiator */
383 if (ord_size
> NES_MAX_IRD
) {
384 nes_debug(NES_DBG_CM
,
385 "%s: Unable to support the requested (ord =%u)\n",
389 cm_node
->ird_size
= ord_size
;
391 if (ird_size
> NES_MAX_ORD
) {
392 cm_node
->ord_size
= NES_MAX_ORD
;
395 (rtr_ctrl_ord
& IETF_RDMA0_READ
)) {
396 nes_debug(NES_DBG_CM
,
397 "%s: Remote peer doesn't support RDMA0_READ (ird=%u)\n",
401 cm_node
->ord_size
= ird_size
;
407 if (rtr_ctrl_ord
& IETF_RDMA0_READ
) {
408 cm_node
->send_rdma0_op
= SEND_RDMA_READ_ZERO
;
410 } else if (rtr_ctrl_ord
& IETF_RDMA0_WRITE
) {
411 cm_node
->send_rdma0_op
= SEND_RDMA_WRITE_ZERO
;
412 } else { /* Not supported RDMA0 operation */
422 /* copy entire MPA frame to our cm_node's frame */
423 memcpy(cm_node
->mpa_frame_buf
, buffer
+ mpa_hdr_len
, cm_node
->mpa_frame_size
);
425 if (mpa_frame
->flags
& IETF_MPA_FLAGS_REJECT
)
426 *type
= NES_MPA_REQUEST_REJECT
;
432 * form_cm_frame - get a free packet and build empty frame Use
433 * node info to build.
435 static void form_cm_frame(struct sk_buff
*skb
,
436 struct nes_cm_node
*cm_node
, void *options
, u32 optionsize
,
437 void *data
, u32 datasize
, u8 flags
)
443 u16 packetsize
= sizeof(*iph
);
445 packetsize
+= sizeof(*tcph
);
446 packetsize
+= optionsize
+ datasize
;
449 memset(skb
->data
, 0x00, ETH_HLEN
+ sizeof(*iph
) + sizeof(*tcph
));
451 buf
= skb_put(skb
, packetsize
+ ETH_HLEN
);
453 ethh
= (struct ethhdr
*)buf
;
456 iph
= (struct iphdr
*)buf
;
458 tcph
= (struct tcphdr
*)buf
;
459 skb_reset_mac_header(skb
);
460 skb_set_network_header(skb
, ETH_HLEN
);
461 skb_set_transport_header(skb
, ETH_HLEN
+ sizeof(*iph
));
462 buf
+= sizeof(*tcph
);
464 skb
->ip_summed
= CHECKSUM_PARTIAL
;
465 if (!(cm_node
->netdev
->features
& NETIF_F_IP_CSUM
))
466 skb
->ip_summed
= CHECKSUM_NONE
;
467 skb
->protocol
= htons(0x800);
469 skb
->mac_len
= ETH_HLEN
;
471 memcpy(ethh
->h_dest
, cm_node
->rem_mac
, ETH_ALEN
);
472 memcpy(ethh
->h_source
, cm_node
->loc_mac
, ETH_ALEN
);
473 ethh
->h_proto
= htons(0x0800);
475 iph
->version
= IPVERSION
;
476 iph
->ihl
= 5; /* 5 * 4Byte words, IP headr len */
478 iph
->tot_len
= htons(packetsize
);
479 iph
->id
= htons(++cm_node
->tcp_cntxt
.loc_id
);
481 iph
->frag_off
= htons(0x4000);
483 iph
->protocol
= 0x06; /* IPPROTO_TCP */
485 iph
->saddr
= htonl(cm_node
->mapped_loc_addr
);
486 iph
->daddr
= htonl(cm_node
->mapped_rem_addr
);
488 tcph
->source
= htons(cm_node
->mapped_loc_port
);
489 tcph
->dest
= htons(cm_node
->mapped_rem_port
);
490 tcph
->seq
= htonl(cm_node
->tcp_cntxt
.loc_seq_num
);
492 if (flags
& SET_ACK
) {
493 cm_node
->tcp_cntxt
.loc_ack_num
= cm_node
->tcp_cntxt
.rcv_nxt
;
494 tcph
->ack_seq
= htonl(cm_node
->tcp_cntxt
.loc_ack_num
);
500 if (flags
& SET_SYN
) {
501 cm_node
->tcp_cntxt
.loc_seq_num
++;
504 cm_node
->tcp_cntxt
.loc_seq_num
+= datasize
;
507 if (flags
& SET_FIN
) {
508 cm_node
->tcp_cntxt
.loc_seq_num
++;
515 tcph
->doff
= (u16
)((sizeof(*tcph
) + optionsize
+ 3) >> 2);
516 tcph
->window
= htons(cm_node
->tcp_cntxt
.rcv_wnd
);
519 memcpy(buf
, options
, optionsize
);
522 memcpy(buf
, data
, datasize
);
524 skb_shinfo(skb
)->nr_frags
= 0;
525 cm_packets_created
++;
529 * nes_create_sockaddr - Record ip addr and tcp port in a sockaddr struct
531 static void nes_create_sockaddr(__be32 ip_addr
, __be16 port
,
532 struct sockaddr_storage
*addr
)
534 struct sockaddr_in
*nes_sockaddr
= (struct sockaddr_in
*)addr
;
535 nes_sockaddr
->sin_family
= AF_INET
;
536 memcpy(&nes_sockaddr
->sin_addr
.s_addr
, &ip_addr
, sizeof(__be32
));
537 nes_sockaddr
->sin_port
= port
;
541 * nes_create_mapinfo - Create a mapinfo object in the port mapper data base
543 static int nes_create_mapinfo(struct nes_cm_info
*cm_info
)
545 struct sockaddr_storage local_sockaddr
;
546 struct sockaddr_storage mapped_sockaddr
;
548 nes_create_sockaddr(htonl(cm_info
->loc_addr
), htons(cm_info
->loc_port
),
550 nes_create_sockaddr(htonl(cm_info
->mapped_loc_addr
),
551 htons(cm_info
->mapped_loc_port
), &mapped_sockaddr
);
553 return iwpm_create_mapinfo(&local_sockaddr
,
554 &mapped_sockaddr
, RDMA_NL_NES
);
558 * nes_remove_mapinfo - Remove a mapinfo object from the port mapper data base
559 * and send a remove mapping op message to
560 * the userspace port mapper
562 static int nes_remove_mapinfo(u32 loc_addr
, u16 loc_port
,
563 u32 mapped_loc_addr
, u16 mapped_loc_port
)
565 struct sockaddr_storage local_sockaddr
;
566 struct sockaddr_storage mapped_sockaddr
;
568 nes_create_sockaddr(htonl(loc_addr
), htons(loc_port
), &local_sockaddr
);
569 nes_create_sockaddr(htonl(mapped_loc_addr
), htons(mapped_loc_port
),
572 iwpm_remove_mapinfo(&local_sockaddr
, &mapped_sockaddr
);
573 return iwpm_remove_mapping(&local_sockaddr
, RDMA_NL_NES
);
577 * nes_form_pm_msg - Form a port mapper message with mapping info
579 static void nes_form_pm_msg(struct nes_cm_info
*cm_info
,
580 struct iwpm_sa_data
*pm_msg
)
582 nes_create_sockaddr(htonl(cm_info
->loc_addr
), htons(cm_info
->loc_port
),
584 nes_create_sockaddr(htonl(cm_info
->rem_addr
), htons(cm_info
->rem_port
),
589 * nes_form_reg_msg - Form a port mapper message with dev info
591 static void nes_form_reg_msg(struct nes_vnic
*nesvnic
,
592 struct iwpm_dev_data
*pm_msg
)
594 memcpy(pm_msg
->dev_name
, nesvnic
->nesibdev
->ibdev
.name
,
596 memcpy(pm_msg
->if_name
, nesvnic
->netdev
->name
, IWPM_IFNAME_SIZE
);
599 static void record_sockaddr_info(struct sockaddr_storage
*addr_info
,
600 nes_addr_t
*ip_addr
, u16
*port_num
)
602 struct sockaddr_in
*in_addr
= (struct sockaddr_in
*)addr_info
;
604 if (in_addr
->sin_family
== AF_INET
) {
605 *ip_addr
= ntohl(in_addr
->sin_addr
.s_addr
);
606 *port_num
= ntohs(in_addr
->sin_port
);
611 * nes_record_pm_msg - Save the received mapping info
613 static void nes_record_pm_msg(struct nes_cm_info
*cm_info
,
614 struct iwpm_sa_data
*pm_msg
)
616 record_sockaddr_info(&pm_msg
->mapped_loc_addr
,
617 &cm_info
->mapped_loc_addr
, &cm_info
->mapped_loc_port
);
619 record_sockaddr_info(&pm_msg
->mapped_rem_addr
,
620 &cm_info
->mapped_rem_addr
, &cm_info
->mapped_rem_port
);
624 * nes_get_remote_addr - Get the address info of the remote connecting peer
626 static int nes_get_remote_addr(struct nes_cm_node
*cm_node
)
628 struct sockaddr_storage mapped_loc_addr
, mapped_rem_addr
;
629 struct sockaddr_storage remote_addr
;
632 nes_create_sockaddr(htonl(cm_node
->mapped_loc_addr
),
633 htons(cm_node
->mapped_loc_port
), &mapped_loc_addr
);
634 nes_create_sockaddr(htonl(cm_node
->mapped_rem_addr
),
635 htons(cm_node
->mapped_rem_port
), &mapped_rem_addr
);
637 ret
= iwpm_get_remote_info(&mapped_loc_addr
, &mapped_rem_addr
,
638 &remote_addr
, RDMA_NL_NES
);
640 nes_debug(NES_DBG_CM
, "Unable to find remote peer address info\n");
642 record_sockaddr_info(&remote_addr
, &cm_node
->rem_addr
,
648 * print_core - dump a cm core
650 static void print_core(struct nes_cm_core
*core
)
652 nes_debug(NES_DBG_CM
, "---------------------------------------------\n");
653 nes_debug(NES_DBG_CM
, "CM Core -- (core = %p )\n", core
);
656 nes_debug(NES_DBG_CM
, "---------------------------------------------\n");
658 nes_debug(NES_DBG_CM
, "State : %u \n", core
->state
);
660 nes_debug(NES_DBG_CM
, "Listen Nodes : %u \n", atomic_read(&core
->listen_node_cnt
));
661 nes_debug(NES_DBG_CM
, "Active Nodes : %u \n", atomic_read(&core
->node_cnt
));
663 nes_debug(NES_DBG_CM
, "core : %p \n", core
);
665 nes_debug(NES_DBG_CM
, "-------------- end core ---------------\n");
668 static void record_ird_ord(struct nes_cm_node
*cm_node
,
669 u16 conn_ird
, u16 conn_ord
)
671 if (conn_ird
> NES_MAX_IRD
)
672 conn_ird
= NES_MAX_IRD
;
674 if (conn_ord
> NES_MAX_ORD
)
675 conn_ord
= NES_MAX_ORD
;
677 cm_node
->ird_size
= conn_ird
;
678 cm_node
->ord_size
= conn_ord
;
682 * cm_build_mpa_frame - build a MPA V1 frame or MPA V2 frame
684 static int cm_build_mpa_frame(struct nes_cm_node
*cm_node
, u8
**start_buff
,
685 u16
*buff_len
, u8
*pci_mem
, u8 mpa_key
)
689 *start_buff
= (pci_mem
) ? pci_mem
: &cm_node
->mpa_frame_buf
[0];
691 switch (cm_node
->mpa_frame_rev
) {
693 *start_buff
= (u8
*)*start_buff
+ sizeof(struct ietf_rtr_msg
);
694 *buff_len
= sizeof(struct ietf_mpa_v1
) + cm_node
->mpa_frame_size
;
695 build_mpa_v1(cm_node
, *start_buff
, mpa_key
);
698 *buff_len
= sizeof(struct ietf_mpa_v2
) + cm_node
->mpa_frame_size
;
699 build_mpa_v2(cm_node
, *start_buff
, mpa_key
);
708 * build_mpa_v2 - build a MPA V2 frame
710 static void build_mpa_v2(struct nes_cm_node
*cm_node
,
711 void *start_addr
, u8 mpa_key
)
713 struct ietf_mpa_v2
*mpa_frame
= (struct ietf_mpa_v2
*)start_addr
;
714 struct ietf_rtr_msg
*rtr_msg
= &mpa_frame
->rtr_msg
;
718 /* initialize the upper 5 bytes of the frame */
719 build_mpa_v1(cm_node
, start_addr
, mpa_key
);
720 mpa_frame
->flags
|= IETF_MPA_V2_FLAG
; /* set a bit to indicate MPA V2 */
721 mpa_frame
->priv_data_len
+= htons(IETF_RTR_MSG_SIZE
);
723 /* initialize RTR msg */
724 if (cm_node
->mpav2_ird_ord
== IETF_NO_IRD_ORD
) {
725 ctrl_ird
= IETF_NO_IRD_ORD
;
726 ctrl_ord
= IETF_NO_IRD_ORD
;
728 ctrl_ird
= cm_node
->ird_size
& IETF_NO_IRD_ORD
;
729 ctrl_ord
= cm_node
->ord_size
& IETF_NO_IRD_ORD
;
731 ctrl_ird
|= IETF_PEER_TO_PEER
;
732 ctrl_ird
|= IETF_FLPDU_ZERO_LEN
;
735 case MPA_KEY_REQUEST
:
736 ctrl_ord
|= IETF_RDMA0_WRITE
;
737 ctrl_ord
|= IETF_RDMA0_READ
;
740 switch (cm_node
->send_rdma0_op
) {
741 case SEND_RDMA_WRITE_ZERO
:
742 ctrl_ord
|= IETF_RDMA0_WRITE
;
744 case SEND_RDMA_READ_ZERO
:
745 ctrl_ord
|= IETF_RDMA0_READ
;
749 rtr_msg
->ctrl_ird
= htons(ctrl_ird
);
750 rtr_msg
->ctrl_ord
= htons(ctrl_ord
);
754 * build_mpa_v1 - build a MPA V1 frame
756 static void build_mpa_v1(struct nes_cm_node
*cm_node
, void *start_addr
, u8 mpa_key
)
758 struct ietf_mpa_v1
*mpa_frame
= (struct ietf_mpa_v1
*)start_addr
;
761 case MPA_KEY_REQUEST
:
762 memcpy(mpa_frame
->key
, IEFT_MPA_KEY_REQ
, IETF_MPA_KEY_SIZE
);
765 memcpy(mpa_frame
->key
, IEFT_MPA_KEY_REP
, IETF_MPA_KEY_SIZE
);
768 mpa_frame
->flags
= IETF_MPA_FLAGS_CRC
;
769 mpa_frame
->rev
= cm_node
->mpa_frame_rev
;
770 mpa_frame
->priv_data_len
= htons(cm_node
->mpa_frame_size
);
773 static void build_rdma0_msg(struct nes_cm_node
*cm_node
, struct nes_qp
**nesqp_addr
)
776 struct nes_qp
*nesqp
= *nesqp_addr
;
777 struct nes_hw_qp_wqe
*wqe
= &nesqp
->hwqp
.sq_vbase
[0];
779 u64temp
= (unsigned long)nesqp
->nesuqp_addr
;
780 u64temp
|= NES_SW_CONTEXT_ALIGN
>> 1;
781 set_wqe_64bit_value(wqe
->wqe_words
, NES_IWARP_SQ_WQE_COMP_CTX_LOW_IDX
, u64temp
);
783 wqe
->wqe_words
[NES_IWARP_SQ_WQE_FRAG0_LOW_IDX
] = 0;
784 wqe
->wqe_words
[NES_IWARP_SQ_WQE_FRAG0_HIGH_IDX
] = 0;
786 switch (cm_node
->send_rdma0_op
) {
787 case SEND_RDMA_WRITE_ZERO
:
788 nes_debug(NES_DBG_CM
, "Sending first write.\n");
789 wqe
->wqe_words
[NES_IWARP_SQ_WQE_MISC_IDX
] =
790 cpu_to_le32(NES_IWARP_SQ_OP_RDMAW
);
791 wqe
->wqe_words
[NES_IWARP_SQ_WQE_TOTAL_PAYLOAD_IDX
] = 0;
792 wqe
->wqe_words
[NES_IWARP_SQ_WQE_LENGTH0_IDX
] = 0;
793 wqe
->wqe_words
[NES_IWARP_SQ_WQE_STAG0_IDX
] = 0;
796 case SEND_RDMA_READ_ZERO
:
798 if (cm_node
->send_rdma0_op
!= SEND_RDMA_READ_ZERO
)
799 WARN(1, "Unsupported RDMA0 len operation=%u\n",
800 cm_node
->send_rdma0_op
);
801 nes_debug(NES_DBG_CM
, "Sending first rdma operation.\n");
802 wqe
->wqe_words
[NES_IWARP_SQ_WQE_MISC_IDX
] =
803 cpu_to_le32(NES_IWARP_SQ_OP_RDMAR
);
804 wqe
->wqe_words
[NES_IWARP_SQ_WQE_RDMA_TO_LOW_IDX
] = 1;
805 wqe
->wqe_words
[NES_IWARP_SQ_WQE_RDMA_TO_HIGH_IDX
] = 0;
806 wqe
->wqe_words
[NES_IWARP_SQ_WQE_RDMA_LENGTH_IDX
] = 0;
807 wqe
->wqe_words
[NES_IWARP_SQ_WQE_RDMA_STAG_IDX
] = 1;
808 wqe
->wqe_words
[NES_IWARP_SQ_WQE_STAG0_IDX
] = 1;
812 if (nesqp
->sq_kmapped
) {
813 nesqp
->sq_kmapped
= 0;
817 /*use the reserved spot on the WQ for the extra first WQE*/
818 nesqp
->nesqp_context
->ird_ord_sizes
&= cpu_to_le32(~(NES_QPCONTEXT_ORDIRD_LSMM_PRESENT
|
819 NES_QPCONTEXT_ORDIRD_WRPDU
|
820 NES_QPCONTEXT_ORDIRD_ALSMM
));
821 nesqp
->skip_lsmm
= 1;
822 nesqp
->hwqp
.sq_tail
= 0;
827 * note - cm_node needs to be protected before calling this. Encase in:
828 * rem_ref_cm_node(cm_core, cm_node);add_ref_cm_node(cm_node);
830 int schedule_nes_timer(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
831 enum nes_timer_type type
, int send_retrans
,
832 int close_when_complete
)
835 struct nes_cm_core
*cm_core
= cm_node
->cm_core
;
836 struct nes_timer_entry
*new_send
;
839 new_send
= kzalloc(sizeof(*new_send
), GFP_ATOMIC
);
843 /* new_send->timetosend = currenttime */
844 new_send
->retrycount
= NES_DEFAULT_RETRYS
;
845 new_send
->retranscount
= NES_DEFAULT_RETRANS
;
847 new_send
->timetosend
= jiffies
;
848 new_send
->type
= type
;
849 new_send
->netdev
= cm_node
->netdev
;
850 new_send
->send_retrans
= send_retrans
;
851 new_send
->close_when_complete
= close_when_complete
;
853 if (type
== NES_TIMER_TYPE_CLOSE
) {
854 new_send
->timetosend
+= (HZ
/ 10);
855 if (cm_node
->recv_entry
) {
860 cm_node
->recv_entry
= new_send
;
863 if (type
== NES_TIMER_TYPE_SEND
) {
864 new_send
->seq_num
= ntohl(tcp_hdr(skb
)->seq
);
865 atomic_inc(&new_send
->skb
->users
);
866 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
867 cm_node
->send_entry
= new_send
;
868 add_ref_cm_node(cm_node
);
869 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
870 new_send
->timetosend
= jiffies
+ NES_RETRY_TIMEOUT
;
872 ret
= nes_nic_cm_xmit(new_send
->skb
, cm_node
->netdev
);
873 if (ret
!= NETDEV_TX_OK
) {
874 nes_debug(NES_DBG_CM
, "Error sending packet %p "
875 "(jiffies = %lu)\n", new_send
, jiffies
);
876 new_send
->timetosend
= jiffies
;
881 cleanup_retrans_entry(cm_node
);
882 if (close_when_complete
)
883 rem_ref_cm_node(cm_core
, cm_node
);
889 if (!timer_pending(&cm_core
->tcp_timer
))
890 mod_timer(&cm_core
->tcp_timer
, new_send
->timetosend
);
895 static void nes_retrans_expired(struct nes_cm_node
*cm_node
)
897 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
898 enum nes_cm_node_state state
= cm_node
->state
;
899 cm_node
->state
= NES_CM_STATE_CLOSED
;
902 case NES_CM_STATE_SYN_RCVD
:
903 case NES_CM_STATE_CLOSING
:
904 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
906 case NES_CM_STATE_LAST_ACK
:
907 case NES_CM_STATE_FIN_WAIT1
:
909 cm_id
->rem_ref(cm_id
);
910 send_reset(cm_node
, NULL
);
913 add_ref_cm_node(cm_node
);
914 send_reset(cm_node
, NULL
);
915 create_event(cm_node
, NES_CM_EVENT_ABORTED
);
919 static void handle_recv_entry(struct nes_cm_node
*cm_node
, u32 rem_node
)
921 struct nes_timer_entry
*recv_entry
= cm_node
->recv_entry
;
922 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
923 struct nes_qp
*nesqp
;
924 unsigned long qplockflags
;
928 nesqp
= (struct nes_qp
*)recv_entry
->skb
;
930 spin_lock_irqsave(&nesqp
->lock
, qplockflags
);
932 nes_debug(NES_DBG_CM
, "QP%u: cm_id = %p, "
933 "refcount = %d: HIT A "
934 "NES_TIMER_TYPE_CLOSE with something "
935 "to do!!!\n", nesqp
->hwqp
.qp_id
, cm_id
,
936 atomic_read(&nesqp
->refcount
));
937 nesqp
->hw_tcp_state
= NES_AEQE_TCP_STATE_CLOSED
;
938 nesqp
->last_aeq
= NES_AEQE_AEID_RESET_SENT
;
939 nesqp
->ibqp_state
= IB_QPS_ERR
;
940 spin_unlock_irqrestore(&nesqp
->lock
, qplockflags
);
941 nes_cm_disconn(nesqp
);
943 spin_unlock_irqrestore(&nesqp
->lock
, qplockflags
);
944 nes_debug(NES_DBG_CM
, "QP%u: cm_id = %p, "
945 "refcount = %d: HIT A "
946 "NES_TIMER_TYPE_CLOSE with nothing "
947 "to do!!!\n", nesqp
->hwqp
.qp_id
, cm_id
,
948 atomic_read(&nesqp
->refcount
));
950 } else if (rem_node
) {
951 /* TIME_WAIT state */
952 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
955 cm_id
->rem_ref(cm_id
);
957 cm_node
->recv_entry
= NULL
;
963 static void nes_cm_timer_tick(unsigned long pass
)
966 unsigned long nexttimeout
= jiffies
+ NES_LONG_TIME
;
967 struct nes_cm_node
*cm_node
;
968 struct nes_timer_entry
*send_entry
, *recv_entry
;
969 struct list_head
*list_core_temp
;
970 struct list_head
*list_node
;
971 struct nes_cm_core
*cm_core
= g_cm_core
;
973 unsigned long timetosend
;
974 int ret
= NETDEV_TX_OK
;
976 struct list_head timer_list
;
978 INIT_LIST_HEAD(&timer_list
);
979 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
981 list_for_each_safe(list_node
, list_core_temp
,
982 &cm_core
->connected_nodes
) {
983 cm_node
= container_of(list_node
, struct nes_cm_node
, list
);
984 if ((cm_node
->recv_entry
) || (cm_node
->send_entry
)) {
985 add_ref_cm_node(cm_node
);
986 list_add(&cm_node
->timer_entry
, &timer_list
);
989 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
991 list_for_each_safe(list_node
, list_core_temp
, &timer_list
) {
992 cm_node
= container_of(list_node
, struct nes_cm_node
,
994 recv_entry
= cm_node
->recv_entry
;
997 if (time_after(recv_entry
->timetosend
, jiffies
)) {
998 if (nexttimeout
> recv_entry
->timetosend
||
1000 nexttimeout
= recv_entry
->timetosend
;
1004 handle_recv_entry(cm_node
, 1);
1008 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1010 send_entry
= cm_node
->send_entry
;
1013 if (time_after(send_entry
->timetosend
, jiffies
)) {
1014 if (cm_node
->state
!= NES_CM_STATE_TSA
) {
1016 send_entry
->timetosend
) ||
1019 send_entry
->timetosend
;
1023 free_retrans_entry(cm_node
);
1028 if ((cm_node
->state
== NES_CM_STATE_TSA
) ||
1029 (cm_node
->state
== NES_CM_STATE_CLOSED
)) {
1030 free_retrans_entry(cm_node
);
1034 if (!send_entry
->retranscount
||
1035 !send_entry
->retrycount
) {
1036 cm_packets_dropped
++;
1037 free_retrans_entry(cm_node
);
1039 spin_unlock_irqrestore(
1040 &cm_node
->retrans_list_lock
, flags
);
1041 nes_retrans_expired(cm_node
);
1042 cm_node
->state
= NES_CM_STATE_CLOSED
;
1043 spin_lock_irqsave(&cm_node
->retrans_list_lock
,
1047 atomic_inc(&send_entry
->skb
->users
);
1048 cm_packets_retrans
++;
1049 nes_debug(NES_DBG_CM
, "Retransmitting send_entry %p "
1050 "for node %p, jiffies = %lu, time to send = "
1051 "%lu, retranscount = %u, send_entry->seq_num = "
1052 "0x%08X, cm_node->tcp_cntxt.rem_ack_num = "
1053 "0x%08X\n", send_entry
, cm_node
, jiffies
,
1054 send_entry
->timetosend
,
1055 send_entry
->retranscount
,
1056 send_entry
->seq_num
,
1057 cm_node
->tcp_cntxt
.rem_ack_num
);
1059 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
,
1061 ret
= nes_nic_cm_xmit(send_entry
->skb
, cm_node
->netdev
);
1062 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1063 if (ret
!= NETDEV_TX_OK
) {
1064 nes_debug(NES_DBG_CM
, "rexmit failed for "
1065 "node=%p\n", cm_node
);
1066 cm_packets_bounced
++;
1067 send_entry
->retrycount
--;
1068 nexttimeout
= jiffies
+ NES_SHORT_TIME
;
1074 nes_debug(NES_DBG_CM
, "Packet Sent: retrans count = "
1075 "%u, retry count = %u.\n",
1076 send_entry
->retranscount
,
1077 send_entry
->retrycount
);
1078 if (send_entry
->send_retrans
) {
1079 send_entry
->retranscount
--;
1080 timetosend
= (NES_RETRY_TIMEOUT
<<
1081 (NES_DEFAULT_RETRANS
- send_entry
->retranscount
));
1083 send_entry
->timetosend
= jiffies
+
1084 min(timetosend
, NES_MAX_TIMEOUT
);
1085 if (nexttimeout
> send_entry
->timetosend
||
1087 nexttimeout
= send_entry
->timetosend
;
1091 int close_when_complete
;
1092 close_when_complete
=
1093 send_entry
->close_when_complete
;
1094 nes_debug(NES_DBG_CM
, "cm_node=%p state=%d\n",
1095 cm_node
, cm_node
->state
);
1096 free_retrans_entry(cm_node
);
1097 if (close_when_complete
)
1098 rem_ref_cm_node(cm_node
->cm_core
,
1103 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
1104 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
1108 if (!timer_pending(&cm_core
->tcp_timer
))
1109 mod_timer(&cm_core
->tcp_timer
, nexttimeout
);
1117 static int send_syn(struct nes_cm_node
*cm_node
, u32 sendack
,
1118 struct sk_buff
*skb
)
1121 int flags
= SET_SYN
;
1122 char optionsbuffer
[sizeof(struct option_mss
) +
1123 sizeof(struct option_windowscale
) + sizeof(struct option_base
) +
1124 TCP_OPTIONS_PADDING
];
1126 int optionssize
= 0;
1127 /* Sending MSS option */
1128 union all_known_options
*options
;
1133 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1134 options
->as_mss
.optionnum
= OPTION_NUMBER_MSS
;
1135 options
->as_mss
.length
= sizeof(struct option_mss
);
1136 options
->as_mss
.mss
= htons(cm_node
->tcp_cntxt
.mss
);
1137 optionssize
+= sizeof(struct option_mss
);
1139 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1140 options
->as_windowscale
.optionnum
= OPTION_NUMBER_WINDOW_SCALE
;
1141 options
->as_windowscale
.length
= sizeof(struct option_windowscale
);
1142 options
->as_windowscale
.shiftcount
= cm_node
->tcp_cntxt
.rcv_wscale
;
1143 optionssize
+= sizeof(struct option_windowscale
);
1145 if (sendack
&& !(NES_DRV_OPT_SUPRESS_OPTION_BC
& nes_drv_opt
)) {
1146 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1147 options
->as_base
.optionnum
= OPTION_NUMBER_WRITE0
;
1148 options
->as_base
.length
= sizeof(struct option_base
);
1149 optionssize
+= sizeof(struct option_base
);
1150 /* we need the size to be a multiple of 4 */
1151 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1152 options
->as_end
= 1;
1154 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1155 options
->as_end
= 1;
1159 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1160 options
->as_end
= OPTION_NUMBER_END
;
1164 skb
= dev_alloc_skb(MAX_CM_BUFFER
);
1166 nes_debug(NES_DBG_CM
, "Failed to get a Free pkt\n");
1173 form_cm_frame(skb
, cm_node
, optionsbuffer
, optionssize
, NULL
, 0, flags
);
1174 ret
= schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 1, 0);
1183 static int send_reset(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
1186 int flags
= SET_RST
| SET_ACK
;
1189 skb
= dev_alloc_skb(MAX_CM_BUFFER
);
1191 nes_debug(NES_DBG_CM
, "Failed to get a Free pkt\n");
1195 form_cm_frame(skb
, cm_node
, NULL
, 0, NULL
, 0, flags
);
1196 ret
= schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 0, 1);
1205 static int send_ack(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
1210 skb
= dev_alloc_skb(MAX_CM_BUFFER
);
1213 nes_debug(NES_DBG_CM
, "Failed to get a Free pkt\n");
1217 form_cm_frame(skb
, cm_node
, NULL
, 0, NULL
, 0, SET_ACK
);
1218 ret
= schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 0, 0);
1227 static int send_fin(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
1231 /* if we didn't get a frame get one */
1233 skb
= dev_alloc_skb(MAX_CM_BUFFER
);
1236 nes_debug(NES_DBG_CM
, "Failed to get a Free pkt\n");
1240 form_cm_frame(skb
, cm_node
, NULL
, 0, NULL
, 0, SET_ACK
| SET_FIN
);
1241 ret
= schedule_nes_timer(cm_node
, skb
, NES_TIMER_TYPE_SEND
, 1, 0);
1248 * find_node - find a cm node that matches the reference cm node
1250 static struct nes_cm_node
*find_node(struct nes_cm_core
*cm_core
,
1251 u16 rem_port
, nes_addr_t rem_addr
, u16 loc_port
, nes_addr_t loc_addr
)
1253 unsigned long flags
;
1254 struct list_head
*hte
;
1255 struct nes_cm_node
*cm_node
;
1257 /* get a handle on the hte */
1258 hte
= &cm_core
->connected_nodes
;
1260 /* walk the connected-node list and find the cm_node whose mapped address/port quad matches */
1261 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1262 list_for_each_entry(cm_node
, hte
, list
) {
1263 /* compare quad, return node handle if a match */
1264 nes_debug(NES_DBG_CM
, "finding node %x:%x =? %x:%x ^ %x:%x =? %x:%x\n",
1265 cm_node
->loc_addr
, cm_node
->loc_port
,
1267 cm_node
->rem_addr
, cm_node
->rem_port
,
1268 rem_addr
, rem_port
);
1269 if ((cm_node
->mapped_loc_addr
== loc_addr
) &&
1270 (cm_node
->mapped_loc_port
== loc_port
) &&
1271 (cm_node
->mapped_rem_addr
== rem_addr
) &&
1272 (cm_node
->mapped_rem_port
== rem_port
)) {
1274 add_ref_cm_node(cm_node
);
1275 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1279 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1287 * find_listener - find a cm node listening on this addr-port pair
1289 static struct nes_cm_listener
*find_listener(struct nes_cm_core
*cm_core
,
1290 nes_addr_t dst_addr
, u16 dst_port
,
1291 enum nes_cm_listener_state listener_state
, int local
)
1293 unsigned long flags
;
1294 struct nes_cm_listener
*listen_node
;
1295 nes_addr_t listen_addr
;
1298 /* walk the listen list and find a listener matching this addr-port pair and state */
1299 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
1300 list_for_each_entry(listen_node
, &cm_core
->listen_list
.list
, list
) {
1302 listen_addr
= listen_node
->loc_addr
;
1303 listen_port
= listen_node
->loc_port
;
1305 listen_addr
= listen_node
->mapped_loc_addr
;
1306 listen_port
= listen_node
->mapped_loc_port
;
1308 /* compare node pair, return node handle if a match */
1309 if (((listen_addr
== dst_addr
) ||
1310 listen_addr
== 0x00000000) &&
1311 (listen_port
== dst_port
) &&
1312 (listener_state
& listen_node
->listener_state
)) {
1313 atomic_inc(&listen_node
->ref_count
);
1314 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1318 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1325 * add_hte_node - add a cm node to the hash table
1327 static int add_hte_node(struct nes_cm_core
*cm_core
, struct nes_cm_node
*cm_node
)
1329 unsigned long flags
;
1330 struct list_head
*hte
;
1332 if (!cm_node
|| !cm_core
)
1335 nes_debug(NES_DBG_CM
, "Adding Node %p to Active Connection HT\n",
1338 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1340 /* get a handle on the hash table element (list head for this slot) */
1341 hte
= &cm_core
->connected_nodes
;
1342 list_add_tail(&cm_node
->list
, hte
);
1343 atomic_inc(&cm_core
->ht_node_cnt
);
1345 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1352 * mini_cm_dec_refcnt_listen
1354 static int mini_cm_dec_refcnt_listen(struct nes_cm_core
*cm_core
,
1355 struct nes_cm_listener
*listener
, int free_hanging_nodes
)
1359 unsigned long flags
;
1360 struct list_head
*list_pos
= NULL
;
1361 struct list_head
*list_temp
= NULL
;
1362 struct nes_cm_node
*cm_node
= NULL
;
1363 struct list_head reset_list
;
1365 nes_debug(NES_DBG_CM
, "attempting listener= %p free_nodes= %d, "
1366 "refcnt=%d\n", listener
, free_hanging_nodes
,
1367 atomic_read(&listener
->ref_count
));
1368 /* free non-accelerated child nodes for this listener */
1369 INIT_LIST_HEAD(&reset_list
);
1370 if (free_hanging_nodes
) {
1371 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1372 list_for_each_safe(list_pos
, list_temp
,
1373 &g_cm_core
->connected_nodes
) {
1374 cm_node
= container_of(list_pos
, struct nes_cm_node
,
1376 if ((cm_node
->listener
== listener
) &&
1377 (!cm_node
->accelerated
)) {
1378 add_ref_cm_node(cm_node
);
1379 list_add(&cm_node
->reset_entry
, &reset_list
);
1382 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1385 list_for_each_safe(list_pos
, list_temp
, &reset_list
) {
1386 cm_node
= container_of(list_pos
, struct nes_cm_node
,
1389 struct nes_cm_node
*loopback
= cm_node
->loopbackpartner
;
1390 enum nes_cm_node_state old_state
;
1391 if (NES_CM_STATE_FIN_WAIT1
<= cm_node
->state
) {
1392 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
1395 cleanup_retrans_entry(cm_node
);
1396 err
= send_reset(cm_node
, NULL
);
1399 NES_CM_STATE_CLOSED
;
1402 old_state
= cm_node
->state
;
1403 cm_node
->state
= NES_CM_STATE_LISTENER_DESTROYED
;
1404 if (old_state
!= NES_CM_STATE_MPAREQ_RCVD
)
1410 struct nes_cm_event event
;
1412 event
.cm_node
= loopback
;
1413 event
.cm_info
.rem_addr
=
1415 event
.cm_info
.loc_addr
=
1417 event
.cm_info
.rem_port
=
1419 event
.cm_info
.loc_port
=
1421 event
.cm_info
.cm_id
= loopback
->cm_id
;
1422 add_ref_cm_node(loopback
);
1423 loopback
->state
= NES_CM_STATE_CLOSED
;
1424 cm_event_connect_error(&event
);
1425 cm_node
->state
= NES_CM_STATE_LISTENER_DESTROYED
;
1427 rem_ref_cm_node(cm_node
->cm_core
,
1435 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
1436 if (!atomic_dec_return(&listener
->ref_count
)) {
1437 list_del(&listener
->list
);
1439 /* decrement our listen node count */
1440 atomic_dec(&cm_core
->listen_node_cnt
);
1442 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1444 if (listener
->nesvnic
) {
1445 nes_manage_apbvt(listener
->nesvnic
,
1446 listener
->mapped_loc_port
,
1447 PCI_FUNC(listener
->nesvnic
->nesdev
->pcidev
->devfn
),
1448 NES_MANAGE_APBVT_DEL
);
1450 nes_remove_mapinfo(listener
->loc_addr
,
1452 listener
->mapped_loc_addr
,
1453 listener
->mapped_loc_port
);
1454 nes_debug(NES_DBG_NLMSG
,
1455 "Delete APBVT mapped_loc_port = %04X\n",
1456 listener
->mapped_loc_port
);
1459 nes_debug(NES_DBG_CM
, "destroying listener (%p)\n", listener
);
1464 atomic_inc(&cm_listens_destroyed
);
1466 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1469 if (atomic_read(&listener
->pend_accepts_cnt
) > 0)
1470 nes_debug(NES_DBG_CM
, "destroying listener (%p)"
1471 " with non-zero pending accepts=%u\n",
1472 listener
, atomic_read(&listener
->pend_accepts_cnt
));
1480 * mini_cm_del_listen
1482 static int mini_cm_del_listen(struct nes_cm_core
*cm_core
,
1483 struct nes_cm_listener
*listener
)
1485 listener
->listener_state
= NES_CM_LISTENER_PASSIVE_STATE
;
1486 listener
->cm_id
= NULL
; /* going to be destroyed pretty soon */
1487 return mini_cm_dec_refcnt_listen(cm_core
, listener
, 1);
1492 * mini_cm_accelerated
1494 static inline int mini_cm_accelerated(struct nes_cm_core
*cm_core
,
1495 struct nes_cm_node
*cm_node
)
1497 cm_node
->accelerated
= 1;
1499 if (cm_node
->accept_pend
) {
1500 BUG_ON(!cm_node
->listener
);
1501 atomic_dec(&cm_node
->listener
->pend_accepts_cnt
);
1502 cm_node
->accept_pend
= 0;
1503 BUG_ON(atomic_read(&cm_node
->listener
->pend_accepts_cnt
) < 0);
1506 if (!timer_pending(&cm_core
->tcp_timer
))
1507 mod_timer(&cm_core
->tcp_timer
, (jiffies
+ NES_SHORT_TIME
));
1514 * nes_addr_resolve_neigh
1516 static int nes_addr_resolve_neigh(struct nes_vnic
*nesvnic
, u32 dst_ip
, int arpindex
)
1519 struct neighbour
*neigh
;
1521 struct net_device
*netdev
;
1522 struct nes_adapter
*nesadapter
= nesvnic
->nesdev
->nesadapter
;
1523 __be32 dst_ipaddr
= htonl(dst_ip
);
1525 rt
= ip_route_output(&init_net
, dst_ipaddr
, nesvnic
->local_ipaddr
, 0, 0);
1527 printk(KERN_ERR
"%s: ip_route_output_key failed for 0x%08X\n",
1532 if (netif_is_bond_slave(nesvnic
->netdev
))
1533 netdev
= netdev_master_upper_dev_get(nesvnic
->netdev
);
1535 netdev
= nesvnic
->netdev
;
1537 neigh
= dst_neigh_lookup(&rt
->dst
, &dst_ipaddr
);
1541 if (neigh
->nud_state
& NUD_VALID
) {
1542 nes_debug(NES_DBG_CM
, "Neighbor MAC address for 0x%08X"
1543 " is %pM, Gateway is 0x%08X \n", dst_ip
,
1544 neigh
->ha
, ntohl(rt
->rt_gateway
));
1546 if (arpindex
>= 0) {
1547 if (ether_addr_equal(nesadapter
->arp_table
[arpindex
].mac_addr
, neigh
->ha
)) {
1548 /* Mac address same as in nes_arp_table */
1552 nes_manage_arp_cache(nesvnic
->netdev
,
1553 nesadapter
->arp_table
[arpindex
].mac_addr
,
1554 dst_ip
, NES_ARP_DELETE
);
1557 nes_manage_arp_cache(nesvnic
->netdev
, neigh
->ha
,
1558 dst_ip
, NES_ARP_ADD
);
1559 rc
= nes_arp_table(nesvnic
->nesdev
, dst_ip
, NULL
,
1562 neigh_event_send(neigh
, NULL
);
1569 neigh_release(neigh
);
1576 * make_cm_node - create a new instance of a cm node
1578 static struct nes_cm_node
*make_cm_node(struct nes_cm_core
*cm_core
,
1579 struct nes_vnic
*nesvnic
, struct nes_cm_info
*cm_info
,
1580 struct nes_cm_listener
*listener
)
1582 struct nes_cm_node
*cm_node
;
1584 int oldarpindex
= 0;
1586 struct nes_device
*nesdev
;
1587 struct nes_adapter
*nesadapter
;
1589 /* create an hte and cm_node for this instance */
1590 cm_node
= kzalloc(sizeof(*cm_node
), GFP_ATOMIC
);
1594 /* set our node specific transport info */
1596 cm_node
->loc_addr
= listener
->loc_addr
;
1597 cm_node
->loc_port
= listener
->loc_port
;
1599 cm_node
->loc_addr
= cm_info
->loc_addr
;
1600 cm_node
->loc_port
= cm_info
->loc_port
;
1602 cm_node
->rem_addr
= cm_info
->rem_addr
;
1603 cm_node
->rem_port
= cm_info
->rem_port
;
1605 cm_node
->mapped_loc_addr
= cm_info
->mapped_loc_addr
;
1606 cm_node
->mapped_rem_addr
= cm_info
->mapped_rem_addr
;
1607 cm_node
->mapped_loc_port
= cm_info
->mapped_loc_port
;
1608 cm_node
->mapped_rem_port
= cm_info
->mapped_rem_port
;
1610 cm_node
->mpa_frame_rev
= mpa_version
;
1611 cm_node
->send_rdma0_op
= SEND_RDMA_READ_ZERO
;
1612 cm_node
->mpav2_ird_ord
= 0;
1613 cm_node
->ird_size
= 0;
1614 cm_node
->ord_size
= 0;
1616 nes_debug(NES_DBG_CM
, "Make node addresses : loc = %pI4:%x, rem = %pI4:%x\n",
1617 &cm_node
->loc_addr
, cm_node
->loc_port
,
1618 &cm_node
->rem_addr
, cm_node
->rem_port
);
1619 cm_node
->listener
= listener
;
1621 cm_node
->tos
= listener
->tos
;
1622 cm_node
->netdev
= nesvnic
->netdev
;
1623 cm_node
->cm_id
= cm_info
->cm_id
;
1624 memcpy(cm_node
->loc_mac
, nesvnic
->netdev
->dev_addr
, ETH_ALEN
);
1626 nes_debug(NES_DBG_CM
, "listener=%p, cm_id=%p\n", cm_node
->listener
,
1629 spin_lock_init(&cm_node
->retrans_list_lock
);
1631 cm_node
->loopbackpartner
= NULL
;
1632 atomic_set(&cm_node
->ref_count
, 1);
1633 /* associate our parent CM core */
1634 cm_node
->cm_core
= cm_core
;
1635 cm_node
->tcp_cntxt
.loc_id
= NES_CM_DEF_LOCAL_ID
;
1636 cm_node
->tcp_cntxt
.rcv_wscale
= NES_CM_DEFAULT_RCV_WND_SCALE
;
1637 cm_node
->tcp_cntxt
.rcv_wnd
= NES_CM_DEFAULT_RCV_WND_SCALED
>>
1638 NES_CM_DEFAULT_RCV_WND_SCALE
;
1639 ts
= current_kernel_time();
1640 cm_node
->tcp_cntxt
.loc_seq_num
= htonl(ts
.tv_nsec
);
1641 cm_node
->tcp_cntxt
.mss
= nesvnic
->max_frame_size
- sizeof(struct iphdr
) -
1642 sizeof(struct tcphdr
) - ETH_HLEN
- VLAN_HLEN
;
1643 cm_node
->tcp_cntxt
.rcv_nxt
= 0;
1644 /* get a unique session ID , add thread_id to an upcounter to handle race */
1645 atomic_inc(&cm_core
->node_cnt
);
1646 cm_node
->conn_type
= cm_info
->conn_type
;
1647 cm_node
->apbvt_set
= 0;
1648 cm_node
->accept_pend
= 0;
1650 cm_node
->nesvnic
= nesvnic
;
1651 /* get some device handles, for arp lookup */
1652 nesdev
= nesvnic
->nesdev
;
1653 nesadapter
= nesdev
->nesadapter
;
1655 cm_node
->loopbackpartner
= NULL
;
1657 /* get the mac addr for the remote node */
1658 oldarpindex
= nes_arp_table(nesdev
, cm_node
->mapped_rem_addr
,
1659 NULL
, NES_ARP_RESOLVE
);
1660 arpindex
= nes_addr_resolve_neigh(nesvnic
,
1661 cm_node
->mapped_rem_addr
, oldarpindex
);
1667 /* copy the mac addr to node context */
1668 memcpy(cm_node
->rem_mac
, nesadapter
->arp_table
[arpindex
].mac_addr
, ETH_ALEN
);
1669 nes_debug(NES_DBG_CM
, "Remote mac addr from arp table: %pM\n",
1672 add_hte_node(cm_core
, cm_node
);
1673 atomic_inc(&cm_nodes_created
);
1680 * add_ref_cm_node - take a reference on a cm node
1682 static int add_ref_cm_node(struct nes_cm_node
*cm_node
)
1684 atomic_inc(&cm_node
->ref_count
);
1690 * rem_ref_cm_node - drop a reference on a cm node; destroy the node when the count reaches zero
1692 static int rem_ref_cm_node(struct nes_cm_core
*cm_core
,
1693 struct nes_cm_node
*cm_node
)
1695 unsigned long flags
;
1696 struct nes_qp
*nesqp
;
1701 spin_lock_irqsave(&cm_node
->cm_core
->ht_lock
, flags
);
1702 if (atomic_dec_return(&cm_node
->ref_count
)) {
1703 spin_unlock_irqrestore(&cm_node
->cm_core
->ht_lock
, flags
);
1706 list_del(&cm_node
->list
);
1707 atomic_dec(&cm_core
->ht_node_cnt
);
1708 spin_unlock_irqrestore(&cm_node
->cm_core
->ht_lock
, flags
);
1710 /* if the node is destroyed before connection was accelerated */
1711 if (!cm_node
->accelerated
&& cm_node
->accept_pend
) {
1712 BUG_ON(!cm_node
->listener
);
1713 atomic_dec(&cm_node
->listener
->pend_accepts_cnt
);
1714 BUG_ON(atomic_read(&cm_node
->listener
->pend_accepts_cnt
) < 0);
1716 WARN_ON(cm_node
->send_entry
);
1717 if (cm_node
->recv_entry
)
1718 handle_recv_entry(cm_node
, 0);
1719 if (cm_node
->listener
) {
1720 mini_cm_dec_refcnt_listen(cm_core
, cm_node
->listener
, 0);
1722 if (cm_node
->apbvt_set
&& cm_node
->nesvnic
) {
1723 nes_manage_apbvt(cm_node
->nesvnic
, cm_node
->mapped_loc_port
,
1724 PCI_FUNC(cm_node
->nesvnic
->nesdev
->pcidev
->devfn
),
1725 NES_MANAGE_APBVT_DEL
);
1727 nes_debug(NES_DBG_NLMSG
, "Delete APBVT mapped_loc_port = %04X\n",
1728 cm_node
->mapped_loc_port
);
1729 nes_remove_mapinfo(cm_node
->loc_addr
, cm_node
->loc_port
,
1730 cm_node
->mapped_loc_addr
, cm_node
->mapped_loc_port
);
1733 atomic_dec(&cm_core
->node_cnt
);
1734 atomic_inc(&cm_nodes_destroyed
);
1735 nesqp
= cm_node
->nesqp
;
1737 nesqp
->cm_node
= NULL
;
1738 nes_rem_ref(&nesqp
->ibqp
);
1739 cm_node
->nesqp
= NULL
;
1749 static int process_options(struct nes_cm_node
*cm_node
, u8
*optionsloc
,
1750 u32 optionsize
, u32 syn_packet
)
1754 union all_known_options
*all_options
;
1755 char got_mss_option
= 0;
1757 while (offset
< optionsize
) {
1758 all_options
= (union all_known_options
*)(optionsloc
+ offset
);
1759 switch (all_options
->as_base
.optionnum
) {
1760 case OPTION_NUMBER_END
:
1761 offset
= optionsize
;
1763 case OPTION_NUMBER_NONE
:
1766 case OPTION_NUMBER_MSS
:
1767 nes_debug(NES_DBG_CM
, "%s: MSS Length: %d Offset: %d "
1768 "Size: %d\n", __func__
,
1769 all_options
->as_mss
.length
, offset
, optionsize
);
1771 if (all_options
->as_mss
.length
!= 4) {
1774 tmp
= ntohs(all_options
->as_mss
.mss
);
1775 if (tmp
> 0 && tmp
<
1776 cm_node
->tcp_cntxt
.mss
)
1777 cm_node
->tcp_cntxt
.mss
= tmp
;
1780 case OPTION_NUMBER_WINDOW_SCALE
:
1781 cm_node
->tcp_cntxt
.snd_wscale
=
1782 all_options
->as_windowscale
.shiftcount
;
1785 nes_debug(NES_DBG_CM
, "TCP Option not understood: %x\n",
1786 all_options
->as_base
.optionnum
);
1789 offset
+= all_options
->as_base
.length
;
1791 if ((!got_mss_option
) && (syn_packet
))
1792 cm_node
->tcp_cntxt
.mss
= NES_CM_DEFAULT_MSS
;
1796 static void drop_packet(struct sk_buff
*skb
)
1798 atomic_inc(&cm_accel_dropped_pkts
);
1799 dev_kfree_skb_any(skb
);
1802 static void handle_fin_pkt(struct nes_cm_node
*cm_node
)
1804 nes_debug(NES_DBG_CM
, "Received FIN, cm_node = %p, state = %u. "
1805 "refcnt=%d\n", cm_node
, cm_node
->state
,
1806 atomic_read(&cm_node
->ref_count
));
1807 switch (cm_node
->state
) {
1808 case NES_CM_STATE_SYN_RCVD
:
1809 case NES_CM_STATE_SYN_SENT
:
1810 case NES_CM_STATE_ESTABLISHED
:
1811 case NES_CM_STATE_MPAREJ_RCVD
:
1812 cm_node
->tcp_cntxt
.rcv_nxt
++;
1813 cleanup_retrans_entry(cm_node
);
1814 cm_node
->state
= NES_CM_STATE_LAST_ACK
;
1815 send_fin(cm_node
, NULL
);
1817 case NES_CM_STATE_MPAREQ_SENT
:
1818 create_event(cm_node
, NES_CM_EVENT_ABORTED
);
1819 cm_node
->tcp_cntxt
.rcv_nxt
++;
1820 cleanup_retrans_entry(cm_node
);
1821 cm_node
->state
= NES_CM_STATE_CLOSED
;
1822 add_ref_cm_node(cm_node
);
1823 send_reset(cm_node
, NULL
);
1825 case NES_CM_STATE_FIN_WAIT1
:
1826 cm_node
->tcp_cntxt
.rcv_nxt
++;
1827 cleanup_retrans_entry(cm_node
);
1828 cm_node
->state
= NES_CM_STATE_CLOSING
;
1829 send_ack(cm_node
, NULL
);
1830 /* Wait for the ACK, as this is a simultaneous close.
1831 * After we receive the ACK, do not send anything;
1832 * just remove the node. */
1834 case NES_CM_STATE_FIN_WAIT2
:
1835 cm_node
->tcp_cntxt
.rcv_nxt
++;
1836 cleanup_retrans_entry(cm_node
);
1837 cm_node
->state
= NES_CM_STATE_TIME_WAIT
;
1838 send_ack(cm_node
, NULL
);
1839 schedule_nes_timer(cm_node
, NULL
, NES_TIMER_TYPE_CLOSE
, 1, 0);
1841 case NES_CM_STATE_TIME_WAIT
:
1842 cm_node
->tcp_cntxt
.rcv_nxt
++;
1843 cleanup_retrans_entry(cm_node
);
1844 cm_node
->state
= NES_CM_STATE_CLOSED
;
1845 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
1847 case NES_CM_STATE_TSA
:
1849 nes_debug(NES_DBG_CM
, "Error Rcvd FIN for node-%p state = %d\n",
1850 cm_node
, cm_node
->state
);
1856 static void handle_rst_pkt(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
1857 struct tcphdr
*tcph
)
1860 int reset
= 0; /* whether to send reset in case of err.. */
1861 atomic_inc(&cm_resets_recvd
);
1862 nes_debug(NES_DBG_CM
, "Received Reset, cm_node = %p, state = %u."
1863 " refcnt=%d\n", cm_node
, cm_node
->state
,
1864 atomic_read(&cm_node
->ref_count
));
1865 cleanup_retrans_entry(cm_node
);
1866 switch (cm_node
->state
) {
1867 case NES_CM_STATE_SYN_SENT
:
1868 case NES_CM_STATE_MPAREQ_SENT
:
1869 nes_debug(NES_DBG_CM
, "%s[%u] create abort for cm_node=%p "
1870 "listener=%p state=%d\n", __func__
, __LINE__
, cm_node
,
1871 cm_node
->listener
, cm_node
->state
);
1872 switch (cm_node
->mpa_frame_rev
) {
1874 cm_node
->mpa_frame_rev
= IETF_MPA_V1
;
1875 /* send a syn and goto syn sent state */
1876 cm_node
->state
= NES_CM_STATE_SYN_SENT
;
1877 if (send_syn(cm_node
, 0, NULL
)) {
1878 active_open_err(cm_node
, skb
, reset
);
1883 active_open_err(cm_node
, skb
, reset
);
1887 case NES_CM_STATE_MPAREQ_RCVD
:
1888 atomic_inc(&cm_node
->passive_state
);
1889 dev_kfree_skb_any(skb
);
1891 case NES_CM_STATE_ESTABLISHED
:
1892 case NES_CM_STATE_SYN_RCVD
:
1893 case NES_CM_STATE_LISTENING
:
1894 nes_debug(NES_DBG_CM
, "Bad state %s[%u]\n", __func__
, __LINE__
);
1895 passive_open_err(cm_node
, skb
, reset
);
1897 case NES_CM_STATE_TSA
:
1898 active_open_err(cm_node
, skb
, reset
);
1900 case NES_CM_STATE_CLOSED
:
1903 case NES_CM_STATE_FIN_WAIT2
:
1904 case NES_CM_STATE_FIN_WAIT1
:
1905 case NES_CM_STATE_LAST_ACK
:
1906 cm_node
->cm_id
->rem_ref(cm_node
->cm_id
);
1907 case NES_CM_STATE_TIME_WAIT
:
1908 cm_node
->state
= NES_CM_STATE_CLOSED
;
1909 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
1919 static void handle_rcv_mpa(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
1922 int datasize
= skb
->len
;
1923 u8
*dataloc
= skb
->data
;
1925 enum nes_cm_event_type type
= NES_CM_EVENT_UNKNOWN
;
1928 ret
= parse_mpa(cm_node
, dataloc
, &res_type
, datasize
);
1930 nes_debug(NES_DBG_CM
, "didn't like MPA Request\n");
1931 if (cm_node
->state
== NES_CM_STATE_MPAREQ_SENT
) {
1932 nes_debug(NES_DBG_CM
, "%s[%u] create abort for "
1933 "cm_node=%p listener=%p state=%d\n", __func__
,
1934 __LINE__
, cm_node
, cm_node
->listener
,
1936 active_open_err(cm_node
, skb
, 1);
1938 passive_open_err(cm_node
, skb
, 1);
1943 switch (cm_node
->state
) {
1944 case NES_CM_STATE_ESTABLISHED
:
1945 if (res_type
== NES_MPA_REQUEST_REJECT
)
1946 /* BIG problem: we are receiving the MPA here, so it should
1947 * not be a REJECT. This is a passive open; a Reject can
1948 * only be received on an active open. */
1950 cm_node
->state
= NES_CM_STATE_MPAREQ_RCVD
;
1951 type
= NES_CM_EVENT_MPA_REQ
;
1952 atomic_set(&cm_node
->passive_state
,
1953 NES_PASSIVE_STATE_INDICATED
);
1955 case NES_CM_STATE_MPAREQ_SENT
:
1956 cleanup_retrans_entry(cm_node
);
1957 if (res_type
== NES_MPA_REQUEST_REJECT
) {
1958 type
= NES_CM_EVENT_MPA_REJECT
;
1959 cm_node
->state
= NES_CM_STATE_MPAREJ_RCVD
;
1961 type
= NES_CM_EVENT_CONNECTED
;
1962 cm_node
->state
= NES_CM_STATE_TSA
;
1970 dev_kfree_skb_any(skb
);
1971 create_event(cm_node
, type
);
1974 static void indicate_pkt_err(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
)
1976 switch (cm_node
->state
) {
1977 case NES_CM_STATE_SYN_SENT
:
1978 case NES_CM_STATE_MPAREQ_SENT
:
1979 nes_debug(NES_DBG_CM
, "%s[%u] create abort for cm_node=%p "
1980 "listener=%p state=%d\n", __func__
, __LINE__
, cm_node
,
1981 cm_node
->listener
, cm_node
->state
);
1982 active_open_err(cm_node
, skb
, 1);
1984 case NES_CM_STATE_ESTABLISHED
:
1985 case NES_CM_STATE_SYN_RCVD
:
1986 passive_open_err(cm_node
, skb
, 1);
1988 case NES_CM_STATE_TSA
:
1994 static int check_syn(struct nes_cm_node
*cm_node
, struct tcphdr
*tcph
,
1995 struct sk_buff
*skb
)
1999 err
= ((ntohl(tcph
->ack_seq
) == cm_node
->tcp_cntxt
.loc_seq_num
)) ? 0 : 1;
2001 active_open_err(cm_node
, skb
, 1);
2006 static int check_seq(struct nes_cm_node
*cm_node
, struct tcphdr
*tcph
,
2007 struct sk_buff
*skb
)
2012 u32 loc_seq_num
= cm_node
->tcp_cntxt
.loc_seq_num
;
2013 u32 rcv_nxt
= cm_node
->tcp_cntxt
.rcv_nxt
;
2016 seq
= ntohl(tcph
->seq
);
2017 ack_seq
= ntohl(tcph
->ack_seq
);
2018 rcv_wnd
= cm_node
->tcp_cntxt
.rcv_wnd
;
2019 if (ack_seq
!= loc_seq_num
)
2021 else if (!between(seq
, rcv_nxt
, (rcv_nxt
+ rcv_wnd
)))
2024 nes_debug(NES_DBG_CM
, "%s[%u] create abort for cm_node=%p "
2025 "listener=%p state=%d\n", __func__
, __LINE__
, cm_node
,
2026 cm_node
->listener
, cm_node
->state
);
2027 indicate_pkt_err(cm_node
, skb
);
2028 nes_debug(NES_DBG_CM
, "seq ERROR cm_node =%p seq=0x%08X "
2029 "rcv_nxt=0x%08X rcv_wnd=0x%x\n", cm_node
, seq
, rcv_nxt
,
2036 * handle_syn_pkt() is for a passive node. The SYN packet is received when a node
2037 * is created with a listener, or it may come in as a retransmitted packet, in
2038 * which case it is simply dropped.
2040 static void handle_syn_pkt(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2041 struct tcphdr
*tcph
)
2047 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2049 inc_sequence
= ntohl(tcph
->seq
);
2051 switch (cm_node
->state
) {
2052 case NES_CM_STATE_SYN_SENT
:
2053 case NES_CM_STATE_MPAREQ_SENT
:
2054 /* Rcvd syn on active open connection*/
2055 active_open_err(cm_node
, skb
, 1);
2057 case NES_CM_STATE_LISTENING
:
2059 if (atomic_read(&cm_node
->listener
->pend_accepts_cnt
) >
2060 cm_node
->listener
->backlog
) {
2061 nes_debug(NES_DBG_CM
, "drop syn due to backlog "
2064 passive_open_err(cm_node
, skb
, 0);
2067 ret
= handle_tcp_options(cm_node
, tcph
, skb
, optionsize
,
2070 passive_open_err(cm_node
, skb
, 0);
2074 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ 1;
2075 BUG_ON(cm_node
->send_entry
);
2076 cm_node
->accept_pend
= 1;
2077 atomic_inc(&cm_node
->listener
->pend_accepts_cnt
);
2079 cm_node
->state
= NES_CM_STATE_SYN_RCVD
;
2080 send_syn(cm_node
, 1, skb
);
2082 case NES_CM_STATE_CLOSED
:
2083 cleanup_retrans_entry(cm_node
);
2084 add_ref_cm_node(cm_node
);
2085 send_reset(cm_node
, skb
);
2087 case NES_CM_STATE_TSA
:
2088 case NES_CM_STATE_ESTABLISHED
:
2089 case NES_CM_STATE_FIN_WAIT1
:
2090 case NES_CM_STATE_FIN_WAIT2
:
2091 case NES_CM_STATE_MPAREQ_RCVD
:
2092 case NES_CM_STATE_LAST_ACK
:
2093 case NES_CM_STATE_CLOSING
:
2094 case NES_CM_STATE_UNKNOWN
:
2101 static void handle_synack_pkt(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2102 struct tcphdr
*tcph
)
2108 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2110 inc_sequence
= ntohl(tcph
->seq
);
2111 switch (cm_node
->state
) {
2112 case NES_CM_STATE_SYN_SENT
:
2113 cleanup_retrans_entry(cm_node
);
2115 if (check_syn(cm_node
, tcph
, skb
))
2117 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2119 ret
= handle_tcp_options(cm_node
, tcph
, skb
, optionsize
, 0);
2121 nes_debug(NES_DBG_CM
, "cm_node=%p tcp_options failed\n",
2125 cleanup_retrans_entry(cm_node
);
2126 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ 1;
2127 send_mpa_request(cm_node
, skb
);
2128 cm_node
->state
= NES_CM_STATE_MPAREQ_SENT
;
2130 case NES_CM_STATE_MPAREQ_RCVD
:
2131 /* passive open, so should not be here */
2132 passive_open_err(cm_node
, skb
, 1);
2134 case NES_CM_STATE_LISTENING
:
2135 cm_node
->tcp_cntxt
.loc_seq_num
= ntohl(tcph
->ack_seq
);
2136 cleanup_retrans_entry(cm_node
);
2137 cm_node
->state
= NES_CM_STATE_CLOSED
;
2138 send_reset(cm_node
, skb
);
2140 case NES_CM_STATE_CLOSED
:
2141 cm_node
->tcp_cntxt
.loc_seq_num
= ntohl(tcph
->ack_seq
);
2142 cleanup_retrans_entry(cm_node
);
2143 add_ref_cm_node(cm_node
);
2144 send_reset(cm_node
, skb
);
2146 case NES_CM_STATE_ESTABLISHED
:
2147 case NES_CM_STATE_FIN_WAIT1
:
2148 case NES_CM_STATE_FIN_WAIT2
:
2149 case NES_CM_STATE_LAST_ACK
:
2150 case NES_CM_STATE_TSA
:
2151 case NES_CM_STATE_CLOSING
:
2152 case NES_CM_STATE_UNKNOWN
:
2153 case NES_CM_STATE_MPAREQ_SENT
:
2160 static int handle_ack_pkt(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2161 struct tcphdr
*tcph
)
2168 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2170 if (check_seq(cm_node
, tcph
, skb
))
2173 skb_pull(skb
, tcph
->doff
<< 2);
2174 inc_sequence
= ntohl(tcph
->seq
);
2175 datasize
= skb
->len
;
2176 switch (cm_node
->state
) {
2177 case NES_CM_STATE_SYN_RCVD
:
2179 cleanup_retrans_entry(cm_node
);
2180 ret
= handle_tcp_options(cm_node
, tcph
, skb
, optionsize
, 1);
2183 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2184 cm_node
->state
= NES_CM_STATE_ESTABLISHED
;
2186 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2187 nes_get_remote_addr(cm_node
);
2188 handle_rcv_mpa(cm_node
, skb
);
2189 } else { /* rcvd ACK only */
2190 dev_kfree_skb_any(skb
);
2193 case NES_CM_STATE_ESTABLISHED
:
2195 cleanup_retrans_entry(cm_node
);
2197 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2198 handle_rcv_mpa(cm_node
, skb
);
2203 case NES_CM_STATE_MPAREQ_SENT
:
2204 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2206 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2207 handle_rcv_mpa(cm_node
, skb
);
2208 } else { /* Could be just an ack pkt.. */
2209 dev_kfree_skb_any(skb
);
2212 case NES_CM_STATE_LISTENING
:
2213 cleanup_retrans_entry(cm_node
);
2214 cm_node
->state
= NES_CM_STATE_CLOSED
;
2215 send_reset(cm_node
, skb
);
2217 case NES_CM_STATE_CLOSED
:
2218 cleanup_retrans_entry(cm_node
);
2219 add_ref_cm_node(cm_node
);
2220 send_reset(cm_node
, skb
);
2222 case NES_CM_STATE_LAST_ACK
:
2223 case NES_CM_STATE_CLOSING
:
2224 cleanup_retrans_entry(cm_node
);
2225 cm_node
->state
= NES_CM_STATE_CLOSED
;
2226 cm_node
->cm_id
->rem_ref(cm_node
->cm_id
);
2227 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
2230 case NES_CM_STATE_FIN_WAIT1
:
2231 cleanup_retrans_entry(cm_node
);
2233 cm_node
->state
= NES_CM_STATE_FIN_WAIT2
;
2235 case NES_CM_STATE_SYN_SENT
:
2236 case NES_CM_STATE_FIN_WAIT2
:
2237 case NES_CM_STATE_TSA
:
2238 case NES_CM_STATE_MPAREQ_RCVD
:
2239 case NES_CM_STATE_UNKNOWN
:
2241 cleanup_retrans_entry(cm_node
);
2250 static int handle_tcp_options(struct nes_cm_node
*cm_node
, struct tcphdr
*tcph
,
2251 struct sk_buff
*skb
, int optionsize
, int passive
)
2253 u8
*optionsloc
= (u8
*)&tcph
[1];
2256 if (process_options(cm_node
, optionsloc
, optionsize
,
2258 nes_debug(NES_DBG_CM
, "%s: Node %p, Sending RESET\n",
2261 passive_open_err(cm_node
, skb
, 1);
2263 active_open_err(cm_node
, skb
, 1);
2268 cm_node
->tcp_cntxt
.snd_wnd
= ntohs(tcph
->window
) <<
2269 cm_node
->tcp_cntxt
.snd_wscale
;
2271 if (cm_node
->tcp_cntxt
.snd_wnd
> cm_node
->tcp_cntxt
.max_snd_wnd
)
2272 cm_node
->tcp_cntxt
.max_snd_wnd
= cm_node
->tcp_cntxt
.snd_wnd
;
2277 * active_open_err() will send reset() if flag set..
2278 * It will also send ABORT event.
2280 static void active_open_err(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2283 cleanup_retrans_entry(cm_node
);
2285 nes_debug(NES_DBG_CM
, "ERROR active err called for cm_node=%p, "
2286 "state=%d\n", cm_node
, cm_node
->state
);
2287 add_ref_cm_node(cm_node
);
2288 send_reset(cm_node
, skb
);
2290 dev_kfree_skb_any(skb
);
2293 cm_node
->state
= NES_CM_STATE_CLOSED
;
2294 create_event(cm_node
, NES_CM_EVENT_ABORTED
);
2298 * passive_open_err() will either do a reset() or will free up the skb and
2299 * remove the cm_node.
2301 static void passive_open_err(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2304 cleanup_retrans_entry(cm_node
);
2305 cm_node
->state
= NES_CM_STATE_CLOSED
;
2307 nes_debug(NES_DBG_CM
, "passive_open_err sending RST for "
2308 "cm_node=%p state =%d\n", cm_node
, cm_node
->state
);
2309 send_reset(cm_node
, skb
);
2311 dev_kfree_skb_any(skb
);
2312 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
2317 * free_retrans_entry() assumes that the retrans_list_lock has
2318 * been acquired before it is called.
2320 static void free_retrans_entry(struct nes_cm_node
*cm_node
)
2322 struct nes_timer_entry
*send_entry
;
2324 send_entry
= cm_node
->send_entry
;
2326 cm_node
->send_entry
= NULL
;
2327 dev_kfree_skb_any(send_entry
->skb
);
2329 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
2333 static void cleanup_retrans_entry(struct nes_cm_node
*cm_node
)
2335 unsigned long flags
;
2337 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
2338 free_retrans_entry(cm_node
);
2339 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
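2344 * NOTE: process_packet() is declared void, so the old remark "returns skb if to be freed, else NULL if already used" is stale; the function classifies the packet by its TCP flags and passes the skb to the matching handler.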
2346 static void process_packet(struct nes_cm_node
*cm_node
, struct sk_buff
*skb
,
2347 struct nes_cm_core
*cm_core
)
2349 enum nes_tcpip_pkt_type pkt_type
= NES_PKT_TYPE_UNKNOWN
;
2350 struct tcphdr
*tcph
= tcp_hdr(skb
);
2354 skb_pull(skb
, ip_hdr(skb
)->ihl
<< 2);
2356 nes_debug(NES_DBG_CM
, "process_packet: cm_node=%p state =%d syn=%d "
2357 "ack=%d rst=%d fin=%d\n", cm_node
, cm_node
->state
, tcph
->syn
,
2358 tcph
->ack
, tcph
->rst
, tcph
->fin
);
2361 pkt_type
= NES_PKT_TYPE_RST
;
2362 } else if (tcph
->syn
) {
2363 pkt_type
= NES_PKT_TYPE_SYN
;
2365 pkt_type
= NES_PKT_TYPE_SYNACK
;
2366 } else if (tcph
->ack
) {
2367 pkt_type
= NES_PKT_TYPE_ACK
;
2373 case NES_PKT_TYPE_SYN
:
2374 handle_syn_pkt(cm_node
, skb
, tcph
);
2376 case NES_PKT_TYPE_SYNACK
:
2377 handle_synack_pkt(cm_node
, skb
, tcph
);
2379 case NES_PKT_TYPE_ACK
:
2380 ret
= handle_ack_pkt(cm_node
, skb
, tcph
);
2381 if (fin_set
&& !ret
)
2382 handle_fin_pkt(cm_node
);
2384 case NES_PKT_TYPE_RST
:
2385 handle_rst_pkt(cm_node
, skb
, tcph
);
2388 if ((fin_set
) && (!check_seq(cm_node
, tcph
, skb
)))
2389 handle_fin_pkt(cm_node
);
2396 * mini_cm_listen - create a listen node with params
2398 static struct nes_cm_listener
*mini_cm_listen(struct nes_cm_core
*cm_core
,
2399 struct nes_vnic
*nesvnic
, struct nes_cm_info
*cm_info
)
2401 struct nes_cm_listener
*listener
;
2402 struct iwpm_dev_data pm_reg_msg
;
2403 struct iwpm_sa_data pm_msg
;
2404 unsigned long flags
;
2407 nes_debug(NES_DBG_CM
, "Search for 0x%08x : 0x%04x\n",
2408 cm_info
->loc_addr
, cm_info
->loc_port
);
2410 /* cannot have multiple matching listeners */
2411 listener
= find_listener(cm_core
, cm_info
->loc_addr
, cm_info
->loc_port
,
2412 NES_CM_LISTENER_EITHER_STATE
, 1);
2414 if (listener
&& listener
->listener_state
== NES_CM_LISTENER_ACTIVE_STATE
) {
2415 /* find automatically incs ref count ??? */
2416 atomic_dec(&listener
->ref_count
);
2417 nes_debug(NES_DBG_CM
, "Not creating listener since it already exists\n");
2422 nes_form_reg_msg(nesvnic
, &pm_reg_msg
);
2423 iwpm_err
= iwpm_register_pid(&pm_reg_msg
, RDMA_NL_NES
);
2425 nes_debug(NES_DBG_NLMSG
,
2426 "Port Mapper reg pid fail (err = %d).\n", iwpm_err
);
2428 if (iwpm_valid_pid() && !iwpm_err
) {
2429 nes_form_pm_msg(cm_info
, &pm_msg
);
2430 iwpm_err
= iwpm_add_mapping(&pm_msg
, RDMA_NL_NES
);
2432 nes_debug(NES_DBG_NLMSG
,
2433 "Port Mapper query fail (err = %d).\n", iwpm_err
);
2435 nes_record_pm_msg(cm_info
, &pm_msg
);
2438 /* create a CM listen node (1/2 node to compare incoming traffic to) */
2439 listener
= kzalloc(sizeof(*listener
), GFP_ATOMIC
);
2441 nes_debug(NES_DBG_CM
, "Not creating listener memory allocation failed\n");
2445 listener
->loc_addr
= cm_info
->loc_addr
;
2446 listener
->loc_port
= cm_info
->loc_port
;
2447 listener
->mapped_loc_addr
= cm_info
->mapped_loc_addr
;
2448 listener
->mapped_loc_port
= cm_info
->mapped_loc_port
;
2449 listener
->reused_node
= 0;
2451 atomic_set(&listener
->ref_count
, 1);
2454 /* find already inc'ed the ref count */
2456 listener
->reused_node
= 1;
2459 listener
->cm_id
= cm_info
->cm_id
;
2460 atomic_set(&listener
->pend_accepts_cnt
, 0);
2461 listener
->cm_core
= cm_core
;
2462 listener
->nesvnic
= nesvnic
;
2463 atomic_inc(&cm_core
->node_cnt
);
2465 listener
->conn_type
= cm_info
->conn_type
;
2466 listener
->backlog
= cm_info
->backlog
;
2467 listener
->listener_state
= NES_CM_LISTENER_ACTIVE_STATE
;
2469 if (!listener
->reused_node
) {
2470 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
2471 list_add(&listener
->list
, &cm_core
->listen_list
.list
);
2472 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
2473 atomic_inc(&cm_core
->listen_node_cnt
);
2476 nes_debug(NES_DBG_CM
, "Api - listen(): addr=0x%08X, port=0x%04x,"
2477 " listener = %p, backlog = %d, cm_id = %p.\n",
2478 cm_info
->loc_addr
, cm_info
->loc_port
,
2479 listener
, listener
->backlog
, listener
->cm_id
);
2486 * mini_cm_connect - make a connection node with params
2488 static struct nes_cm_node
*mini_cm_connect(struct nes_cm_core
*cm_core
,
2489 struct nes_vnic
*nesvnic
, u16 private_data_len
,
2490 void *private_data
, struct nes_cm_info
*cm_info
)
2493 struct nes_cm_node
*cm_node
;
2494 struct nes_cm_listener
*loopbackremotelistener
;
2495 struct nes_cm_node
*loopbackremotenode
;
2496 struct nes_cm_info loopback_cm_info
;
2499 /* create a CM connection node */
2500 cm_node
= make_cm_node(cm_core
, nesvnic
, cm_info
, NULL
);
2504 /* set our node side to client (active) side */
2505 cm_node
->tcp_cntxt
.client
= 1;
2506 cm_node
->tcp_cntxt
.rcv_wscale
= NES_CM_DEFAULT_RCV_WND_SCALE
;
2508 if (cm_info
->loc_addr
== cm_info
->rem_addr
) {
2509 loopbackremotelistener
= find_listener(cm_core
,
2510 cm_node
->mapped_loc_addr
, cm_node
->mapped_rem_port
,
2511 NES_CM_LISTENER_ACTIVE_STATE
, 0);
2512 if (loopbackremotelistener
== NULL
) {
2513 create_event(cm_node
, NES_CM_EVENT_ABORTED
);
2515 loopback_cm_info
= *cm_info
;
2516 loopback_cm_info
.loc_port
= cm_info
->rem_port
;
2517 loopback_cm_info
.rem_port
= cm_info
->loc_port
;
2518 loopback_cm_info
.mapped_loc_port
=
2519 cm_info
->mapped_rem_port
;
2520 loopback_cm_info
.mapped_rem_port
=
2521 cm_info
->mapped_loc_port
;
2522 loopback_cm_info
.cm_id
= loopbackremotelistener
->cm_id
;
2523 loopbackremotenode
= make_cm_node(cm_core
, nesvnic
,
2524 &loopback_cm_info
, loopbackremotelistener
);
2525 if (!loopbackremotenode
) {
2526 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
2529 atomic_inc(&cm_loopbacks
);
2530 loopbackremotenode
->loopbackpartner
= cm_node
;
2531 loopbackremotenode
->tcp_cntxt
.rcv_wscale
=
2532 NES_CM_DEFAULT_RCV_WND_SCALE
;
2533 cm_node
->loopbackpartner
= loopbackremotenode
;
2534 memcpy(loopbackremotenode
->mpa_frame_buf
, private_data
,
2536 loopbackremotenode
->mpa_frame_size
= private_data_len
;
2538 /* we are done handling this state. */
2539 /* set node to a TSA state */
2540 cm_node
->state
= NES_CM_STATE_TSA
;
2541 cm_node
->tcp_cntxt
.rcv_nxt
=
2542 loopbackremotenode
->tcp_cntxt
.loc_seq_num
;
2543 loopbackremotenode
->tcp_cntxt
.rcv_nxt
=
2544 cm_node
->tcp_cntxt
.loc_seq_num
;
2545 cm_node
->tcp_cntxt
.max_snd_wnd
=
2546 loopbackremotenode
->tcp_cntxt
.rcv_wnd
;
2547 loopbackremotenode
->tcp_cntxt
.max_snd_wnd
=
2548 cm_node
->tcp_cntxt
.rcv_wnd
;
2549 cm_node
->tcp_cntxt
.snd_wnd
=
2550 loopbackremotenode
->tcp_cntxt
.rcv_wnd
;
2551 loopbackremotenode
->tcp_cntxt
.snd_wnd
=
2552 cm_node
->tcp_cntxt
.rcv_wnd
;
2553 cm_node
->tcp_cntxt
.snd_wscale
=
2554 loopbackremotenode
->tcp_cntxt
.rcv_wscale
;
2555 loopbackremotenode
->tcp_cntxt
.snd_wscale
=
2556 cm_node
->tcp_cntxt
.rcv_wscale
;
2557 loopbackremotenode
->state
= NES_CM_STATE_MPAREQ_RCVD
;
2558 create_event(loopbackremotenode
, NES_CM_EVENT_MPA_REQ
);
2563 start_buff
= &cm_node
->mpa_frame_buf
[0] + sizeof(struct ietf_mpa_v2
);
2564 cm_node
->mpa_frame_size
= private_data_len
;
2566 memcpy(start_buff
, private_data
, private_data_len
);
2568 /* send a syn and goto syn sent state */
2569 cm_node
->state
= NES_CM_STATE_SYN_SENT
;
2570 ret
= send_syn(cm_node
, 0, NULL
);
2573 /* error in sending the syn free up the cm_node struct */
2574 nes_debug(NES_DBG_CM
, "Api - connect() FAILED: dest "
2575 "addr=0x%08X, port=0x%04x, cm_node=%p, cm_id = %p.\n",
2576 cm_node
->rem_addr
, cm_node
->rem_port
, cm_node
,
2578 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
2583 nes_debug(NES_DBG_CM
, "Api - connect(): dest addr=0x%08X,"
2584 "port=0x%04x, cm_node=%p, cm_id = %p.\n",
2585 cm_node
->rem_addr
, cm_node
->rem_port
, cm_node
,
/**
 * mini_cm_accept - accept a connection
 * @cm_core: CM core instance (unused)
 * @cm_node: connection node (unused)
 *
 * This function is never called; it only fills the accept slot of the CM
 * API table.
 *
 * Return: always 0.
 */
static int mini_cm_accept(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
{
	return 0;
}
2604 * mini_cm_reject - reject and teardown a connection
2606 static int mini_cm_reject(struct nes_cm_core
*cm_core
, struct nes_cm_node
*cm_node
)
2611 struct nes_cm_event event
;
2612 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
2613 struct nes_cm_node
*loopback
= cm_node
->loopbackpartner
;
2615 nes_debug(NES_DBG_CM
, "%s cm_node=%p type=%d state=%d\n",
2616 __func__
, cm_node
, cm_node
->tcp_cntxt
.client
, cm_node
->state
);
2618 if (cm_node
->tcp_cntxt
.client
)
2620 cleanup_retrans_entry(cm_node
);
2623 passive_state
= atomic_add_return(1, &cm_node
->passive_state
);
2624 if (passive_state
== NES_SEND_RESET_EVENT
) {
2625 cm_node
->state
= NES_CM_STATE_CLOSED
;
2626 rem_ref_cm_node(cm_core
, cm_node
);
2628 if (cm_node
->state
== NES_CM_STATE_LISTENER_DESTROYED
) {
2629 rem_ref_cm_node(cm_core
, cm_node
);
2631 ret
= send_mpa_reject(cm_node
);
2633 cm_node
->state
= NES_CM_STATE_CLOSED
;
2634 err
= send_reset(cm_node
, NULL
);
2638 cm_id
->add_ref(cm_id
);
2643 cm_node
->cm_id
= NULL
;
2644 if (cm_node
->state
== NES_CM_STATE_LISTENER_DESTROYED
) {
2645 rem_ref_cm_node(cm_core
, cm_node
);
2646 rem_ref_cm_node(cm_core
, loopback
);
2648 event
.cm_node
= loopback
;
2649 event
.cm_info
.rem_addr
= loopback
->rem_addr
;
2650 event
.cm_info
.loc_addr
= loopback
->loc_addr
;
2651 event
.cm_info
.rem_port
= loopback
->rem_port
;
2652 event
.cm_info
.loc_port
= loopback
->loc_port
;
2653 event
.cm_info
.cm_id
= loopback
->cm_id
;
2654 cm_event_mpa_reject(&event
);
2655 rem_ref_cm_node(cm_core
, cm_node
);
2656 loopback
->state
= NES_CM_STATE_CLOSING
;
2658 cm_id
= loopback
->cm_id
;
2659 rem_ref_cm_node(cm_core
, loopback
);
2660 cm_id
->rem_ref(cm_id
);
2671 static int mini_cm_close(struct nes_cm_core
*cm_core
, struct nes_cm_node
*cm_node
)
2675 if (!cm_core
|| !cm_node
)
2678 switch (cm_node
->state
) {
2679 case NES_CM_STATE_SYN_RCVD
:
2680 case NES_CM_STATE_SYN_SENT
:
2681 case NES_CM_STATE_ONE_SIDE_ESTABLISHED
:
2682 case NES_CM_STATE_ESTABLISHED
:
2683 case NES_CM_STATE_ACCEPTING
:
2684 case NES_CM_STATE_MPAREQ_SENT
:
2685 case NES_CM_STATE_MPAREQ_RCVD
:
2686 cleanup_retrans_entry(cm_node
);
2687 send_reset(cm_node
, NULL
);
2689 case NES_CM_STATE_CLOSE_WAIT
:
2690 cm_node
->state
= NES_CM_STATE_LAST_ACK
;
2691 send_fin(cm_node
, NULL
);
2693 case NES_CM_STATE_FIN_WAIT1
:
2694 case NES_CM_STATE_FIN_WAIT2
:
2695 case NES_CM_STATE_LAST_ACK
:
2696 case NES_CM_STATE_TIME_WAIT
:
2697 case NES_CM_STATE_CLOSING
:
2700 case NES_CM_STATE_LISTENING
:
2701 cleanup_retrans_entry(cm_node
);
2702 send_reset(cm_node
, NULL
);
2704 case NES_CM_STATE_MPAREJ_RCVD
:
2705 case NES_CM_STATE_UNKNOWN
:
2706 case NES_CM_STATE_INITED
:
2707 case NES_CM_STATE_CLOSED
:
2708 case NES_CM_STATE_LISTENER_DESTROYED
:
2709 ret
= rem_ref_cm_node(cm_core
, cm_node
);
2711 case NES_CM_STATE_TSA
:
2712 if (cm_node
->send_entry
)
2713 printk(KERN_ERR
"ERROR Close got called from STATE_TSA "
2714 "send_entry=%p\n", cm_node
->send_entry
);
2715 ret
= rem_ref_cm_node(cm_core
, cm_node
);
2723 * recv_pkt - recv an ETHERNET packet, and process it through CM
2724 * node state machine
2726 static int mini_cm_recv_pkt(struct nes_cm_core
*cm_core
,
2727 struct nes_vnic
*nesvnic
, struct sk_buff
*skb
)
2729 struct nes_cm_node
*cm_node
= NULL
;
2730 struct nes_cm_listener
*listener
= NULL
;
2732 struct tcphdr
*tcph
;
2733 struct nes_cm_info nfo
;
2734 int skb_handled
= 1;
2735 __be32 tmp_daddr
, tmp_saddr
;
2739 if (skb
->len
< sizeof(struct iphdr
) + sizeof(struct tcphdr
))
2742 iph
= (struct iphdr
*)skb
->data
;
2743 tcph
= (struct tcphdr
*)(skb
->data
+ sizeof(struct iphdr
));
2745 nfo
.loc_addr
= ntohl(iph
->daddr
);
2746 nfo
.loc_port
= ntohs(tcph
->dest
);
2747 nfo
.rem_addr
= ntohl(iph
->saddr
);
2748 nfo
.rem_port
= ntohs(tcph
->source
);
2750 /* If port mapper is available these should be mapped address info */
2751 nfo
.mapped_loc_addr
= ntohl(iph
->daddr
);
2752 nfo
.mapped_loc_port
= ntohs(tcph
->dest
);
2753 nfo
.mapped_rem_addr
= ntohl(iph
->saddr
);
2754 nfo
.mapped_rem_port
= ntohs(tcph
->source
);
2756 tmp_daddr
= cpu_to_be32(iph
->daddr
);
2757 tmp_saddr
= cpu_to_be32(iph
->saddr
);
2759 nes_debug(NES_DBG_CM
, "Received packet: dest=%pI4:0x%04X src=%pI4:0x%04X\n",
2760 &tmp_daddr
, tcph
->dest
, &tmp_saddr
, tcph
->source
);
2763 cm_node
= find_node(cm_core
,
2764 nfo
.mapped_rem_port
, nfo
.mapped_rem_addr
,
2765 nfo
.mapped_loc_port
, nfo
.mapped_loc_addr
);
2768 /* Only type of packet accepted are for */
2769 /* the PASSIVE open (syn only) */
2770 if ((!tcph
->syn
) || (tcph
->ack
)) {
2774 listener
= find_listener(cm_core
, nfo
.mapped_loc_addr
,
2775 nfo
.mapped_loc_port
,
2776 NES_CM_LISTENER_ACTIVE_STATE
, 0);
2780 nes_debug(NES_DBG_CM
, "Unable to find listener for the pkt\n");
2784 nfo
.cm_id
= listener
->cm_id
;
2785 nfo
.conn_type
= listener
->conn_type
;
2786 cm_node
= make_cm_node(cm_core
, nesvnic
, &nfo
,
2789 nes_debug(NES_DBG_CM
, "Unable to allocate "
2791 cm_packets_dropped
++;
2792 atomic_dec(&listener
->ref_count
);
2793 dev_kfree_skb_any(skb
);
2796 if (!tcph
->rst
&& !tcph
->fin
) {
2797 cm_node
->state
= NES_CM_STATE_LISTENING
;
2799 cm_packets_dropped
++;
2800 rem_ref_cm_node(cm_core
, cm_node
);
2801 dev_kfree_skb_any(skb
);
2804 add_ref_cm_node(cm_node
);
2805 } else if (cm_node
->state
== NES_CM_STATE_TSA
) {
2806 if (cm_node
->nesqp
->pau_mode
)
2807 nes_queue_mgt_skbs(skb
, nesvnic
, cm_node
->nesqp
);
2809 rem_ref_cm_node(cm_core
, cm_node
);
2810 atomic_inc(&cm_accel_dropped_pkts
);
2811 dev_kfree_skb_any(skb
);
2815 skb_reset_network_header(skb
);
2816 skb_set_transport_header(skb
, sizeof(*tcph
));
2817 skb
->len
= ntohs(iph
->tot_len
);
2818 process_packet(cm_node
, skb
, cm_core
);
2819 rem_ref_cm_node(cm_core
, cm_node
);
2826 * nes_cm_alloc_core - allocate a top level instance of a cm core
2828 static struct nes_cm_core
*nes_cm_alloc_core(void)
2830 struct nes_cm_core
*cm_core
;
2832 /* setup the CM core */
2833 /* alloc top level core control structure */
2834 cm_core
= kzalloc(sizeof(*cm_core
), GFP_KERNEL
);
2838 INIT_LIST_HEAD(&cm_core
->connected_nodes
);
2839 init_timer(&cm_core
->tcp_timer
);
2840 cm_core
->tcp_timer
.function
= nes_cm_timer_tick
;
2842 cm_core
->mtu
= NES_CM_DEFAULT_MTU
;
2843 cm_core
->state
= NES_CM_STATE_INITED
;
2844 cm_core
->free_tx_pkt_max
= NES_CM_DEFAULT_FREE_PKTS
;
2846 atomic_set(&cm_core
->events_posted
, 0);
2848 cm_core
->api
= &nes_cm_api
;
2850 spin_lock_init(&cm_core
->ht_lock
);
2851 spin_lock_init(&cm_core
->listen_list_lock
);
2853 INIT_LIST_HEAD(&cm_core
->listen_list
.list
);
2855 nes_debug(NES_DBG_CM
, "Init CM Core completed -- cm_core=%p\n", cm_core
);
2857 nes_debug(NES_DBG_CM
, "Enable QUEUE EVENTS\n");
2858 cm_core
->event_wq
= create_singlethread_workqueue("nesewq");
2859 cm_core
->post_event
= nes_cm_post_event
;
2860 nes_debug(NES_DBG_CM
, "Enable QUEUE DISCONNECTS\n");
2861 cm_core
->disconn_wq
= create_singlethread_workqueue("nesdwq");
2863 print_core(cm_core
);
2869 * mini_cm_dealloc_core - deallocate a top level instance of a cm core
2871 static int mini_cm_dealloc_core(struct nes_cm_core
*cm_core
)
2873 nes_debug(NES_DBG_CM
, "De-Alloc CM Core (%p)\n", cm_core
);
2880 if (timer_pending(&cm_core
->tcp_timer
))
2881 del_timer(&cm_core
->tcp_timer
);
2883 destroy_workqueue(cm_core
->event_wq
);
2884 destroy_workqueue(cm_core
->disconn_wq
);
2885 nes_debug(NES_DBG_CM
, "\n");
2895 static int mini_cm_get(struct nes_cm_core
*cm_core
)
2897 return cm_core
->state
;
2904 static int mini_cm_set(struct nes_cm_core
*cm_core
, u32 type
, u32 value
)
2909 case NES_CM_SET_PKT_SIZE
:
2910 cm_core
->mtu
= value
;
2912 case NES_CM_SET_FREE_PKT_Q_SIZE
:
2913 cm_core
->free_tx_pkt_max
= value
;
2916 /* unknown set option */
2925 * nes_cm_init_tsa_conn setup HW; MPA frames must be
2926 * successfully exchanged when this is called
2928 static int nes_cm_init_tsa_conn(struct nes_qp
*nesqp
, struct nes_cm_node
*cm_node
)
2935 nesqp
->nesqp_context
->misc
|= cpu_to_le32(NES_QPCONTEXT_MISC_IPV4
|
2936 NES_QPCONTEXT_MISC_NO_NAGLE
| NES_QPCONTEXT_MISC_DO_NOT_FRAG
|
2937 NES_QPCONTEXT_MISC_DROS
);
2939 if (cm_node
->tcp_cntxt
.snd_wscale
|| cm_node
->tcp_cntxt
.rcv_wscale
)
2940 nesqp
->nesqp_context
->misc
|= cpu_to_le32(NES_QPCONTEXT_MISC_WSCALE
);
2942 nesqp
->nesqp_context
->misc2
|= cpu_to_le32(64 << NES_QPCONTEXT_MISC2_TTL_SHIFT
);
2944 nesqp
->nesqp_context
->misc2
|= cpu_to_le32(
2945 cm_node
->tos
<< NES_QPCONTEXT_MISC2_TOS_SHIFT
);
2947 nesqp
->nesqp_context
->mss
|= cpu_to_le32(((u32
)cm_node
->tcp_cntxt
.mss
) << 16);
2949 nesqp
->nesqp_context
->tcp_state_flow_label
|= cpu_to_le32(
2950 (u32
)NES_QPCONTEXT_TCPSTATE_EST
<< NES_QPCONTEXT_TCPFLOW_TCP_STATE_SHIFT
);
2952 nesqp
->nesqp_context
->pd_index_wscale
|= cpu_to_le32(
2953 (cm_node
->tcp_cntxt
.snd_wscale
<< NES_QPCONTEXT_PDWSCALE_SND_WSCALE_SHIFT
) &
2954 NES_QPCONTEXT_PDWSCALE_SND_WSCALE_MASK
);
2956 nesqp
->nesqp_context
->pd_index_wscale
|= cpu_to_le32(
2957 (cm_node
->tcp_cntxt
.rcv_wscale
<< NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_SHIFT
) &
2958 NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_MASK
);
2960 nesqp
->nesqp_context
->keepalive
= cpu_to_le32(0x80);
2961 nesqp
->nesqp_context
->ts_recent
= 0;
2962 nesqp
->nesqp_context
->ts_age
= 0;
2963 nesqp
->nesqp_context
->snd_nxt
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
2964 nesqp
->nesqp_context
->snd_wnd
= cpu_to_le32(cm_node
->tcp_cntxt
.snd_wnd
);
2965 nesqp
->nesqp_context
->rcv_nxt
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_nxt
);
2966 nesqp
->nesqp_context
->rcv_wnd
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_wnd
<<
2967 cm_node
->tcp_cntxt
.rcv_wscale
);
2968 nesqp
->nesqp_context
->snd_max
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
2969 nesqp
->nesqp_context
->snd_una
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
2970 nesqp
->nesqp_context
->srtt
= 0;
2971 nesqp
->nesqp_context
->rttvar
= cpu_to_le32(0x6);
2972 nesqp
->nesqp_context
->ssthresh
= cpu_to_le32(0x3FFFC000);
2973 nesqp
->nesqp_context
->cwnd
= cpu_to_le32(2 * cm_node
->tcp_cntxt
.mss
);
2974 nesqp
->nesqp_context
->snd_wl1
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_nxt
);
2975 nesqp
->nesqp_context
->snd_wl2
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
2976 nesqp
->nesqp_context
->max_snd_wnd
= cpu_to_le32(cm_node
->tcp_cntxt
.max_snd_wnd
);
2978 nes_debug(NES_DBG_CM
, "QP%u: rcv_nxt = 0x%08X, snd_nxt = 0x%08X,"
2979 " Setting MSS to %u, PDWscale = 0x%08X, rcv_wnd = %u, context misc = 0x%08X.\n",
2980 nesqp
->hwqp
.qp_id
, le32_to_cpu(nesqp
->nesqp_context
->rcv_nxt
),
2981 le32_to_cpu(nesqp
->nesqp_context
->snd_nxt
),
2982 cm_node
->tcp_cntxt
.mss
, le32_to_cpu(nesqp
->nesqp_context
->pd_index_wscale
),
2983 le32_to_cpu(nesqp
->nesqp_context
->rcv_wnd
),
2984 le32_to_cpu(nesqp
->nesqp_context
->misc
));
2985 nes_debug(NES_DBG_CM
, " snd_wnd = 0x%08X.\n", le32_to_cpu(nesqp
->nesqp_context
->snd_wnd
));
2986 nes_debug(NES_DBG_CM
, " snd_cwnd = 0x%08X.\n", le32_to_cpu(nesqp
->nesqp_context
->cwnd
));
2987 nes_debug(NES_DBG_CM
, " max_swnd = 0x%08X.\n", le32_to_cpu(nesqp
->nesqp_context
->max_snd_wnd
));
2989 nes_debug(NES_DBG_CM
, "Change cm_node state to TSA\n");
2990 cm_node
->state
= NES_CM_STATE_TSA
;
2999 int nes_cm_disconn(struct nes_qp
*nesqp
)
3001 struct disconn_work
*work
;
3003 work
= kzalloc(sizeof *work
, GFP_ATOMIC
);
3005 return -ENOMEM
; /* Timer will clean up */
3007 nes_add_ref(&nesqp
->ibqp
);
3008 work
->nesqp
= nesqp
;
3009 INIT_WORK(&work
->work
, nes_disconnect_worker
);
3010 queue_work(g_cm_core
->disconn_wq
, &work
->work
);
3016 * nes_disconnect_worker
3018 static void nes_disconnect_worker(struct work_struct
*work
)
3020 struct disconn_work
*dwork
= container_of(work
, struct disconn_work
, work
);
3021 struct nes_qp
*nesqp
= dwork
->nesqp
;
3024 nes_debug(NES_DBG_CM
, "processing AEQE id 0x%04X for QP%u.\n",
3025 nesqp
->last_aeq
, nesqp
->hwqp
.qp_id
);
3026 nes_cm_disconn_true(nesqp
);
3027 nes_rem_ref(&nesqp
->ibqp
);
3032 * nes_cm_disconn_true
3034 static int nes_cm_disconn_true(struct nes_qp
*nesqp
)
3036 unsigned long flags
;
3038 struct iw_cm_id
*cm_id
;
3039 struct iw_cm_event cm_event
;
3040 struct nes_vnic
*nesvnic
;
3042 u8 original_hw_tcp_state
;
3043 u8 original_ibqp_state
;
3044 int disconn_status
= 0;
3045 int issue_disconn
= 0;
3046 int issue_close
= 0;
3047 int issue_flush
= 0;
3048 u32 flush_q
= NES_CQP_FLUSH_RQ
;
3049 struct ib_event ibevent
;
3052 nes_debug(NES_DBG_CM
, "disconnect_worker nesqp is NULL\n");
3056 spin_lock_irqsave(&nesqp
->lock
, flags
);
3057 cm_id
= nesqp
->cm_id
;
3058 /* make sure we havent already closed this connection */
3060 nes_debug(NES_DBG_CM
, "QP%u disconnect_worker cmid is NULL\n",
3062 spin_unlock_irqrestore(&nesqp
->lock
, flags
);
3066 nesvnic
= to_nesvnic(nesqp
->ibqp
.device
);
3067 nes_debug(NES_DBG_CM
, "Disconnecting QP%u\n", nesqp
->hwqp
.qp_id
);
3069 original_hw_tcp_state
= nesqp
->hw_tcp_state
;
3070 original_ibqp_state
= nesqp
->ibqp_state
;
3071 last_ae
= nesqp
->last_aeq
;
3073 if (nesqp
->term_flags
) {
3076 nesqp
->cm_id
= NULL
;
3077 del_timer(&nesqp
->terminate_timer
);
3078 if (nesqp
->flush_issued
== 0) {
3079 nesqp
->flush_issued
= 1;
3082 } else if ((original_hw_tcp_state
== NES_AEQE_TCP_STATE_CLOSE_WAIT
) ||
3083 ((original_ibqp_state
== IB_QPS_RTS
) &&
3084 (last_ae
== NES_AEQE_AEID_LLP_CONNECTION_RESET
))) {
3086 if (last_ae
== NES_AEQE_AEID_LLP_CONNECTION_RESET
)
3087 disconn_status
= -ECONNRESET
;
3090 if (((original_hw_tcp_state
== NES_AEQE_TCP_STATE_CLOSED
) ||
3091 (original_hw_tcp_state
== NES_AEQE_TCP_STATE_TIME_WAIT
) ||
3092 (last_ae
== NES_AEQE_AEID_RDMAP_ROE_BAD_LLP_CLOSE
) ||
3093 (last_ae
== NES_AEQE_AEID_LLP_CONNECTION_RESET
))) {
3095 nesqp
->cm_id
= NULL
;
3096 if (nesqp
->flush_issued
== 0) {
3097 nesqp
->flush_issued
= 1;
3102 spin_unlock_irqrestore(&nesqp
->lock
, flags
);
3104 if ((issue_flush
) && (nesqp
->destroyed
== 0)) {
3105 /* Flush the queue(s) */
3106 if (nesqp
->hw_iwarp_state
>= NES_AEQE_IWARP_STATE_TERMINATE
)
3107 flush_q
|= NES_CQP_FLUSH_SQ
;
3108 flush_wqes(nesvnic
->nesdev
, nesqp
, flush_q
, 1);
3110 if (nesqp
->term_flags
) {
3111 ibevent
.device
= nesqp
->ibqp
.device
;
3112 ibevent
.event
= nesqp
->terminate_eventtype
;
3113 ibevent
.element
.qp
= &nesqp
->ibqp
;
3114 if (nesqp
->ibqp
.event_handler
)
3115 nesqp
->ibqp
.event_handler(&ibevent
, nesqp
->ibqp
.qp_context
);
3119 if ((cm_id
) && (cm_id
->event_handler
)) {
3120 if (issue_disconn
) {
3121 atomic_inc(&cm_disconnects
);
3122 cm_event
.event
= IW_CM_EVENT_DISCONNECT
;
3123 cm_event
.status
= disconn_status
;
3124 cm_event
.local_addr
= cm_id
->local_addr
;
3125 cm_event
.remote_addr
= cm_id
->remote_addr
;
3126 cm_event
.private_data
= NULL
;
3127 cm_event
.private_data_len
= 0;
3129 nes_debug(NES_DBG_CM
, "Generating a CM Disconnect Event"
3130 " for QP%u, SQ Head = %u, SQ Tail = %u. "
3131 "cm_id = %p, refcount = %u.\n",
3132 nesqp
->hwqp
.qp_id
, nesqp
->hwqp
.sq_head
,
3133 nesqp
->hwqp
.sq_tail
, cm_id
,
3134 atomic_read(&nesqp
->refcount
));
3136 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3138 nes_debug(NES_DBG_CM
, "OFA CM event_handler "
3139 "returned, ret=%d\n", ret
);
3143 atomic_inc(&cm_closes
);
3144 nes_disconnect(nesqp
, 1);
3146 cm_id
->provider_data
= nesqp
;
3147 /* Send up the close complete event */
3148 cm_event
.event
= IW_CM_EVENT_CLOSE
;
3149 cm_event
.status
= 0;
3150 cm_event
.provider_data
= cm_id
->provider_data
;
3151 cm_event
.local_addr
= cm_id
->local_addr
;
3152 cm_event
.remote_addr
= cm_id
->remote_addr
;
3153 cm_event
.private_data
= NULL
;
3154 cm_event
.private_data_len
= 0;
3156 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3158 nes_debug(NES_DBG_CM
, "OFA CM event_handler returned, ret=%d\n", ret
);
3160 cm_id
->rem_ref(cm_id
);
3171 static int nes_disconnect(struct nes_qp
*nesqp
, int abrupt
)
3174 struct nes_vnic
*nesvnic
;
3175 struct nes_device
*nesdev
;
3176 struct nes_ib_device
*nesibdev
;
3178 nesvnic
= to_nesvnic(nesqp
->ibqp
.device
);
3182 nesdev
= nesvnic
->nesdev
;
3183 nesibdev
= nesvnic
->nesibdev
;
3185 nes_debug(NES_DBG_CM
, "netdev refcnt = %u.\n",
3186 netdev_refcnt_read(nesvnic
->netdev
));
3188 if (nesqp
->active_conn
) {
3190 /* indicate this connection is NOT active */
3191 nesqp
->active_conn
= 0;
3193 /* Need to free the Last Streaming Mode Message */
3194 if (nesqp
->ietf_frame
) {
3196 nesibdev
->ibdev
.dereg_mr(nesqp
->lsmm_mr
);
3197 pci_free_consistent(nesdev
->pcidev
,
3198 nesqp
->private_data_len
+ nesqp
->ietf_frame_size
,
3199 nesqp
->ietf_frame
, nesqp
->ietf_frame_pbase
);
3203 /* close the CM node down if it is still active */
3204 if (nesqp
->cm_node
) {
3205 nes_debug(NES_DBG_CM
, "Call close API\n");
3207 g_cm_core
->api
->close(g_cm_core
, nesqp
->cm_node
);
3217 int nes_accept(struct iw_cm_id
*cm_id
, struct iw_cm_conn_param
*conn_param
)
3221 struct nes_qp
*nesqp
;
3222 struct nes_vnic
*nesvnic
;
3223 struct nes_device
*nesdev
;
3224 struct nes_cm_node
*cm_node
;
3225 struct nes_adapter
*adapter
;
3226 struct ib_qp_attr attr
;
3227 struct iw_cm_event cm_event
;
3228 struct nes_hw_qp_wqe
*wqe
;
3229 struct nes_v4_quad nes_quad
;
3233 struct nes_ib_device
*nesibdev
;
3234 struct ib_mr
*ibmr
= NULL
;
3235 struct ib_phys_buf ibphysbuf
;
3236 struct nes_pd
*nespd
;
3238 u8 mpa_frame_offset
= 0;
3239 struct ietf_mpa_v2
*mpa_v2_frame
;
3241 u8
*start_ptr
= &start_addr
;
3242 u8
**start_buff
= &start_ptr
;
3244 struct sockaddr_in
*laddr
= (struct sockaddr_in
*)&cm_id
->local_addr
;
3245 struct sockaddr_in
*raddr
= (struct sockaddr_in
*)&cm_id
->remote_addr
;
3247 ibqp
= nes_get_qp(cm_id
->device
, conn_param
->qpn
);
3251 /* get all our handles */
3252 nesqp
= to_nesqp(ibqp
);
3253 nesvnic
= to_nesvnic(nesqp
->ibqp
.device
);
3254 nesdev
= nesvnic
->nesdev
;
3255 adapter
= nesdev
->nesadapter
;
3257 cm_node
= (struct nes_cm_node
*)cm_id
->provider_data
;
3258 nes_debug(NES_DBG_CM
, "nes_accept: cm_node= %p nesvnic=%p, netdev=%p,"
3259 "%s\n", cm_node
, nesvnic
, nesvnic
->netdev
,
3260 nesvnic
->netdev
->name
);
3262 if (NES_CM_STATE_LISTENER_DESTROYED
== cm_node
->state
) {
3263 if (cm_node
->loopbackpartner
)
3264 rem_ref_cm_node(cm_node
->cm_core
, cm_node
->loopbackpartner
);
3265 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
3269 passive_state
= atomic_add_return(1, &cm_node
->passive_state
);
3270 if (passive_state
== NES_SEND_RESET_EVENT
) {
3271 rem_ref_cm_node(cm_node
->cm_core
, cm_node
);
3274 /* associate the node with the QP */
3275 nesqp
->cm_node
= (void *)cm_node
;
3276 cm_node
->nesqp
= nesqp
;
3279 nes_debug(NES_DBG_CM
, "QP%u, cm_node=%p, jiffies = %lu listener = %p\n",
3280 nesqp
->hwqp
.qp_id
, cm_node
, jiffies
, cm_node
->listener
);
3281 atomic_inc(&cm_accepts
);
3283 nes_debug(NES_DBG_CM
, "netdev refcnt = %u.\n",
3284 netdev_refcnt_read(nesvnic
->netdev
));
3286 nesqp
->ietf_frame_size
= sizeof(struct ietf_mpa_v2
);
3287 /* allocate the ietf frame and space for private data */
3288 nesqp
->ietf_frame
= pci_alloc_consistent(nesdev
->pcidev
,
3289 nesqp
->ietf_frame_size
+ conn_param
->private_data_len
,
3290 &nesqp
->ietf_frame_pbase
);
3292 if (!nesqp
->ietf_frame
) {
3293 nes_debug(NES_DBG_CM
, "Unable to allocate memory for private data\n");
3296 mpa_v2_frame
= (struct ietf_mpa_v2
*)nesqp
->ietf_frame
;
3298 if (cm_node
->mpa_frame_rev
== IETF_MPA_V1
)
3299 mpa_frame_offset
= 4;
3301 if (cm_node
->mpa_frame_rev
== IETF_MPA_V1
||
3302 cm_node
->mpav2_ird_ord
== IETF_NO_IRD_ORD
) {
3303 record_ird_ord(cm_node
, (u16
)conn_param
->ird
, (u16
)conn_param
->ord
);
3306 memcpy(mpa_v2_frame
->priv_data
, conn_param
->private_data
,
3307 conn_param
->private_data_len
);
3309 cm_build_mpa_frame(cm_node
, start_buff
, &buff_len
, nesqp
->ietf_frame
, MPA_KEY_REPLY
);
3310 nesqp
->private_data_len
= conn_param
->private_data_len
;
3312 /* setup our first outgoing iWarp send WQE (the IETF frame response) */
3313 wqe
= &nesqp
->hwqp
.sq_vbase
[0];
3315 if (raddr
->sin_addr
.s_addr
!= laddr
->sin_addr
.s_addr
) {
3316 u64temp
= (unsigned long)nesqp
;
3317 nesibdev
= nesvnic
->nesibdev
;
3318 nespd
= nesqp
->nespd
;
3319 ibphysbuf
.addr
= nesqp
->ietf_frame_pbase
+ mpa_frame_offset
;
3320 ibphysbuf
.size
= buff_len
;
3321 tagged_offset
= (u64
)(unsigned long)*start_buff
;
3322 ibmr
= nesibdev
->ibdev
.reg_phys_mr((struct ib_pd
*)nespd
,
3324 IB_ACCESS_LOCAL_WRITE
,
3327 nes_debug(NES_DBG_CM
, "Unable to register memory region"
3328 "for lSMM for cm_node = %p \n",
3330 pci_free_consistent(nesdev
->pcidev
,
3331 nesqp
->private_data_len
+ nesqp
->ietf_frame_size
,
3332 nesqp
->ietf_frame
, nesqp
->ietf_frame_pbase
);
3336 ibmr
->pd
= &nespd
->ibpd
;
3337 ibmr
->device
= nespd
->ibpd
.device
;
3338 nesqp
->lsmm_mr
= ibmr
;
3340 u64temp
|= NES_SW_CONTEXT_ALIGN
>> 1;
3341 set_wqe_64bit_value(wqe
->wqe_words
,
3342 NES_IWARP_SQ_WQE_COMP_CTX_LOW_IDX
,
3344 wqe
->wqe_words
[NES_IWARP_SQ_WQE_MISC_IDX
] =
3345 cpu_to_le32(NES_IWARP_SQ_WQE_STREAMING
|
3346 NES_IWARP_SQ_WQE_WRPDU
);
3347 wqe
->wqe_words
[NES_IWARP_SQ_WQE_TOTAL_PAYLOAD_IDX
] =
3348 cpu_to_le32(buff_len
);
3349 set_wqe_64bit_value(wqe
->wqe_words
,
3350 NES_IWARP_SQ_WQE_FRAG0_LOW_IDX
,
3351 (u64
)(unsigned long)(*start_buff
));
3352 wqe
->wqe_words
[NES_IWARP_SQ_WQE_LENGTH0_IDX
] =
3353 cpu_to_le32(buff_len
);
3354 wqe
->wqe_words
[NES_IWARP_SQ_WQE_STAG0_IDX
] = ibmr
->lkey
;
3355 if (nesqp
->sq_kmapped
) {
3356 nesqp
->sq_kmapped
= 0;
3357 kunmap(nesqp
->page
);
3360 nesqp
->nesqp_context
->ird_ord_sizes
|=
3361 cpu_to_le32(NES_QPCONTEXT_ORDIRD_LSMM_PRESENT
|
3362 NES_QPCONTEXT_ORDIRD_WRPDU
);
3364 nesqp
->nesqp_context
->ird_ord_sizes
|=
3365 cpu_to_le32(NES_QPCONTEXT_ORDIRD_WRPDU
);
3367 nesqp
->skip_lsmm
= 1;
3369 /* Cache the cm_id in the qp */
3370 nesqp
->cm_id
= cm_id
;
3371 cm_node
->cm_id
= cm_id
;
3373 /* nesqp->cm_node = (void *)cm_id->provider_data; */
3374 cm_id
->provider_data
= nesqp
;
3375 nesqp
->active_conn
= 0;
3377 if (cm_node
->state
== NES_CM_STATE_TSA
)
3378 nes_debug(NES_DBG_CM
, "Already state = TSA for cm_node=%p\n",
3381 nes_cm_init_tsa_conn(nesqp
, cm_node
);
3383 nesqp
->nesqp_context
->tcpPorts
[0] =
3384 cpu_to_le16(cm_node
->mapped_loc_port
);
3385 nesqp
->nesqp_context
->tcpPorts
[1] =
3386 cpu_to_le16(cm_node
->mapped_rem_port
);
3388 nesqp
->nesqp_context
->ip0
= cpu_to_le32(cm_node
->mapped_rem_addr
);
3390 nesqp
->nesqp_context
->misc2
|= cpu_to_le32(
3391 (u32
)PCI_FUNC(nesdev
->pcidev
->devfn
) <<
3392 NES_QPCONTEXT_MISC2_SRC_IP_SHIFT
);
3394 nesqp
->nesqp_context
->arp_index_vlan
|=
3395 cpu_to_le32(nes_arp_table(nesdev
,
3396 le32_to_cpu(nesqp
->nesqp_context
->ip0
), NULL
,
3397 NES_ARP_RESOLVE
) << 16);
3399 nesqp
->nesqp_context
->ts_val_delta
= cpu_to_le32(
3400 jiffies
- nes_read_indexed(nesdev
, NES_IDX_TCP_NOW
));
3402 nesqp
->nesqp_context
->ird_index
= cpu_to_le32(nesqp
->hwqp
.qp_id
);
3404 nesqp
->nesqp_context
->ird_ord_sizes
|= cpu_to_le32(
3405 ((u32
)1 << NES_QPCONTEXT_ORDIRD_IWARP_MODE_SHIFT
));
3406 nesqp
->nesqp_context
->ird_ord_sizes
|=
3407 cpu_to_le32((u32
)cm_node
->ord_size
);
3409 memset(&nes_quad
, 0, sizeof(nes_quad
));
3410 nes_quad
.DstIpAdrIndex
=
3411 cpu_to_le32((u32
)PCI_FUNC(nesdev
->pcidev
->devfn
) << 24);
3412 nes_quad
.SrcIpadr
= htonl(cm_node
->mapped_rem_addr
);
3413 nes_quad
.TcpPorts
[0] = htons(cm_node
->mapped_rem_port
);
3414 nes_quad
.TcpPorts
[1] = htons(cm_node
->mapped_loc_port
);
3416 /* Produce hash key */
3417 crc_value
= get_crc_value(&nes_quad
);
3418 nesqp
->hte_index
= cpu_to_be32(crc_value
^ 0xffffffff);
3419 nes_debug(NES_DBG_CM
, "HTE Index = 0x%08X, CRC = 0x%08X\n",
3420 nesqp
->hte_index
, nesqp
->hte_index
& adapter
->hte_index_mask
);
3422 nesqp
->hte_index
&= adapter
->hte_index_mask
;
3423 nesqp
->nesqp_context
->hte_index
= cpu_to_le32(nesqp
->hte_index
);
3425 cm_node
->cm_core
->api
->accelerated(cm_node
->cm_core
, cm_node
);
3427 nes_debug(NES_DBG_CM
, "QP%u, Destination IP = 0x%08X:0x%04X, local = "
3428 "0x%08X:0x%04X, rcv_nxt=0x%08X, snd_nxt=0x%08X, mpa + "
3429 "private data length=%u.\n", nesqp
->hwqp
.qp_id
,
3430 ntohl(raddr
->sin_addr
.s_addr
), ntohs(raddr
->sin_port
),
3431 ntohl(laddr
->sin_addr
.s_addr
), ntohs(laddr
->sin_port
),
3432 le32_to_cpu(nesqp
->nesqp_context
->rcv_nxt
),
3433 le32_to_cpu(nesqp
->nesqp_context
->snd_nxt
),
3436 /* notify OF layer that accept event was successful */
3437 cm_id
->add_ref(cm_id
);
3438 nes_add_ref(&nesqp
->ibqp
);
3440 cm_event
.event
= IW_CM_EVENT_ESTABLISHED
;
3441 cm_event
.status
= 0;
3442 cm_event
.provider_data
= (void *)nesqp
;
3443 cm_event
.local_addr
= cm_id
->local_addr
;
3444 cm_event
.remote_addr
= cm_id
->remote_addr
;
3445 cm_event
.private_data
= NULL
;
3446 cm_event
.private_data_len
= 0;
3447 cm_event
.ird
= cm_node
->ird_size
;
3448 cm_event
.ord
= cm_node
->ord_size
;
3450 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3451 attr
.qp_state
= IB_QPS_RTS
;
3452 nes_modify_qp(&nesqp
->ibqp
, &attr
, IB_QP_STATE
, NULL
);
3453 if (cm_node
->loopbackpartner
) {
3454 cm_node
->loopbackpartner
->mpa_frame_size
=
3455 nesqp
->private_data_len
;
3456 /* copy entire MPA frame to our cm_node's frame */
3457 memcpy(cm_node
->loopbackpartner
->mpa_frame_buf
,
3458 conn_param
->private_data
, conn_param
->private_data_len
);
3459 create_event(cm_node
->loopbackpartner
, NES_CM_EVENT_CONNECTED
);
3462 printk(KERN_ERR
"%s[%u] OFA CM event_handler returned, "
3463 "ret=%d\n", __func__
, __LINE__
, ret
);
/*
 * nes_reject - hand a connection node to the CM core's reject() callback.
 * @cm_id:     iw_cm_id whose provider_data holds the nes_cm_node
 * @pdata:     private data supplied by the caller
 * @pdata_len: number of bytes at @pdata
 *
 * Bumps the cm_rejects counter, binds @cm_id to the node, copies the
 * private data into the MPA frame storage and returns whatever
 * cm_core->api->reject() returns.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * start_buff, the body of the size check and whatever selects between the
 * loopback copy and the cm_node copy); confirm against the full file.
 */
3472 int nes_reject(struct iw_cm_id
*cm_id
, const void *pdata
, u8 pdata_len
)
3474 struct nes_cm_node
*cm_node
;
3475 struct nes_cm_node
*loopback
;
3476 struct nes_cm_core
*cm_core
;
3479 atomic_inc(&cm_rejects
);
3480 cm_node
= (struct nes_cm_node
*)cm_id
->provider_data
;
3481 loopback
= cm_node
->loopbackpartner
;
3482 cm_core
= cm_node
->cm_core
;
3483 cm_node
->cm_id
= cm_id
;
/*
 * The private data plus an ietf_mpa_v2 header must fit in MAX_CM_BUFFER.
 * NOTE(review): the statement executed when it does not fit is not visible.
 */
3485 if (pdata_len
+ sizeof(struct ietf_mpa_v2
) > MAX_CM_BUFFER
)
/*
 * Loopback partner: private data goes straight into its mpa_frame.
 * NOTE(review): a guard on `loopback` is not visible here - confirm it
 * cannot be NULL on this path.
 */
3489 memcpy(&loopback
->mpa_frame
.priv_data
, pdata
, pdata_len
);
3490 loopback
->mpa_frame
.priv_data_len
= pdata_len
;
3491 loopback
->mpa_frame_size
= pdata_len
;
/* This node: private data is placed after room for an ietf_mpa_v2 header. */
3493 start_buff
= &cm_node
->mpa_frame_buf
[0] + sizeof(struct ietf_mpa_v2
);
3494 cm_node
->mpa_frame_size
= pdata_len
;
3495 memcpy(start_buff
, pdata
, pdata_len
);
3497 return cm_core
->api
->reject(cm_core
, cm_node
);
3503 * setup and launch cm connect node
/*
 * nes_connect - set up and launch an active-side CM connect node.
 * @cm_id:      iw_cm_id carrying the local and remote socket addresses
 * @conn_param: connection parameters (qpn, private data, ird, ord)
 *
 * Looks up the QP named by conn_param->qpn, fills a nes_cm_info with the
 * addresses and ports in host byte order, consults the iWARP port mapper,
 * then asks g_cm_core->api->connect() to create the node and links the
 * node and the QP to each other.
 *
 * NOTE(review): this extract is missing lines (braces, several local
 * declarations such as ibqp/apbvt_set/iwpm_err, the bodies of the
 * validation checks, part of the connect() argument list and the return
 * statements); the comments below describe only what is visible.
 */
3505 int nes_connect(struct iw_cm_id
*cm_id
, struct iw_cm_conn_param
*conn_param
)
3508 struct nes_qp
*nesqp
;
3509 struct nes_vnic
*nesvnic
;
3510 struct nes_device
*nesdev
;
3511 struct nes_cm_node
*cm_node
;
3512 struct nes_cm_info cm_info
;
3514 struct sockaddr_in
*laddr
= (struct sockaddr_in
*)&cm_id
->local_addr
;
3515 struct sockaddr_in
*raddr
= (struct sockaddr_in
*)&cm_id
->remote_addr
;
3516 struct iwpm_dev_data pm_reg_msg
;
3517 struct iwpm_sa_data pm_msg
;
/* Only AF_INET remote addresses pass this check (failure action not visible). */
3520 if (cm_id
->remote_addr
.ss_family
!= AF_INET
)
/* Resolve QP -> nes_qp -> vnic -> device from the requested QP number. */
3522 ibqp
= nes_get_qp(cm_id
->device
, conn_param
->qpn
);
3525 nesqp
= to_nesqp(ibqp
);
3528 nesvnic
= to_nesvnic(nesqp
->ibqp
.device
);
3531 nesdev
= nesvnic
->nesdev
;
/* Both ports must be non-zero (failure action not visible). */
3535 if (!laddr
->sin_port
|| !raddr
->sin_port
)
3538 nes_debug(NES_DBG_CM
, "QP%u, current IP = 0x%08X, Destination IP = "
3539 "0x%08X:0x%04X, local = 0x%08X:0x%04X.\n", nesqp
->hwqp
.qp_id
,
3540 ntohl(nesvnic
->local_ipaddr
), ntohl(raddr
->sin_addr
.s_addr
),
3541 ntohs(raddr
->sin_port
), ntohl(laddr
->sin_addr
.s_addr
),
3542 ntohs(laddr
->sin_port
));
3544 atomic_inc(&cm_connects
);
/* Mark the QP as the active (connecting) side. */
3545 nesqp
->active_conn
= 1;
3547 /* cache the cm_id in the qp */
3548 nesqp
->cm_id
= cm_id
;
3549 cm_id
->provider_data
= nesqp
;
3550 nesqp
->private_data_len
= conn_param
->private_data_len
;
3552 nes_debug(NES_DBG_CM
, "requested ord = 0x%08X.\n", (u32
)conn_param
->ord
);
3553 nes_debug(NES_DBG_CM
, "mpa private data len =%u\n",
3554 conn_param
->private_data_len
);
3556 /* set up the connection params for the node */
/* cm_info holds addresses and ports converted to host byte order. */
3557 cm_info
.loc_addr
= ntohl(laddr
->sin_addr
.s_addr
);
3558 cm_info
.loc_port
= ntohs(laddr
->sin_port
);
3559 cm_info
.rem_addr
= ntohl(raddr
->sin_addr
.s_addr
);
3560 cm_info
.rem_port
= ntohs(raddr
->sin_port
);
3561 cm_info
.cm_id
= cm_id
;
3562 cm_info
.conn_type
= NES_CM_IWARP_CONN_TYPE
;
3564 /* No port mapper available, go with the specified peer information */
/* Defaults: mapped values start out identical to the unmapped ones. */
3565 cm_info
.mapped_loc_addr
= cm_info
.loc_addr
;
3566 cm_info
.mapped_loc_port
= cm_info
.loc_port
;
3567 cm_info
.mapped_rem_addr
= cm_info
.rem_addr
;
3568 cm_info
.mapped_rem_port
= cm_info
.rem_port
;
/* Register with the port mapper; the result is kept in iwpm_err. */
3570 nes_form_reg_msg(nesvnic
, &pm_reg_msg
);
3571 iwpm_err
= iwpm_register_pid(&pm_reg_msg
, RDMA_NL_NES
);
3573 nes_debug(NES_DBG_NLMSG
,
3574 "Port Mapper reg pid fail (err = %d).\n", iwpm_err
);
/* Query a mapping only when the port mapper pid is valid and registration succeeded. */
3576 if (iwpm_valid_pid() && !iwpm_err
) {
3577 nes_form_pm_msg(&cm_info
, &pm_msg
);
3578 iwpm_err
= iwpm_add_and_query_mapping(&pm_msg
, RDMA_NL_NES
);
3580 nes_debug(NES_DBG_NLMSG
,
3581 "Port Mapper query fail (err = %d).\n", iwpm_err
);
3583 nes_record_pm_msg(&cm_info
, &pm_msg
);
/* The mapped local port is added via nes_manage_apbvt() only when local and remote addresses differ. */
3586 if (laddr
->sin_addr
.s_addr
!= raddr
->sin_addr
.s_addr
) {
3587 nes_manage_apbvt(nesvnic
, cm_info
.mapped_loc_port
,
3588 PCI_FUNC(nesdev
->pcidev
->devfn
), NES_MANAGE_APBVT_ADD
);
3592 if (nes_create_mapinfo(&cm_info
))
/* Reference on cm_id taken before the connect call; released in the cleanup below. */
3595 cm_id
->add_ref(cm_id
);
3597 /* create a connect CM node connection */
3598 cm_node
= g_cm_core
->api
->connect(g_cm_core
, nesvnic
,
3599 conn_param
->private_data_len
, (void *)conn_param
->private_data
,
/*
 * Cleanup sequence: remove the APBVT entry and the map info, drop the
 * cm_id reference.
 * NOTE(review): the condition selecting this path (presumably a failed
 * connect()) is not visible in this extract.
 */
3603 nes_manage_apbvt(nesvnic
, cm_info
.mapped_loc_port
,
3604 PCI_FUNC(nesdev
->pcidev
->devfn
),
3605 NES_MANAGE_APBVT_DEL
);
3607 nes_debug(NES_DBG_NLMSG
, "Delete mapped_loc_port = %04X\n",
3608 cm_info
.mapped_loc_port
);
3609 nes_remove_mapinfo(cm_info
.loc_addr
, cm_info
.loc_port
,
3610 cm_info
.mapped_loc_addr
, cm_info
.mapped_loc_port
);
3611 cm_id
->rem_ref(cm_id
);
3615 record_ird_ord(cm_node
, (u16
)conn_param
->ird
, (u16
)conn_param
->ord
);
/* When the zero-length RDMA read is selected as the first op, ord_size is raised from 0 to 1. */
3616 if (cm_node
->send_rdma0_op
== SEND_RDMA_READ_ZERO
&&
3617 cm_node
->ord_size
== 0)
3618 cm_node
->ord_size
= 1;
3620 cm_node
->apbvt_set
= apbvt_set
;
3621 cm_node
->tos
= cm_id
->tos
;
/* Cross-link node and QP, then take a reference on the QP. */
3622 nesqp
->cm_node
= cm_node
;
3623 cm_node
->nesqp
= nesqp
;
3624 nes_add_ref(&nesqp
->ibqp
);
/*
 * nes_create_listen - create a CM listener for @cm_id.
 * @cm_id:   iw_cm_id carrying the local address to listen on
 * @backlog: backlog value passed through to the CM core in cm_info
 *
 * Builds a nes_cm_info from the vnic's local IP address and the port in
 * cm_id->local_addr, calls g_cm_core->api->listen(), stores the returned
 * listener in cm_id->provider_data and, for a listener that is not a
 * reused one, creates the map info and adds the port via nes_manage_apbvt().
 *
 * Note that the local variable named cm_node is a struct nes_cm_listener *.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * err, the bodies of the error checks and the return statements).
 */
3633 int nes_create_listen(struct iw_cm_id
*cm_id
, int backlog
)
3635 struct nes_vnic
*nesvnic
;
3636 struct nes_cm_listener
*cm_node
;
3637 struct nes_cm_info cm_info
;
3639 struct sockaddr_in
*laddr
= (struct sockaddr_in
*)&cm_id
->local_addr
;
3641 nes_debug(NES_DBG_CM
, "cm_id = %p, local port = 0x%04X.\n",
3642 cm_id
, ntohs(laddr
->sin_port
));
/* Only AF_INET local addresses pass this check (failure action not visible). */
3644 if (cm_id
->local_addr
.ss_family
!= AF_INET
)
3646 nesvnic
= to_nesvnic(cm_id
->device
);
3650 nes_debug(NES_DBG_CM
, "nesvnic=%p, netdev=%p, %s\n",
3651 nesvnic
, nesvnic
->netdev
, nesvnic
->netdev
->name
);
3653 nes_debug(NES_DBG_CM
, "nesvnic->local_ipaddr=0x%08x, sin_addr.s_addr=0x%08x\n",
3654 nesvnic
->local_ipaddr
, laddr
->sin_addr
.s_addr
);
3656 /* setup listen params in our api call struct */
/* The listen address comes from the vnic, not from laddr; only the port is taken from laddr. */
3657 cm_info
.loc_addr
= ntohl(nesvnic
->local_ipaddr
);
3658 cm_info
.loc_port
= ntohs(laddr
->sin_port
);
3659 cm_info
.backlog
= backlog
;
3660 cm_info
.cm_id
= cm_id
;
3662 cm_info
.conn_type
= NES_CM_IWARP_CONN_TYPE
;
3664 /* No port mapper available, go with the specified info */
3665 cm_info
.mapped_loc_addr
= cm_info
.loc_addr
;
3666 cm_info
.mapped_loc_port
= cm_info
.loc_port
;
3668 cm_node
= g_cm_core
->api
->listen(g_cm_core
, nesvnic
, &cm_info
);
/* NOTE(review): the check that guards this error message is not visible. */
3670 printk(KERN_ERR
"%s[%u] Error returned from listen API call\n",
3671 __func__
, __LINE__
);
3675 cm_id
->provider_data
= cm_node
;
3676 cm_node
->tos
= cm_id
->tos
;
/* Map info and APBVT entry are set up only for a listener that was not reused. */
3678 if (!cm_node
->reused_node
) {
3679 if (nes_create_mapinfo(&cm_info
))
3682 err
= nes_manage_apbvt(nesvnic
, cm_node
->mapped_loc_port
,
3683 PCI_FUNC(nesvnic
->nesdev
->pcidev
->devfn
),
3684 NES_MANAGE_APBVT_ADD
);
/* Error path: report and stop the listener (the condition on err is not visible). */
3686 printk(KERN_ERR
"nes_manage_apbvt call returned %d.\n",
3688 g_cm_core
->api
->stop_listener(g_cm_core
, (void *)cm_node
);
3691 atomic_inc(&cm_listens_created
);
3694 cm_id
->add_ref(cm_id
);
/* NOTE(review): provider_data was already set to cm_node above; this second store looks redundant. */
3695 cm_id
->provider_data
= (void *)cm_node
;
3703 * nes_destroy_listen
/*
 * nes_destroy_listen - stop the listener attached to @cm_id.
 * @cm_id: iw_cm_id whose provider_data holds the listener
 *
 * Passes cm_id->provider_data to g_cm_core->api->stop_listener() when it
 * is non-NULL, logs a debug message about the NULL case, and drops a
 * reference on @cm_id.
 *
 * NOTE(review): braces, the `else` and the return statement are not
 * visible in this extract.
 */
3705 int nes_destroy_listen(struct iw_cm_id
*cm_id
)
3707 if (cm_id
->provider_data
)
3708 g_cm_core
->api
->stop_listener(g_cm_core
, cm_id
->provider_data
);
3710 nes_debug(NES_DBG_CM
, "cm_id->provider_data was NULL\n");
/* The cm_id reference is dropped after the listener handling above. */
3712 cm_id
->rem_ref(cm_id
);
/*
 * nes_cm_recv - pass a received packet to the CM core.
 * @skb:       received packet
 * @netdevice: net device the packet arrived on; its netdev_priv() data is
 *             handed to the CM core
 *
 * Counts the packet in cm_packets_received and, when both g_cm_core and
 * its api table are set, stores the result of recv_pkt() in rc.
 *
 * NOTE(review): the declaration of rc, the `else` before the debug message
 * and the return statement are not visible in this extract.
 */
3721 int nes_cm_recv(struct sk_buff
*skb
, struct net_device
*netdevice
)
3725 cm_packets_received
++;
/* Guard against the CM core (or its callback table) not being set up. */
3726 if ((g_cm_core
) && (g_cm_core
->api
))
3727 rc
= g_cm_core
->api
->recv_pkt(g_cm_core
, netdev_priv(netdevice
), skb
);
3729 nes_debug(NES_DBG_CM
, "Unable to process packet for CM,"
3730 " cm is not setup properly.\n");
3738 * Start and init a cm core module
/*
 * nes_cm_start - allocate the global CM core.
 *
 * Stores the result of nes_cm_alloc_core() in g_cm_core.
 * NOTE(review): the handling of an allocation failure and the return
 * value are not visible in this extract.
 */
3740 int nes_cm_start(void)
3742 nes_debug(NES_DBG_CM
, "\n");
3743 /* create the primary CM core, pass this handle to subsequent core inits */
3744 g_cm_core
= nes_cm_alloc_core();
3754 * stop and dealloc all cm core instances
/*
 * nes_cm_stop - tear down the global CM core through its destroy_cm_core()
 * callback.
 *
 * NOTE(review): g_cm_core is dereferenced without a NULL check here,
 * unlike nes_cm_recv(); confirm callers only reach this after a successful
 * nes_cm_start(). The return statement is not visible in this extract.
 */
3756 int nes_cm_stop(void)
3758 g_cm_core
->api
->destroy_cm_core(g_cm_core
);
3764 * cm_event_connected
3765 * handle a connected event, setup QPs and HW
/*
 * cm_event_connected - handle a CONNECTED event for an active-side node.
 * @event: CM event whose cm_node has completed connection setup
 *
 * Programs the QP context (ports, peer address, ARP index, timestamp
 * delta, IRD/ORD), builds the first RDMA message, rings the WQE allocation
 * register, computes the hash-table index from a CRC over the connection
 * quad, marks the node accelerated, delivers IW_CM_EVENT_CONNECT_REPLY to
 * the cm_id's event handler and finally moves the QP to IB_QPS_RTS.
 *
 * NOTE(review): this extract is missing lines (braces, declarations of
 * crc_value and ret, the action taken when the QP is destroyed, and the
 * condition around the printk error report).
 */
3767 static void cm_event_connected(struct nes_cm_event
*event
)
3769 struct nes_qp
*nesqp
;
3770 struct nes_vnic
*nesvnic
;
3771 struct nes_device
*nesdev
;
3772 struct nes_cm_node
*cm_node
;
3773 struct nes_adapter
*nesadapter
;
3774 struct ib_qp_attr attr
;
3775 struct iw_cm_id
*cm_id
;
3776 struct iw_cm_event cm_event
;
3777 struct nes_v4_quad nes_quad
;
3780 struct sockaddr_in
*laddr
;
3781 struct sockaddr_in
*raddr
;
3782 struct sockaddr_in
*cm_event_laddr
;
3784 /* get all our handles */
3785 cm_node
= event
->cm_node
;
3786 cm_id
= cm_node
->cm_id
;
3787 nes_debug(NES_DBG_CM
, "cm_event_connected - %p - cm_id = %p\n", cm_node
, cm_id
);
3788 nesqp
= (struct nes_qp
*)cm_id
->provider_data
;
3789 nesvnic
= to_nesvnic(nesqp
->ibqp
.device
);
3790 nesdev
= nesvnic
->nesdev
;
3791 nesadapter
= nesdev
->nesadapter
;
3792 laddr
= (struct sockaddr_in
*)&cm_id
->local_addr
;
3793 raddr
= (struct sockaddr_in
*)&cm_id
->remote_addr
;
/* cm_event_laddr aliases the local_addr field of the on-stack cm_event. */
3794 cm_event_laddr
= (struct sockaddr_in
*)&cm_event
.local_addr
;
/* Destroyed QPs are special-cased (the action taken is not visible). */
3796 if (nesqp
->destroyed
)
3798 atomic_inc(&cm_connecteds
);
3799 nes_debug(NES_DBG_CM
, "QP%u attempting to connect to 0x%08X:0x%04X on"
3800 " local port 0x%04X. jiffies = %lu.\n",
3801 nesqp
->hwqp
.qp_id
, ntohl(raddr
->sin_addr
.s_addr
),
3802 ntohs(raddr
->sin_port
), ntohs(laddr
->sin_port
), jiffies
);
3804 nes_cm_init_tsa_conn(nesqp
, cm_node
);
3806 /* set the QP tsa context */
/* Context fields are stored little-endian; mapped ports/address are used. */
3807 nesqp
->nesqp_context
->tcpPorts
[0] =
3808 cpu_to_le16(cm_node
->mapped_loc_port
);
3809 nesqp
->nesqp_context
->tcpPorts
[1] =
3810 cpu_to_le16(cm_node
->mapped_rem_port
);
3811 nesqp
->nesqp_context
->ip0
= cpu_to_le32(cm_node
->mapped_rem_addr
);
/* The PCI function number is OR-ed into misc2 at the SRC_IP shift. */
3813 nesqp
->nesqp_context
->misc2
|= cpu_to_le32(
3814 (u32
)PCI_FUNC(nesdev
->pcidev
->devfn
) <<
3815 NES_QPCONTEXT_MISC2_SRC_IP_SHIFT
);
/* ARP table index for the peer address goes in the upper 16 bits. */
3816 nesqp
->nesqp_context
->arp_index_vlan
|= cpu_to_le32(
3817 nes_arp_table(nesdev
,
3818 le32_to_cpu(nesqp
->nesqp_context
->ip0
),
3819 NULL
, NES_ARP_RESOLVE
) << 16);
/* Difference between jiffies and the value read from NES_IDX_TCP_NOW. */
3820 nesqp
->nesqp_context
->ts_val_delta
= cpu_to_le32(
3821 jiffies
- nes_read_indexed(nesdev
, NES_IDX_TCP_NOW
));
3822 nesqp
->nesqp_context
->ird_index
= cpu_to_le32(nesqp
->hwqp
.qp_id
);
3823 nesqp
->nesqp_context
->ird_ord_sizes
|=
3824 cpu_to_le32((u32
)1 <<
3825 NES_QPCONTEXT_ORDIRD_IWARP_MODE_SHIFT
);
3826 nesqp
->nesqp_context
->ird_ord_sizes
|=
3827 cpu_to_le32((u32
)cm_node
->ord_size
);
3829 /* Adjust tail for not having a LSMM */
3830 /*nesqp->hwqp.sq_tail = 1;*/
3832 build_rdma0_msg(cm_node
, &nesqp
);
/* Write to the WQE allocation register, with the QP id in the low bits. */
3834 nes_write32(nesdev
->regs
+ NES_WQE_ALLOC
,
3835 (1 << 24) | 0x00800000 | nesqp
->hwqp
.qp_id
);
/* Build the connection quad (network byte order) that feeds the CRC. */
3837 memset(&nes_quad
, 0, sizeof(nes_quad
));
3839 nes_quad
.DstIpAdrIndex
=
3840 cpu_to_le32((u32
)PCI_FUNC(nesdev
->pcidev
->devfn
) << 24);
3841 nes_quad
.SrcIpadr
= htonl(cm_node
->mapped_rem_addr
);
3842 nes_quad
.TcpPorts
[0] = htons(cm_node
->mapped_rem_port
);
3843 nes_quad
.TcpPorts
[1] = htons(cm_node
->mapped_loc_port
);
3845 /* Produce hash key */
/* Index = byte-swapped inverted CRC, masked by the adapter's index mask. */
3846 crc_value
= get_crc_value(&nes_quad
);
3847 nesqp
->hte_index
= cpu_to_be32(crc_value
^ 0xffffffff);
3848 nes_debug(NES_DBG_CM
, "HTE Index = 0x%08X, After CRC = 0x%08X\n",
3849 nesqp
->hte_index
, nesqp
->hte_index
& nesadapter
->hte_index_mask
);
3851 nesqp
->hte_index
&= nesadapter
->hte_index_mask
;
3852 nesqp
->nesqp_context
->hte_index
= cpu_to_le32(nesqp
->hte_index
);
3854 nesqp
->ietf_frame
= &cm_node
->mpa_frame
;
/* NOTE(review): mpa_frame_size is narrowed to u8 here - confirm it cannot exceed 255. */
3855 nesqp
->private_data_len
= (u8
)cm_node
->mpa_frame_size
;
3856 cm_node
->cm_core
->api
->accelerated(cm_node
->cm_core
, cm_node
);
3858 /* notify OF layer we successfully created the requested connection */
3859 cm_event
.event
= IW_CM_EVENT_CONNECT_REPLY
;
3860 cm_event
.status
= 0;
3861 cm_event
.provider_data
= cm_id
->provider_data
;
3862 cm_event_laddr
->sin_family
= AF_INET
;
3863 cm_event_laddr
->sin_port
= laddr
->sin_port
;
3864 cm_event
.remote_addr
= cm_id
->remote_addr
;
3866 cm_event
.private_data
= (void *)event
->cm_node
->mpa_frame_buf
;
3867 cm_event
.private_data_len
= (u8
)event
->cm_node
->mpa_frame_size
;
3868 cm_event
.ird
= cm_node
->ird_size
;
3869 cm_event
.ord
= cm_node
->ord_size
;
/*
 * NOTE(review): the event's *local* address is filled from
 * cm_info.rem_addr - verify this is intentional.
 */
3871 cm_event_laddr
->sin_addr
.s_addr
= htonl(event
->cm_info
.rem_addr
);
3872 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3873 nes_debug(NES_DBG_CM
, "OFA CM event_handler returned, ret=%d\n", ret
);
3876 printk(KERN_ERR
"%s[%u] OFA CM event_handler returned, "
3877 "ret=%d\n", __func__
, __LINE__
, ret
);
/* Move the QP to RTS after the upper layer has been notified. */
3878 attr
.qp_state
= IB_QPS_RTS
;
3879 nes_modify_qp(&nesqp
->ibqp
, &attr
, IB_QP_STATE
, NULL
);
3881 nes_debug(NES_DBG_CM
, "Exiting connect thread for QP%u. jiffies = "
3882 "%lu\n", nesqp
->hwqp
.qp_id
, jiffies
);
3889 * cm_event_connect_error
/*
 * cm_event_connect_error - report a failed connection attempt upward.
 * @event: CM event for the node whose connect failed
 *
 * Detaches the QP and the cm_id from each other, delivers an
 * IW_CM_EVENT_CONNECT_REPLY with status -ECONNRESET to the cm_id's event
 * handler, then drops a cm_id reference and a cm_node reference.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * ret, the bodies of the NULL checks, the #endif and the condition around
 * the printk error report).
 */
3891 static void cm_event_connect_error(struct nes_cm_event
*event
)
3893 struct nes_qp
*nesqp
;
3894 struct iw_cm_id
*cm_id
;
3895 struct iw_cm_event cm_event
;
3896 /* struct nes_cm_info cm_info; */
/* An event without a node is special-cased (action not visible). */
3899 if (!event
->cm_node
)
3902 cm_id
= event
->cm_node
->cm_id
;
3906 nes_debug(NES_DBG_CM
, "cm_node=%p, cm_id=%p\n", event
->cm_node
, cm_id
);
3907 nesqp
= cm_id
->provider_data
;
3912 /* notify OF layer about this connection error event */
3913 /* cm_id->rem_ref(cm_id); */
3914 nesqp
->cm_id
= NULL
;
3915 cm_id
->provider_data
= NULL
;
3916 cm_event
.event
= IW_CM_EVENT_CONNECT_REPLY
;
3917 cm_event
.status
= -ECONNRESET
;
/* provider_data was set to NULL just above, so the event carries NULL here. */
3918 cm_event
.provider_data
= cm_id
->provider_data
;
3919 cm_event
.local_addr
= cm_id
->local_addr
;
3920 cm_event
.remote_addr
= cm_id
->remote_addr
;
3921 cm_event
.private_data
= NULL
;
3922 cm_event
.private_data_len
= 0;
/* Debug-only logging of the addresses carried in the event. */
3924 #ifdef CONFIG_INFINIBAND_NES_DEBUG
3926 struct sockaddr_in
*cm_event_laddr
= (struct sockaddr_in
*)
3927 &cm_event
.local_addr
;
3928 struct sockaddr_in
*cm_event_raddr
= (struct sockaddr_in
*)
3929 &cm_event
.remote_addr
;
3930 nes_debug(NES_DBG_CM
, "call CM_EVENT REJECTED, local_addr=%08x, remote_addr=%08x\n",
3931 cm_event_laddr
->sin_addr
.s_addr
, cm_event_raddr
->sin_addr
.s_addr
);
3935 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3936 nes_debug(NES_DBG_CM
, "OFA CM event_handler returned, ret=%d\n", ret
);
3938 printk(KERN_ERR
"%s[%u] OFA CM event_handler returned, "
3939 "ret=%d\n", __func__
, __LINE__
, ret
);
/* Release the cm_id reference, then the node reference. */
3940 cm_id
->rem_ref(cm_id
);
3942 rem_ref_cm_node(event
->cm_node
->cm_core
, event
->cm_node
);
/*
 * cm_event_reset - report a connection reset upward.
 * @event: CM event for the node that was reset
 *
 * Clears the QP's cached cm_id and delivers two events to the cm_id's
 * event handler in sequence: IW_CM_EVENT_DISCONNECT with status
 * -ECONNRESET, then IW_CM_EVENT_CLOSE with status 0. A cm_id reference is
 * taken before the first delivery and dropped at the end.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * ret and the bodies of the NULL checks).
 */
3950 static void cm_event_reset(struct nes_cm_event
*event
)
3952 struct nes_qp
*nesqp
;
3953 struct iw_cm_id
*cm_id
;
3954 struct iw_cm_event cm_event
;
3955 /* struct nes_cm_info cm_info; */
/* Events without a node or without a cm_id are special-cased (actions not visible). */
3958 if (!event
->cm_node
)
3961 if (!event
->cm_node
->cm_id
)
3964 cm_id
= event
->cm_node
->cm_id
;
3966 nes_debug(NES_DBG_CM
, "%p - cm_id = %p\n", event
->cm_node
, cm_id
);
3967 nesqp
= cm_id
->provider_data
;
3971 nesqp
->cm_id
= NULL
;
3972 /* cm_id->provider_data = NULL; */
/* First event: DISCONNECT carrying -ECONNRESET. */
3973 cm_event
.event
= IW_CM_EVENT_DISCONNECT
;
3974 cm_event
.status
= -ECONNRESET
;
3975 cm_event
.provider_data
= cm_id
->provider_data
;
3976 cm_event
.local_addr
= cm_id
->local_addr
;
3977 cm_event
.remote_addr
= cm_id
->remote_addr
;
3978 cm_event
.private_data
= NULL
;
3979 cm_event
.private_data_len
= 0;
/* Reference on cm_id taken before the first delivery; dropped by the rem_ref() at the end. */
3981 cm_id
->add_ref(cm_id
);
/* The return value stored here is overwritten by the second delivery below. */
3982 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3983 atomic_inc(&cm_closes
);
/* Second event: CLOSE with status 0, same addresses. */
3984 cm_event
.event
= IW_CM_EVENT_CLOSE
;
3985 cm_event
.status
= 0;
3986 cm_event
.provider_data
= cm_id
->provider_data
;
3987 cm_event
.local_addr
= cm_id
->local_addr
;
3988 cm_event
.remote_addr
= cm_id
->remote_addr
;
3989 cm_event
.private_data
= NULL
;
3990 cm_event
.private_data_len
= 0;
3991 nes_debug(NES_DBG_CM
, "NODE %p Generating CLOSE\n", event
->cm_node
);
3992 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
3994 nes_debug(NES_DBG_CM
, "OFA CM event_handler returned, ret=%d\n", ret
);
3997 /* notify OF layer about this connection error event */
3998 cm_id
->rem_ref(cm_id
);
/*
 * cm_event_mpa_req - deliver an incoming MPA request to the upper layer.
 * @event: CM event carrying the node and its address information
 *
 * Builds an IW_CM_EVENT_CONNECT_REQUEST whose provider_data is the
 * cm_node, whose addresses come from event->cm_info (converted to network
 * byte order) and whose private data is the node's MPA frame buffer, then
 * calls the cm_id's event handler.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * ret, any NULL checks, the `else` between the two ird/ord assignments and
 * the condition around the printk error report).
 */
4007 static void cm_event_mpa_req(struct nes_cm_event
*event
)
4009 struct iw_cm_id
*cm_id
;
4010 struct iw_cm_event cm_event
;
4012 struct nes_cm_node
*cm_node
;
/* Both pointers alias address fields inside the on-stack cm_event. */
4013 struct sockaddr_in
*cm_event_laddr
= (struct sockaddr_in
*)
4014 &cm_event
.local_addr
;
4015 struct sockaddr_in
*cm_event_raddr
= (struct sockaddr_in
*)
4016 &cm_event
.remote_addr
;
4018 cm_node
= event
->cm_node
;
4021 cm_id
= cm_node
->cm_id
;
4023 atomic_inc(&cm_connect_reqs
);
4024 nes_debug(NES_DBG_CM
, "cm_node = %p - cm_id = %p, jiffies = %lu\n",
4025 cm_node
, cm_id
, jiffies
);
4027 cm_event
.event
= IW_CM_EVENT_CONNECT_REQUEST
;
4028 cm_event
.status
= 0;
4029 cm_event
.provider_data
= (void *)cm_node
;
/* cm_info values are converted to network byte order for the sockaddr fields. */
4031 cm_event_laddr
->sin_family
= AF_INET
;
4032 cm_event_laddr
->sin_port
= htons(event
->cm_info
.loc_port
);
4033 cm_event_laddr
->sin_addr
.s_addr
= htonl(event
->cm_info
.loc_addr
);
4035 cm_event_raddr
->sin_family
= AF_INET
;
4036 cm_event_raddr
->sin_port
= htons(event
->cm_info
.rem_port
);
4037 cm_event_raddr
->sin_addr
.s_addr
= htonl(event
->cm_info
.rem_addr
);
4038 cm_event
.private_data
= cm_node
->mpa_frame_buf
;
4039 cm_event
.private_data_len
= (u8
)cm_node
->mpa_frame_size
;
/* For an MPA v1 frame the event advertises the NES_MAX_IRD/NES_MAX_ORD limits. */
4040 if (cm_node
->mpa_frame_rev
== IETF_MPA_V1
) {
4041 cm_event
.ird
= NES_MAX_IRD
;
4042 cm_event
.ord
= NES_MAX_ORD
;
/* Otherwise the node's own ird/ord sizes are reported (presumably the else branch - confirm). */
4044 cm_event
.ird
= cm_node
->ird_size
;
4045 cm_event
.ord
= cm_node
->ord_size
;
4048 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
4050 printk(KERN_ERR
"%s[%u] OFA CM event_handler returned, ret=%d\n",
4051 __func__
, __LINE__
, ret
);
/*
 * cm_event_mpa_reject - tell the upper layer that the peer rejected us.
 * @event: CM event carrying the node and its address information
 *
 * Builds an IW_CM_EVENT_CONNECT_REPLY with status -ECONNREFUSED, fills the
 * addresses from event->cm_info (converted to network byte order), attaches
 * the node's MPA frame buffer as private data and calls the cm_id's event
 * handler.
 *
 * NOTE(review): this extract is missing lines (braces, the declaration of
 * ret, any NULL checks and the condition around the printk error report).
 */
4056 static void cm_event_mpa_reject(struct nes_cm_event
*event
)
4058 struct iw_cm_id
*cm_id
;
4059 struct iw_cm_event cm_event
;
4060 struct nes_cm_node
*cm_node
;
/* Both pointers alias address fields inside the on-stack cm_event. */
4062 struct sockaddr_in
*cm_event_laddr
= (struct sockaddr_in
*)
4063 &cm_event
.local_addr
;
4064 struct sockaddr_in
*cm_event_raddr
= (struct sockaddr_in
*)
4065 &cm_event
.remote_addr
;
4067 cm_node
= event
->cm_node
;
4070 cm_id
= cm_node
->cm_id
;
/*
 * NOTE(review): this bumps cm_connect_reqs, the same counter
 * cm_event_mpa_req() uses - verify a reject is meant to be counted there.
 */
4072 atomic_inc(&cm_connect_reqs
);
4073 nes_debug(NES_DBG_CM
, "cm_node = %p - cm_id = %p, jiffies = %lu\n",
4074 cm_node
, cm_id
, jiffies
);
4076 cm_event
.event
= IW_CM_EVENT_CONNECT_REPLY
;
4077 cm_event
.status
= -ECONNREFUSED
;
4078 cm_event
.provider_data
= cm_id
->provider_data
;
4080 cm_event_laddr
->sin_family
= AF_INET
;
4081 cm_event_laddr
->sin_port
= htons(event
->cm_info
.loc_port
);
4082 cm_event_laddr
->sin_addr
.s_addr
= htonl(event
->cm_info
.loc_addr
);
4084 cm_event_raddr
->sin_family
= AF_INET
;
4085 cm_event_raddr
->sin_port
= htons(event
->cm_info
.rem_port
);
4086 cm_event_raddr
->sin_addr
.s_addr
= htonl(event
->cm_info
.rem_addr
);
4088 cm_event
.private_data
= cm_node
->mpa_frame_buf
;
4089 cm_event
.private_data_len
= (u8
)cm_node
->mpa_frame_size
;
/* NOTE(review): the log text below says "remove_addr"; likely a typo for "remote_addr". */
4091 nes_debug(NES_DBG_CM
, "call CM_EVENT_MPA_REJECTED, local_addr=%08x, "
4092 "remove_addr=%08x\n",
4093 cm_event_laddr
->sin_addr
.s_addr
,
4094 cm_event_raddr
->sin_addr
.s_addr
);
4096 ret
= cm_id
->event_handler(cm_id
, &cm_event
);
4098 printk(KERN_ERR
"%s[%u] OFA CM event_handler returned, ret=%d\n",
4099 __func__
, __LINE__
, ret
);
/* Forward declaration: nes_cm_post_event() names this work function before its definition. */
4105 static void nes_cm_event_handler(struct work_struct
*);
4109 * post an event to the cm event handler
/*
 * nes_cm_post_event - queue a CM event for deferred handling.
 * @event: event to post; its cm_node and cm_info.cm_id are dereferenced here
 *
 * Increments the core's events_posted counter, takes a reference on the
 * cm_node and on cm_info.cm_id, initialises the embedded work item with
 * nes_cm_event_handler and queues it on the core's event workqueue.
 *
 * NOTE(review): braces and the return statement are not visible in this
 * extract.
 */
4111 static int nes_cm_post_event(struct nes_cm_event
*event
)
4113 atomic_inc(&event
->cm_node
->cm_core
->events_posted
);
/* References taken here are dropped by nes_cm_event_handler() via rem_ref()/rem_ref_cm_node(). */
4114 add_ref_cm_node(event
->cm_node
);
4115 event
->cm_info
.cm_id
->add_ref(event
->cm_info
.cm_id
);
4116 INIT_WORK(&event
->event_work
, nes_cm_event_handler
);
4117 nes_debug(NES_DBG_CM
, "cm_node=%p queue_work, event=%p\n",
4118 event
->cm_node
, event
);
4120 queue_work(event
->cm_node
->cm_core
->event_wq
, &event
->event_work
);
4122 nes_debug(NES_DBG_CM
, "Exit\n");
4128 * nes_cm_event_handler
4129 * worker function to handle cm events
4130 * will free instance of nes_cm_event
4132 static void nes_cm_event_handler(struct work_struct
*work
)
4134 struct nes_cm_event
*event
= container_of(work
, struct nes_cm_event
,
4136 struct nes_cm_core
*cm_core
;
4138 if ((!event
) || (!event
->cm_node
) || (!event
->cm_node
->cm_core
))
4141 cm_core
= event
->cm_node
->cm_core
;
4142 nes_debug(NES_DBG_CM
, "event=%p, event->type=%u, events posted=%u\n",
4143 event
, event
->type
, atomic_read(&cm_core
->events_posted
));
4145 switch (event
->type
) {
4146 case NES_CM_EVENT_MPA_REQ
:
4147 cm_event_mpa_req(event
);
4148 nes_debug(NES_DBG_CM
, "cm_node=%p CM Event: MPA REQUEST\n",
4151 case NES_CM_EVENT_RESET
:
4152 nes_debug(NES_DBG_CM
, "cm_node = %p CM Event: RESET\n",
4154 cm_event_reset(event
);
4156 case NES_CM_EVENT_CONNECTED
:
4157 if ((!event
->cm_node
->cm_id
) ||
4158 (event
->cm_node
->state
!= NES_CM_STATE_TSA
))
4160 cm_event_connected(event
);
4161 nes_debug(NES_DBG_CM
, "CM Event: CONNECTED\n");
4163 case NES_CM_EVENT_MPA_REJECT
:
4164 if ((!event
->cm_node
->cm_id
) ||
4165 (event
->cm_node
->state
== NES_CM_STATE_TSA
))
4167 cm_event_mpa_reject(event
);
4168 nes_debug(NES_DBG_CM
, "CM Event: REJECT\n");
4171 case NES_CM_EVENT_ABORTED
:
4172 if ((!event
->cm_node
->cm_id
) ||
4173 (event
->cm_node
->state
== NES_CM_STATE_TSA
))
4175 cm_event_connect_error(event
);
4176 nes_debug(NES_DBG_CM
, "CM Event: ABORTED\n");
4178 case NES_CM_EVENT_DROPPED_PKT
:
4179 nes_debug(NES_DBG_CM
, "CM Event: DROPPED PKT\n");
4182 nes_debug(NES_DBG_CM
, "CM Event: UNKNOWN EVENT TYPE\n");
4186 atomic_dec(&cm_core
->events_posted
);
4187 event
->cm_info
.cm_id
->rem_ref(event
->cm_info
.cm_id
);
4188 rem_ref_cm_node(cm_core
, event
->cm_node
);