1 /*******************************************************************************
3 * Copyright (c) 2015-2016 Intel Corporation. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenFabrics.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
33 *******************************************************************************/
35 #include <linux/atomic.h>
37 #include <linux/tcp.h>
38 #include <linux/init.h>
39 #include <linux/if_arp.h>
40 #include <linux/if_vlan.h>
41 #include <linux/notifier.h>
42 #include <linux/net.h>
43 #include <linux/types.h>
44 #include <linux/timer.h>
45 #include <linux/time.h>
46 #include <linux/delay.h>
47 #include <linux/etherdevice.h>
48 #include <linux/netdevice.h>
49 #include <linux/random.h>
50 #include <linux/list.h>
51 #include <linux/threads.h>
52 #include <linux/highmem.h>
54 #include <net/ndisc.h>
55 #include <net/neighbour.h>
56 #include <net/route.h>
57 #include <net/addrconf.h>
58 #include <net/ip6_route.h>
59 #include <net/ip_fib.h>
60 #include <net/secure_seq.h>
62 #include <asm/checksum.h>
/* Forward declarations of static helpers referenced ahead of their definitions. */
static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *cm_node);
static void i40iw_cm_post_event(struct i40iw_cm_event *event);
static void i40iw_disconnect_worker(struct work_struct *work);
71 * i40iw_free_sqbuf - put back puda buffer if refcount = 0
72 * @vsi: pointer to vsi structure
73 * @buf: puda buffer to free
75 void i40iw_free_sqbuf(struct i40iw_sc_vsi
*vsi
, void *bufp
)
77 struct i40iw_puda_buf
*buf
= (struct i40iw_puda_buf
*)bufp
;
78 struct i40iw_puda_rsrc
*ilq
= vsi
->ilq
;
80 if (!atomic_dec_return(&buf
->refcount
))
81 i40iw_puda_ret_bufpool(ilq
, buf
);
85 * i40iw_derive_hw_ird_setting - Calculate IRD
87 * @cm_ird: IRD of connection's node
89 * The ird from the connection is rounded to a supported HW
90 * setting (2,8,32,64) and then encoded for ird_size field of
93 static u8
i40iw_derive_hw_ird_setting(u16 cm_ird
)
97 /* ird_size field is encoded in qp_ctx */
98 switch (cm_ird
? roundup_pow_of_two(cm_ird
) : 0) {
99 case I40IW_HW_IRD_SETTING_64
:
100 encoded_ird_size
= 3;
102 case I40IW_HW_IRD_SETTING_32
:
103 case I40IW_HW_IRD_SETTING_16
:
104 encoded_ird_size
= 2;
106 case I40IW_HW_IRD_SETTING_8
:
107 case I40IW_HW_IRD_SETTING_4
:
108 encoded_ird_size
= 1;
110 case I40IW_HW_IRD_SETTING_2
:
112 encoded_ird_size
= 0;
115 return encoded_ird_size
;
119 * i40iw_record_ird_ord - Record IRD/ORD passed in
120 * @cm_node: connection's node
121 * @conn_ird: connection IRD
122 * @conn_ord: connection ORD
124 static void i40iw_record_ird_ord(struct i40iw_cm_node
*cm_node
, u32 conn_ird
,
127 if (conn_ird
> I40IW_MAX_IRD_SIZE
)
128 conn_ird
= I40IW_MAX_IRD_SIZE
;
130 if (conn_ord
> I40IW_MAX_ORD_SIZE
)
131 conn_ord
= I40IW_MAX_ORD_SIZE
;
132 else if (!conn_ord
&& cm_node
->send_rdma0_op
== SEND_RDMA_READ_ZERO
)
135 cm_node
->ird_size
= conn_ird
;
136 cm_node
->ord_size
= conn_ord
;
140 * i40iw_copy_ip_ntohl - change network to host ip
144 void i40iw_copy_ip_ntohl(u32
*dst
, __be32
*src
)
146 *dst
++ = ntohl(*src
++);
147 *dst
++ = ntohl(*src
++);
148 *dst
++ = ntohl(*src
++);
153 * i40iw_copy_ip_htonl - change host addr to network ip
155 * @src: host byte order
157 static inline void i40iw_copy_ip_htonl(__be32
*dst
, u32
*src
)
159 *dst
++ = htonl(*src
++);
160 *dst
++ = htonl(*src
++);
161 *dst
++ = htonl(*src
++);
166 * i40iw_fill_sockaddr4 - get addr info for passive connection
167 * @cm_node: connection's node
168 * @event: upper layer's cm event
170 static inline void i40iw_fill_sockaddr4(struct i40iw_cm_node
*cm_node
,
171 struct iw_cm_event
*event
)
173 struct sockaddr_in
*laddr
= (struct sockaddr_in
*)&event
->local_addr
;
174 struct sockaddr_in
*raddr
= (struct sockaddr_in
*)&event
->remote_addr
;
176 laddr
->sin_family
= AF_INET
;
177 raddr
->sin_family
= AF_INET
;
179 laddr
->sin_port
= htons(cm_node
->loc_port
);
180 raddr
->sin_port
= htons(cm_node
->rem_port
);
182 laddr
->sin_addr
.s_addr
= htonl(cm_node
->loc_addr
[0]);
183 raddr
->sin_addr
.s_addr
= htonl(cm_node
->rem_addr
[0]);
187 * i40iw_fill_sockaddr6 - get ipv6 addr info for passive side
188 * @cm_node: connection's node
189 * @event: upper layer's cm event
191 static inline void i40iw_fill_sockaddr6(struct i40iw_cm_node
*cm_node
,
192 struct iw_cm_event
*event
)
194 struct sockaddr_in6
*laddr6
= (struct sockaddr_in6
*)&event
->local_addr
;
195 struct sockaddr_in6
*raddr6
= (struct sockaddr_in6
*)&event
->remote_addr
;
197 laddr6
->sin6_family
= AF_INET6
;
198 raddr6
->sin6_family
= AF_INET6
;
200 laddr6
->sin6_port
= htons(cm_node
->loc_port
);
201 raddr6
->sin6_port
= htons(cm_node
->rem_port
);
203 i40iw_copy_ip_htonl(laddr6
->sin6_addr
.in6_u
.u6_addr32
,
205 i40iw_copy_ip_htonl(raddr6
->sin6_addr
.in6_u
.u6_addr32
,
210 * i40iw_get_addr_info
211 * @cm_node: contains ip/tcp info
212 * @cm_info: to get a copy of the cm_node ip/tcp info
214 static void i40iw_get_addr_info(struct i40iw_cm_node
*cm_node
,
215 struct i40iw_cm_info
*cm_info
)
217 cm_info
->ipv4
= cm_node
->ipv4
;
218 cm_info
->vlan_id
= cm_node
->vlan_id
;
219 memcpy(cm_info
->loc_addr
, cm_node
->loc_addr
, sizeof(cm_info
->loc_addr
));
220 memcpy(cm_info
->rem_addr
, cm_node
->rem_addr
, sizeof(cm_info
->rem_addr
));
221 cm_info
->loc_port
= cm_node
->loc_port
;
222 cm_info
->rem_port
= cm_node
->rem_port
;
223 cm_info
->user_pri
= cm_node
->user_pri
;
227 * i40iw_get_cmevent_info - for cm event upcall
228 * @cm_node: connection's node
229 * @cm_id: upper layers cm struct for the event
230 * @event: upper layer's cm event
232 static inline void i40iw_get_cmevent_info(struct i40iw_cm_node
*cm_node
,
233 struct iw_cm_id
*cm_id
,
234 struct iw_cm_event
*event
)
236 memcpy(&event
->local_addr
, &cm_id
->m_local_addr
,
237 sizeof(event
->local_addr
));
238 memcpy(&event
->remote_addr
, &cm_id
->m_remote_addr
,
239 sizeof(event
->remote_addr
));
241 event
->private_data
= (void *)cm_node
->pdata_buf
;
242 event
->private_data_len
= (u8
)cm_node
->pdata
.size
;
243 event
->ird
= cm_node
->ird_size
;
244 event
->ord
= cm_node
->ord_size
;
249 * i40iw_send_cm_event - upcall cm's event handler
250 * @cm_node: connection's node
251 * @cm_id: upper layer's cm info struct
252 * @type: Event type to indicate
253 * @status: status for the event type
255 static int i40iw_send_cm_event(struct i40iw_cm_node
*cm_node
,
256 struct iw_cm_id
*cm_id
,
257 enum iw_cm_event_type type
,
260 struct iw_cm_event event
;
262 memset(&event
, 0, sizeof(event
));
264 event
.status
= status
;
266 case IW_CM_EVENT_CONNECT_REQUEST
:
268 i40iw_fill_sockaddr4(cm_node
, &event
);
270 i40iw_fill_sockaddr6(cm_node
, &event
);
271 event
.provider_data
= (void *)cm_node
;
272 event
.private_data
= (void *)cm_node
->pdata_buf
;
273 event
.private_data_len
= (u8
)cm_node
->pdata
.size
;
274 event
.ird
= cm_node
->ird_size
;
276 case IW_CM_EVENT_CONNECT_REPLY
:
277 i40iw_get_cmevent_info(cm_node
, cm_id
, &event
);
279 case IW_CM_EVENT_ESTABLISHED
:
280 event
.ird
= cm_node
->ird_size
;
281 event
.ord
= cm_node
->ord_size
;
283 case IW_CM_EVENT_DISCONNECT
:
285 case IW_CM_EVENT_CLOSE
:
288 i40iw_pr_err("event type received type = %d\n", type
);
291 return cm_id
->event_handler(cm_id
, &event
);
295 * i40iw_create_event - create cm event
296 * @cm_node: connection's node
297 * @type: Event type to generate
299 static struct i40iw_cm_event
*i40iw_create_event(struct i40iw_cm_node
*cm_node
,
300 enum i40iw_cm_event_type type
)
302 struct i40iw_cm_event
*event
;
307 event
= kzalloc(sizeof(*event
), GFP_ATOMIC
);
313 event
->cm_node
= cm_node
;
314 memcpy(event
->cm_info
.rem_addr
, cm_node
->rem_addr
, sizeof(event
->cm_info
.rem_addr
));
315 memcpy(event
->cm_info
.loc_addr
, cm_node
->loc_addr
, sizeof(event
->cm_info
.loc_addr
));
316 event
->cm_info
.rem_port
= cm_node
->rem_port
;
317 event
->cm_info
.loc_port
= cm_node
->loc_port
;
318 event
->cm_info
.cm_id
= cm_node
->cm_id
;
320 i40iw_debug(cm_node
->dev
,
322 "node=%p event=%p type=%u dst=%pI4 src=%pI4\n",
326 event
->cm_info
.loc_addr
,
327 event
->cm_info
.rem_addr
);
329 i40iw_cm_post_event(event
);
334 * i40iw_free_retrans_entry - free send entry
335 * @cm_node: connection's node
337 static void i40iw_free_retrans_entry(struct i40iw_cm_node
*cm_node
)
339 struct i40iw_device
*iwdev
= cm_node
->iwdev
;
340 struct i40iw_timer_entry
*send_entry
;
342 send_entry
= cm_node
->send_entry
;
344 cm_node
->send_entry
= NULL
;
345 i40iw_free_sqbuf(&iwdev
->vsi
, (void *)send_entry
->sqbuf
);
347 atomic_dec(&cm_node
->ref_count
);
352 * i40iw_cleanup_retrans_entry - free send entry with lock
353 * @cm_node: connection's node
355 static void i40iw_cleanup_retrans_entry(struct i40iw_cm_node
*cm_node
)
359 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
360 i40iw_free_retrans_entry(cm_node
);
361 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
365 * i40iw_form_cm_frame - get a free packet and build frame
366 * @cm_node: connection's node info to use in frame
367 * @options: pointer to options info
368 * @hdr: pointer mpa header
369 * @pdata: pointer to private data
370 * @flags: indicates FIN or ACK
372 static struct i40iw_puda_buf
*i40iw_form_cm_frame(struct i40iw_cm_node
*cm_node
,
373 struct i40iw_kmem_info
*options
,
374 struct i40iw_kmem_info
*hdr
,
375 struct i40iw_kmem_info
*pdata
,
378 struct i40iw_puda_buf
*sqbuf
;
379 struct i40iw_sc_vsi
*vsi
= &cm_node
->iwdev
->vsi
;
384 struct ipv6hdr
*ip6h
;
387 u16 eth_hlen
= ETH_HLEN
;
393 sqbuf
= i40iw_puda_get_bufpool(vsi
->ilq
);
399 opts_len
= (u32
)options
->size
;
405 pd_len
= pdata
->size
;
407 if (cm_node
->vlan_id
<= VLAN_VID_MASK
)
411 packetsize
= sizeof(*iph
) + sizeof(*tcph
);
413 packetsize
= sizeof(*ip6h
) + sizeof(*tcph
);
414 packetsize
+= opts_len
+ hdr_len
+ pd_len
;
416 memset(buf
, 0x00, eth_hlen
+ packetsize
);
418 sqbuf
->totallen
= packetsize
+ eth_hlen
;
419 sqbuf
->maclen
= eth_hlen
;
420 sqbuf
->tcphlen
= sizeof(*tcph
) + opts_len
;
421 sqbuf
->scratch
= (void *)cm_node
;
423 ethh
= (struct ethhdr
*)buf
;
429 iph
= (struct iphdr
*)buf
;
431 tcph
= (struct tcphdr
*)buf
;
432 buf
+= sizeof(*tcph
);
434 ether_addr_copy(ethh
->h_dest
, cm_node
->rem_mac
);
435 ether_addr_copy(ethh
->h_source
, cm_node
->loc_mac
);
436 if (cm_node
->vlan_id
<= VLAN_VID_MASK
) {
437 ((struct vlan_ethhdr
*)ethh
)->h_vlan_proto
= htons(ETH_P_8021Q
);
438 vtag
= (cm_node
->user_pri
<< VLAN_PRIO_SHIFT
) | cm_node
->vlan_id
;
439 ((struct vlan_ethhdr
*)ethh
)->h_vlan_TCI
= htons(vtag
);
441 ((struct vlan_ethhdr
*)ethh
)->h_vlan_encapsulated_proto
= htons(ETH_P_IP
);
443 ethh
->h_proto
= htons(ETH_P_IP
);
446 iph
->version
= IPVERSION
;
447 iph
->ihl
= 5; /* 5 * 4Byte words, IP headr len */
448 iph
->tos
= cm_node
->tos
;
449 iph
->tot_len
= htons(packetsize
);
450 iph
->id
= htons(++cm_node
->tcp_cntxt
.loc_id
);
452 iph
->frag_off
= htons(0x4000);
454 iph
->protocol
= IPPROTO_TCP
;
455 iph
->saddr
= htonl(cm_node
->loc_addr
[0]);
456 iph
->daddr
= htonl(cm_node
->rem_addr
[0]);
459 ip6h
= (struct ipv6hdr
*)buf
;
460 buf
+= sizeof(*ip6h
);
461 tcph
= (struct tcphdr
*)buf
;
462 buf
+= sizeof(*tcph
);
464 ether_addr_copy(ethh
->h_dest
, cm_node
->rem_mac
);
465 ether_addr_copy(ethh
->h_source
, cm_node
->loc_mac
);
466 if (cm_node
->vlan_id
<= VLAN_VID_MASK
) {
467 ((struct vlan_ethhdr
*)ethh
)->h_vlan_proto
= htons(ETH_P_8021Q
);
468 vtag
= (cm_node
->user_pri
<< VLAN_PRIO_SHIFT
) | cm_node
->vlan_id
;
469 ((struct vlan_ethhdr
*)ethh
)->h_vlan_TCI
= htons(vtag
);
470 ((struct vlan_ethhdr
*)ethh
)->h_vlan_encapsulated_proto
= htons(ETH_P_IPV6
);
472 ethh
->h_proto
= htons(ETH_P_IPV6
);
475 ip6h
->priority
= cm_node
->tos
>> 4;
476 ip6h
->flow_lbl
[0] = cm_node
->tos
<< 4;
477 ip6h
->flow_lbl
[1] = 0;
478 ip6h
->flow_lbl
[2] = 0;
479 ip6h
->payload_len
= htons(packetsize
- sizeof(*ip6h
));
481 ip6h
->hop_limit
= 128;
482 i40iw_copy_ip_htonl(ip6h
->saddr
.in6_u
.u6_addr32
,
484 i40iw_copy_ip_htonl(ip6h
->daddr
.in6_u
.u6_addr32
,
488 tcph
->source
= htons(cm_node
->loc_port
);
489 tcph
->dest
= htons(cm_node
->rem_port
);
491 tcph
->seq
= htonl(cm_node
->tcp_cntxt
.loc_seq_num
);
493 if (flags
& SET_ACK
) {
494 cm_node
->tcp_cntxt
.loc_ack_num
= cm_node
->tcp_cntxt
.rcv_nxt
;
495 tcph
->ack_seq
= htonl(cm_node
->tcp_cntxt
.loc_ack_num
);
501 if (flags
& SET_SYN
) {
502 cm_node
->tcp_cntxt
.loc_seq_num
++;
505 cm_node
->tcp_cntxt
.loc_seq_num
+= hdr_len
+ pd_len
;
508 if (flags
& SET_FIN
) {
509 cm_node
->tcp_cntxt
.loc_seq_num
++;
516 tcph
->doff
= (u16
)((sizeof(*tcph
) + opts_len
+ 3) >> 2);
517 sqbuf
->tcphlen
= tcph
->doff
<< 2;
518 tcph
->window
= htons(cm_node
->tcp_cntxt
.rcv_wnd
);
522 memcpy(buf
, options
->addr
, opts_len
);
527 memcpy(buf
, hdr
->addr
, hdr_len
);
531 if (pdata
&& pdata
->addr
)
532 memcpy(buf
, pdata
->addr
, pdata
->size
);
534 atomic_set(&sqbuf
->refcount
, 1);
540 * i40iw_send_reset - Send RST packet
541 * @cm_node: connection's node
543 int i40iw_send_reset(struct i40iw_cm_node
*cm_node
)
545 struct i40iw_puda_buf
*sqbuf
;
546 int flags
= SET_RST
| SET_ACK
;
548 sqbuf
= i40iw_form_cm_frame(cm_node
, NULL
, NULL
, NULL
, flags
);
550 i40iw_pr_err("no sqbuf\n");
554 return i40iw_schedule_cm_timer(cm_node
, sqbuf
, I40IW_TIMER_TYPE_SEND
, 0, 1);
558 * i40iw_active_open_err - send event for active side cm error
559 * @cm_node: connection's node
560 * @reset: Flag to send reset or not
562 static void i40iw_active_open_err(struct i40iw_cm_node
*cm_node
, bool reset
)
564 i40iw_cleanup_retrans_entry(cm_node
);
565 cm_node
->cm_core
->stats_connect_errs
++;
567 i40iw_debug(cm_node
->dev
,
569 "%s cm_node=%p state=%d\n",
573 atomic_inc(&cm_node
->ref_count
);
574 i40iw_send_reset(cm_node
);
577 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
578 i40iw_create_event(cm_node
, I40IW_CM_EVENT_ABORTED
);
582 * i40iw_passive_open_err - handle passive side cm error
583 * @cm_node: connection's node
584 * @reset: send reset or just free cm_node
586 static void i40iw_passive_open_err(struct i40iw_cm_node
*cm_node
, bool reset
)
588 i40iw_cleanup_retrans_entry(cm_node
);
589 cm_node
->cm_core
->stats_passive_errs
++;
590 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
591 i40iw_debug(cm_node
->dev
,
593 "%s cm_node=%p state =%d\n",
598 i40iw_send_reset(cm_node
);
600 i40iw_rem_ref_cm_node(cm_node
);
604 * i40iw_event_connect_error - to create connect error event
605 * @event: cm information for connect event
607 static void i40iw_event_connect_error(struct i40iw_cm_event
*event
)
609 struct i40iw_qp
*iwqp
;
610 struct iw_cm_id
*cm_id
;
612 cm_id
= event
->cm_node
->cm_id
;
616 iwqp
= cm_id
->provider_data
;
618 if (!iwqp
|| !iwqp
->iwdev
)
622 cm_id
->provider_data
= NULL
;
623 i40iw_send_cm_event(event
->cm_node
, cm_id
,
624 IW_CM_EVENT_CONNECT_REPLY
,
626 cm_id
->rem_ref(cm_id
);
627 i40iw_rem_ref_cm_node(event
->cm_node
);
631 * i40iw_process_options
632 * @cm_node: connection's node
633 * @optionsloc: point to start of options
634 * @optionsize: size of all options
635 * @syn_packet: flag if syn packet
637 static int i40iw_process_options(struct i40iw_cm_node
*cm_node
,
644 union all_known_options
*all_options
;
645 char got_mss_option
= 0;
647 while (offset
< optionsize
) {
648 all_options
= (union all_known_options
*)(optionsloc
+ offset
);
649 switch (all_options
->as_base
.optionnum
) {
650 case OPTION_NUMBER_END
:
653 case OPTION_NUMBER_NONE
:
656 case OPTION_NUMBER_MSS
:
657 i40iw_debug(cm_node
->dev
,
659 "%s: MSS Length: %d Offset: %d Size: %d\n",
661 all_options
->as_mss
.length
,
665 if (all_options
->as_mss
.length
!= 4)
667 tmp
= ntohs(all_options
->as_mss
.mss
);
668 if (tmp
> 0 && tmp
< cm_node
->tcp_cntxt
.mss
)
669 cm_node
->tcp_cntxt
.mss
= tmp
;
671 case OPTION_NUMBER_WINDOW_SCALE
:
672 cm_node
->tcp_cntxt
.snd_wscale
=
673 all_options
->as_windowscale
.shiftcount
;
676 i40iw_debug(cm_node
->dev
,
678 "TCP Option not understood: %x\n",
679 all_options
->as_base
.optionnum
);
682 offset
+= all_options
->as_base
.length
;
684 if (!got_mss_option
&& syn_packet
)
685 cm_node
->tcp_cntxt
.mss
= I40IW_CM_DEFAULT_MSS
;
690 * i40iw_handle_tcp_options - process received tcp options and update send window
691 * @cm_node: connection's node
692 * @tcph: pointer tcp header
693 * @optionsize: size of options rcvd
694 * @passive: active or passive flag
696 static int i40iw_handle_tcp_options(struct i40iw_cm_node
*cm_node
,
701 u8
*optionsloc
= (u8
*)&tcph
[1];
704 if (i40iw_process_options(cm_node
,
708 i40iw_debug(cm_node
->dev
,
710 "%s: Node %p, Sending RESET\n",
714 i40iw_passive_open_err(cm_node
, true);
716 i40iw_active_open_err(cm_node
, true);
721 cm_node
->tcp_cntxt
.snd_wnd
= ntohs(tcph
->window
) <<
722 cm_node
->tcp_cntxt
.snd_wscale
;
724 if (cm_node
->tcp_cntxt
.snd_wnd
> cm_node
->tcp_cntxt
.max_snd_wnd
)
725 cm_node
->tcp_cntxt
.max_snd_wnd
= cm_node
->tcp_cntxt
.snd_wnd
;
730 * i40iw_build_mpa_v1 - build a MPA V1 frame
731 * @cm_node: connection's node
732 * @mpa_key: to do read0 or write0
734 static void i40iw_build_mpa_v1(struct i40iw_cm_node
*cm_node
,
738 struct ietf_mpa_v1
*mpa_frame
= (struct ietf_mpa_v1
*)start_addr
;
741 case MPA_KEY_REQUEST
:
742 memcpy(mpa_frame
->key
, IEFT_MPA_KEY_REQ
, IETF_MPA_KEY_SIZE
);
745 memcpy(mpa_frame
->key
, IEFT_MPA_KEY_REP
, IETF_MPA_KEY_SIZE
);
750 mpa_frame
->flags
= IETF_MPA_FLAGS_CRC
;
751 mpa_frame
->rev
= cm_node
->mpa_frame_rev
;
752 mpa_frame
->priv_data_len
= htons(cm_node
->pdata
.size
);
756 * i40iw_build_mpa_v2 - build a MPA V2 frame
757 * @cm_node: connection's node
758 * @start_addr: buffer start address
759 * @mpa_key: to do read0 or write0
761 static void i40iw_build_mpa_v2(struct i40iw_cm_node
*cm_node
,
765 struct ietf_mpa_v2
*mpa_frame
= (struct ietf_mpa_v2
*)start_addr
;
766 struct ietf_rtr_msg
*rtr_msg
= &mpa_frame
->rtr_msg
;
767 u16 ctrl_ird
, ctrl_ord
;
769 /* initialize the upper 5 bytes of the frame */
770 i40iw_build_mpa_v1(cm_node
, start_addr
, mpa_key
);
771 mpa_frame
->flags
|= IETF_MPA_V2_FLAG
;
772 mpa_frame
->priv_data_len
+= htons(IETF_RTR_MSG_SIZE
);
774 /* initialize RTR msg */
775 if (cm_node
->mpav2_ird_ord
== IETF_NO_IRD_ORD
) {
776 ctrl_ird
= IETF_NO_IRD_ORD
;
777 ctrl_ord
= IETF_NO_IRD_ORD
;
779 ctrl_ird
= (cm_node
->ird_size
> IETF_NO_IRD_ORD
) ?
780 IETF_NO_IRD_ORD
: cm_node
->ird_size
;
781 ctrl_ord
= (cm_node
->ord_size
> IETF_NO_IRD_ORD
) ?
782 IETF_NO_IRD_ORD
: cm_node
->ord_size
;
785 ctrl_ird
|= IETF_PEER_TO_PEER
;
788 case MPA_KEY_REQUEST
:
789 ctrl_ord
|= IETF_RDMA0_WRITE
;
790 ctrl_ord
|= IETF_RDMA0_READ
;
793 switch (cm_node
->send_rdma0_op
) {
794 case SEND_RDMA_WRITE_ZERO
:
795 ctrl_ord
|= IETF_RDMA0_WRITE
;
797 case SEND_RDMA_READ_ZERO
:
798 ctrl_ord
|= IETF_RDMA0_READ
;
805 rtr_msg
->ctrl_ird
= htons(ctrl_ird
);
806 rtr_msg
->ctrl_ord
= htons(ctrl_ord
);
810 * i40iw_cm_build_mpa_frame - build mpa frame for mpa version 1 or version 2
811 * @cm_node: connection's node
812 * @mpa: data buffer
813 * @mpa_key: to do read0 or write0
815 static int i40iw_cm_build_mpa_frame(struct i40iw_cm_node
*cm_node
,
816 struct i40iw_kmem_info
*mpa
,
821 switch (cm_node
->mpa_frame_rev
) {
823 hdr_len
= sizeof(struct ietf_mpa_v1
);
824 i40iw_build_mpa_v1(cm_node
, mpa
->addr
, mpa_key
);
827 hdr_len
= sizeof(struct ietf_mpa_v2
);
828 i40iw_build_mpa_v2(cm_node
, mpa
->addr
, mpa_key
);
838 * i40iw_send_mpa_request - active node send mpa request to passive node
839 * @cm_node: connection's node
841 static int i40iw_send_mpa_request(struct i40iw_cm_node
*cm_node
)
843 struct i40iw_puda_buf
*sqbuf
;
846 i40iw_pr_err("cm_node == NULL\n");
850 cm_node
->mpa_hdr
.addr
= &cm_node
->mpa_frame
;
851 cm_node
->mpa_hdr
.size
= i40iw_cm_build_mpa_frame(cm_node
,
854 if (!cm_node
->mpa_hdr
.size
) {
855 i40iw_pr_err("mpa size = %d\n", cm_node
->mpa_hdr
.size
);
859 sqbuf
= i40iw_form_cm_frame(cm_node
,
865 i40iw_pr_err("sq_buf == NULL\n");
868 return i40iw_schedule_cm_timer(cm_node
, sqbuf
, I40IW_TIMER_TYPE_SEND
, 1, 0);
872 * i40iw_send_mpa_reject - send an MPA frame with the reject flag set
873 * @cm_node: connection's node
874 * @pdata: reject data for connection
875 * @plen: length of reject data
877 static int i40iw_send_mpa_reject(struct i40iw_cm_node
*cm_node
,
881 struct i40iw_puda_buf
*sqbuf
;
882 struct i40iw_kmem_info priv_info
;
884 cm_node
->mpa_hdr
.addr
= &cm_node
->mpa_frame
;
885 cm_node
->mpa_hdr
.size
= i40iw_cm_build_mpa_frame(cm_node
,
889 cm_node
->mpa_frame
.flags
|= IETF_MPA_FLAGS_REJECT
;
890 priv_info
.addr
= (void *)pdata
;
891 priv_info
.size
= plen
;
893 sqbuf
= i40iw_form_cm_frame(cm_node
,
899 i40iw_pr_err("no sqbuf\n");
902 cm_node
->state
= I40IW_CM_STATE_FIN_WAIT1
;
903 return i40iw_schedule_cm_timer(cm_node
, sqbuf
, I40IW_TIMER_TYPE_SEND
, 1, 0);
907 * i40iw_parse_mpa - process an IETF MPA frame
908 * @cm_node: connection's node
909 * @buffer: Data pointer
910 * @type: to return accept or reject
911 * @len: Len of mpa buffer
913 static int i40iw_parse_mpa(struct i40iw_cm_node
*cm_node
, u8
*buffer
, u32
*type
, u32 len
)
915 struct ietf_mpa_v1
*mpa_frame
;
916 struct ietf_mpa_v2
*mpa_v2_frame
;
917 struct ietf_rtr_msg
*rtr_msg
;
921 *type
= I40IW_MPA_REQUEST_ACCEPT
;
923 if (len
< sizeof(struct ietf_mpa_v1
)) {
924 i40iw_pr_err("ietf buffer small (%x)\n", len
);
928 mpa_frame
= (struct ietf_mpa_v1
*)buffer
;
929 mpa_hdr_len
= sizeof(struct ietf_mpa_v1
);
930 priv_data_len
= ntohs(mpa_frame
->priv_data_len
);
932 if (priv_data_len
> IETF_MAX_PRIV_DATA_LEN
) {
933 i40iw_pr_err("large pri_data %d\n", priv_data_len
);
936 if (mpa_frame
->rev
!= IETF_MPA_V1
&& mpa_frame
->rev
!= IETF_MPA_V2
) {
937 i40iw_pr_err("unsupported mpa rev = %d\n", mpa_frame
->rev
);
940 if (mpa_frame
->rev
> cm_node
->mpa_frame_rev
) {
941 i40iw_pr_err("rev %d\n", mpa_frame
->rev
);
944 cm_node
->mpa_frame_rev
= mpa_frame
->rev
;
946 if (cm_node
->state
!= I40IW_CM_STATE_MPAREQ_SENT
) {
947 if (memcmp(mpa_frame
->key
, IEFT_MPA_KEY_REQ
, IETF_MPA_KEY_SIZE
)) {
948 i40iw_pr_err("Unexpected MPA Key received\n");
952 if (memcmp(mpa_frame
->key
, IEFT_MPA_KEY_REP
, IETF_MPA_KEY_SIZE
)) {
953 i40iw_pr_err("Unexpected MPA Key received\n");
958 if (priv_data_len
+ mpa_hdr_len
> len
) {
959 i40iw_pr_err("ietf buffer len(%x + %x != %x)\n",
960 priv_data_len
, mpa_hdr_len
, len
);
963 if (len
> MAX_CM_BUFFER
) {
964 i40iw_pr_err("ietf buffer large len = %d\n", len
);
968 switch (mpa_frame
->rev
) {
975 mpa_v2_frame
= (struct ietf_mpa_v2
*)buffer
;
976 mpa_hdr_len
+= IETF_RTR_MSG_SIZE
;
977 rtr_msg
= &mpa_v2_frame
->rtr_msg
;
979 /* parse rtr message */
980 ctrl_ord
= ntohs(rtr_msg
->ctrl_ord
);
981 ctrl_ird
= ntohs(rtr_msg
->ctrl_ird
);
982 ird_size
= ctrl_ird
& IETF_NO_IRD_ORD
;
983 ord_size
= ctrl_ord
& IETF_NO_IRD_ORD
;
985 if (!(ctrl_ird
& IETF_PEER_TO_PEER
))
988 if (ird_size
== IETF_NO_IRD_ORD
|| ord_size
== IETF_NO_IRD_ORD
) {
989 cm_node
->mpav2_ird_ord
= IETF_NO_IRD_ORD
;
993 if (cm_node
->state
!= I40IW_CM_STATE_MPAREQ_SENT
) {
995 if (!ord_size
&& (ctrl_ord
& IETF_RDMA0_READ
))
996 cm_node
->ird_size
= 1;
997 if (cm_node
->ord_size
> ird_size
)
998 cm_node
->ord_size
= ird_size
;
1001 if (!ird_size
&& (ctrl_ord
& IETF_RDMA0_READ
))
1003 if (cm_node
->ord_size
> ird_size
)
1004 cm_node
->ord_size
= ird_size
;
1006 if (cm_node
->ird_size
< ord_size
)
1007 /* no resources available */
1012 if (ctrl_ord
& IETF_RDMA0_READ
)
1013 cm_node
->send_rdma0_op
= SEND_RDMA_READ_ZERO
;
1014 else if (ctrl_ord
& IETF_RDMA0_WRITE
)
1015 cm_node
->send_rdma0_op
= SEND_RDMA_WRITE_ZERO
;
1016 else /* Not supported RDMA0 operation */
1018 i40iw_debug(cm_node
->dev
, I40IW_DEBUG_CM
,
1019 "MPAV2: Negotiated ORD: %d, IRD: %d\n",
1020 cm_node
->ord_size
, cm_node
->ird_size
);
1029 memcpy(cm_node
->pdata_buf
, buffer
+ mpa_hdr_len
, priv_data_len
);
1030 cm_node
->pdata
.size
= priv_data_len
;
1032 if (mpa_frame
->flags
& IETF_MPA_FLAGS_REJECT
)
1033 *type
= I40IW_MPA_REQUEST_REJECT
;
1035 if (mpa_frame
->flags
& IETF_MPA_FLAGS_MARKERS
)
1036 cm_node
->snd_mark_en
= true;
1042 * i40iw_schedule_cm_timer
1043 * @cm_node: connection's node
1044 * @sqbuf: buffer to send
1045 * @type: if it is send or close
1046 * @send_retrans: if rexmits to be done
1047 * @close_when_complete: is cm_node to be removed
1049 * note - cm_node needs to be protected before calling this. Encase in:
1050 * atomic_inc(&cm_node->ref_count);
1051 * i40iw_schedule_cm_timer(...)
1052 * i40iw_rem_ref_cm_node(cm_node);
1054 int i40iw_schedule_cm_timer(struct i40iw_cm_node
*cm_node
,
1055 struct i40iw_puda_buf
*sqbuf
,
1056 enum i40iw_timer_type type
,
1058 int close_when_complete
)
1060 struct i40iw_sc_vsi
*vsi
= &cm_node
->iwdev
->vsi
;
1061 struct i40iw_cm_core
*cm_core
= cm_node
->cm_core
;
1062 struct i40iw_timer_entry
*new_send
;
1065 unsigned long flags
;
1067 new_send
= kzalloc(sizeof(*new_send
), GFP_ATOMIC
);
1069 if (type
!= I40IW_TIMER_TYPE_CLOSE
)
1070 i40iw_free_sqbuf(vsi
, (void *)sqbuf
);
1073 new_send
->retrycount
= I40IW_DEFAULT_RETRYS
;
1074 new_send
->retranscount
= I40IW_DEFAULT_RETRANS
;
1075 new_send
->sqbuf
= sqbuf
;
1076 new_send
->timetosend
= jiffies
;
1077 new_send
->type
= type
;
1078 new_send
->send_retrans
= send_retrans
;
1079 new_send
->close_when_complete
= close_when_complete
;
1081 if (type
== I40IW_TIMER_TYPE_CLOSE
) {
1082 new_send
->timetosend
+= (HZ
/ 10);
1083 if (cm_node
->close_entry
) {
1085 i40iw_pr_err("already close entry\n");
1088 cm_node
->close_entry
= new_send
;
1091 if (type
== I40IW_TIMER_TYPE_SEND
) {
1092 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1093 cm_node
->send_entry
= new_send
;
1094 atomic_inc(&cm_node
->ref_count
);
1095 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
1096 new_send
->timetosend
= jiffies
+ I40IW_RETRY_TIMEOUT
;
1098 atomic_inc(&sqbuf
->refcount
);
1099 i40iw_puda_send_buf(vsi
->ilq
, sqbuf
);
1100 if (!send_retrans
) {
1101 i40iw_cleanup_retrans_entry(cm_node
);
1102 if (close_when_complete
)
1103 i40iw_rem_ref_cm_node(cm_node
);
1108 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1109 was_timer_set
= timer_pending(&cm_core
->tcp_timer
);
1111 if (!was_timer_set
) {
1112 cm_core
->tcp_timer
.expires
= new_send
->timetosend
;
1113 add_timer(&cm_core
->tcp_timer
);
1115 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1121 * i40iw_retrans_expired - Could not rexmit the packet
1122 * @cm_node: connection's node
1124 static void i40iw_retrans_expired(struct i40iw_cm_node
*cm_node
)
1126 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
1127 enum i40iw_cm_node_state state
= cm_node
->state
;
1129 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
1131 case I40IW_CM_STATE_SYN_RCVD
:
1132 case I40IW_CM_STATE_CLOSING
:
1133 i40iw_rem_ref_cm_node(cm_node
);
1135 case I40IW_CM_STATE_FIN_WAIT1
:
1136 case I40IW_CM_STATE_LAST_ACK
:
1138 cm_id
->rem_ref(cm_id
);
1139 i40iw_send_reset(cm_node
);
1142 atomic_inc(&cm_node
->ref_count
);
1143 i40iw_send_reset(cm_node
);
1144 i40iw_create_event(cm_node
, I40IW_CM_EVENT_ABORTED
);
1150 * i40iw_handle_close_entry - for handling retry/timeouts
1151 * @cm_node: connection's node
1152 * @rem_node: flag for remove cm_node
1154 static void i40iw_handle_close_entry(struct i40iw_cm_node
*cm_node
, u32 rem_node
)
1156 struct i40iw_timer_entry
*close_entry
= cm_node
->close_entry
;
1157 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
1158 struct i40iw_qp
*iwqp
;
1159 unsigned long flags
;
1163 iwqp
= (struct i40iw_qp
*)close_entry
->sqbuf
;
1165 spin_lock_irqsave(&iwqp
->lock
, flags
);
1167 iwqp
->hw_tcp_state
= I40IW_TCP_STATE_CLOSED
;
1168 iwqp
->hw_iwarp_state
= I40IW_QP_STATE_ERROR
;
1169 iwqp
->last_aeq
= I40IW_AE_RESET_SENT
;
1170 iwqp
->ibqp_state
= IB_QPS_ERR
;
1171 spin_unlock_irqrestore(&iwqp
->lock
, flags
);
1172 i40iw_cm_disconn(iwqp
);
1174 spin_unlock_irqrestore(&iwqp
->lock
, flags
);
1176 } else if (rem_node
) {
1177 /* TIME_WAIT state */
1178 i40iw_rem_ref_cm_node(cm_node
);
1181 cm_id
->rem_ref(cm_id
);
1183 cm_node
->close_entry
= NULL
;
1187 * i40iw_build_timer_list - Add cm_nodes to timer list
1188 * @timer_list: ptr to timer list
1189 * @hte: ptr to accelerated or non-accelerated list
1191 static void i40iw_build_timer_list(struct list_head
*timer_list
,
1192 struct list_head
*hte
)
1194 struct i40iw_cm_node
*cm_node
;
1195 struct list_head
*list_core_temp
, *list_node
;
1197 list_for_each_safe(list_node
, list_core_temp
, hte
) {
1198 cm_node
= container_of(list_node
, struct i40iw_cm_node
, list
);
1199 if (cm_node
->close_entry
|| cm_node
->send_entry
) {
1200 atomic_inc(&cm_node
->ref_count
);
1201 list_add(&cm_node
->timer_entry
, timer_list
);
1207 * i40iw_cm_timer_tick - system's timer expired callback
1208 * @t: pointer to the tcp_timer timer_list embedded in cm_core
1210 static void i40iw_cm_timer_tick(struct timer_list
*t
)
1212 unsigned long nexttimeout
= jiffies
+ I40IW_LONG_TIME
;
1213 struct i40iw_cm_node
*cm_node
;
1214 struct i40iw_timer_entry
*send_entry
, *close_entry
;
1215 struct list_head
*list_core_temp
;
1216 struct i40iw_sc_vsi
*vsi
;
1217 struct list_head
*list_node
;
1218 struct i40iw_cm_core
*cm_core
= from_timer(cm_core
, t
, tcp_timer
);
1220 unsigned long timetosend
;
1221 unsigned long flags
;
1223 struct list_head timer_list
;
1225 INIT_LIST_HEAD(&timer_list
);
1227 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1228 i40iw_build_timer_list(&timer_list
, &cm_core
->non_accelerated_list
);
1229 i40iw_build_timer_list(&timer_list
, &cm_core
->accelerated_list
);
1230 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1232 list_for_each_safe(list_node
, list_core_temp
, &timer_list
) {
1233 cm_node
= container_of(list_node
,
1234 struct i40iw_cm_node
,
1236 close_entry
= cm_node
->close_entry
;
1239 if (time_after(close_entry
->timetosend
, jiffies
)) {
1240 if (nexttimeout
> close_entry
->timetosend
||
1242 nexttimeout
= close_entry
->timetosend
;
1246 i40iw_handle_close_entry(cm_node
, 1);
1250 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1252 send_entry
= cm_node
->send_entry
;
1255 if (time_after(send_entry
->timetosend
, jiffies
)) {
1256 if (cm_node
->state
!= I40IW_CM_STATE_OFFLOADED
) {
1257 if ((nexttimeout
> send_entry
->timetosend
) ||
1259 nexttimeout
= send_entry
->timetosend
;
1263 i40iw_free_retrans_entry(cm_node
);
1268 if ((cm_node
->state
== I40IW_CM_STATE_OFFLOADED
) ||
1269 (cm_node
->state
== I40IW_CM_STATE_CLOSED
)) {
1270 i40iw_free_retrans_entry(cm_node
);
1274 if (!send_entry
->retranscount
|| !send_entry
->retrycount
) {
1275 i40iw_free_retrans_entry(cm_node
);
1277 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
1278 i40iw_retrans_expired(cm_node
);
1279 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
1280 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1283 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
1285 vsi
= &cm_node
->iwdev
->vsi
;
1287 if (!cm_node
->ack_rcvd
) {
1288 atomic_inc(&send_entry
->sqbuf
->refcount
);
1289 i40iw_puda_send_buf(vsi
->ilq
, send_entry
->sqbuf
);
1290 cm_node
->cm_core
->stats_pkt_retrans
++;
1292 spin_lock_irqsave(&cm_node
->retrans_list_lock
, flags
);
1293 if (send_entry
->send_retrans
) {
1294 send_entry
->retranscount
--;
1295 timetosend
= (I40IW_RETRY_TIMEOUT
<<
1296 (I40IW_DEFAULT_RETRANS
-
1297 send_entry
->retranscount
));
1299 send_entry
->timetosend
= jiffies
+
1300 min(timetosend
, I40IW_MAX_TIMEOUT
);
1301 if (nexttimeout
> send_entry
->timetosend
|| !settimer
) {
1302 nexttimeout
= send_entry
->timetosend
;
1306 int close_when_complete
;
1308 close_when_complete
= send_entry
->close_when_complete
;
1309 i40iw_debug(cm_node
->dev
,
1311 "cm_node=%p state=%d\n",
1314 i40iw_free_retrans_entry(cm_node
);
1315 if (close_when_complete
)
1316 i40iw_rem_ref_cm_node(cm_node
);
1319 spin_unlock_irqrestore(&cm_node
->retrans_list_lock
, flags
);
1320 i40iw_rem_ref_cm_node(cm_node
);
1324 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1325 if (!timer_pending(&cm_core
->tcp_timer
)) {
1326 cm_core
->tcp_timer
.expires
= nexttimeout
;
1327 add_timer(&cm_core
->tcp_timer
);
1329 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1334 * i40iw_send_syn - send SYN packet
1335 * @cm_node: connection's node
1336 * @sendack: flag to set ACK bit or not
1338 int i40iw_send_syn(struct i40iw_cm_node
*cm_node
, u32 sendack
)
1340 struct i40iw_puda_buf
*sqbuf
;
1341 int flags
= SET_SYN
;
1342 char optionsbuffer
[sizeof(struct option_mss
) +
1343 sizeof(struct option_windowscale
) +
1344 sizeof(struct option_base
) + TCP_OPTIONS_PADDING
];
1345 struct i40iw_kmem_info opts
;
1347 int optionssize
= 0;
1348 /* Sending MSS option */
1349 union all_known_options
*options
;
1351 opts
.addr
= optionsbuffer
;
1353 i40iw_pr_err("no cm_node\n");
1357 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1358 options
->as_mss
.optionnum
= OPTION_NUMBER_MSS
;
1359 options
->as_mss
.length
= sizeof(struct option_mss
);
1360 options
->as_mss
.mss
= htons(cm_node
->tcp_cntxt
.mss
);
1361 optionssize
+= sizeof(struct option_mss
);
1363 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1364 options
->as_windowscale
.optionnum
= OPTION_NUMBER_WINDOW_SCALE
;
1365 options
->as_windowscale
.length
= sizeof(struct option_windowscale
);
1366 options
->as_windowscale
.shiftcount
= cm_node
->tcp_cntxt
.rcv_wscale
;
1367 optionssize
+= sizeof(struct option_windowscale
);
1368 options
= (union all_known_options
*)&optionsbuffer
[optionssize
];
1369 options
->as_end
= OPTION_NUMBER_END
;
1375 opts
.size
= optionssize
;
1377 sqbuf
= i40iw_form_cm_frame(cm_node
, &opts
, NULL
, NULL
, flags
);
1379 i40iw_pr_err("no sqbuf\n");
1382 return i40iw_schedule_cm_timer(cm_node
, sqbuf
, I40IW_TIMER_TYPE_SEND
, 1, 0);
1386 * i40iw_send_ack - Send ACK packet
1387 * @cm_node: connection's node
1389 static void i40iw_send_ack(struct i40iw_cm_node
*cm_node
)
1391 struct i40iw_puda_buf
*sqbuf
;
1392 struct i40iw_sc_vsi
*vsi
= &cm_node
->iwdev
->vsi
;
1394 sqbuf
= i40iw_form_cm_frame(cm_node
, NULL
, NULL
, NULL
, SET_ACK
);
1396 i40iw_puda_send_buf(vsi
->ilq
, sqbuf
);
1398 i40iw_pr_err("no sqbuf\n");
1402 * i40iw_send_fin - Send FIN pkt
1403 * @cm_node: connection's node
1405 static int i40iw_send_fin(struct i40iw_cm_node
*cm_node
)
1407 struct i40iw_puda_buf
*sqbuf
;
1409 sqbuf
= i40iw_form_cm_frame(cm_node
, NULL
, NULL
, NULL
, SET_ACK
| SET_FIN
);
1411 i40iw_pr_err("no sqbuf\n");
1414 return i40iw_schedule_cm_timer(cm_node
, sqbuf
, I40IW_TIMER_TYPE_SEND
, 1, 0);
1418 * i40iw_find_node - find a cm node that matches the reference cm node
1419 * @cm_core: cm's core
1420 * @rem_port: remote tcp port num
1421 * @rem_addr: remote ip addr
1422 * @loc_port: local tcp port num
1423 * @loc_addr: loc ip addr
1424 * @add_refcnt: flag to increment refcount of cm_node
1425 * @accelerated_list: flag for accelerated vs non-accelerated list to search
1427 struct i40iw_cm_node
*i40iw_find_node(struct i40iw_cm_core
*cm_core
,
1433 bool accelerated_list
)
1435 struct list_head
*hte
;
1436 struct i40iw_cm_node
*cm_node
;
1437 unsigned long flags
;
1439 hte
= accelerated_list
?
1440 &cm_core
->accelerated_list
: &cm_core
->non_accelerated_list
;
1442 /* walk list and find cm_node associated with this session ID */
1443 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1444 list_for_each_entry(cm_node
, hte
, list
) {
1445 if (!memcmp(cm_node
->loc_addr
, loc_addr
, sizeof(cm_node
->loc_addr
)) &&
1446 (cm_node
->loc_port
== loc_port
) &&
1447 !memcmp(cm_node
->rem_addr
, rem_addr
, sizeof(cm_node
->rem_addr
)) &&
1448 (cm_node
->rem_port
== rem_port
)) {
1450 atomic_inc(&cm_node
->ref_count
);
1451 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1455 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1462 * i40iw_find_listener - find a cm node listening on this addr-port pair
1463 * @cm_core: cm's core
1464 * @dst_port: listener tcp port num
1465 * @dst_addr: listener ip addr
1466 * @listener_state: state to match with listen node's
1468 static struct i40iw_cm_listener
*i40iw_find_listener(
1469 struct i40iw_cm_core
*cm_core
,
1473 enum i40iw_cm_listener_state
1476 struct i40iw_cm_listener
*listen_node
;
1477 static const u32 ip_zero
[4] = { 0, 0, 0, 0 };
1480 unsigned long flags
;
1482 /* walk list and find cm_node associated with this session ID */
1483 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
1484 list_for_each_entry(listen_node
, &cm_core
->listen_nodes
, list
) {
1485 memcpy(listen_addr
, listen_node
->loc_addr
, sizeof(listen_addr
));
1486 listen_port
= listen_node
->loc_port
;
1487 /* compare node pair, return node handle if a match */
1488 if ((!memcmp(listen_addr
, dst_addr
, sizeof(listen_addr
)) ||
1489 !memcmp(listen_addr
, ip_zero
, sizeof(listen_addr
))) &&
1490 (listen_port
== dst_port
) &&
1491 (listener_state
& listen_node
->listener_state
)) {
1492 atomic_inc(&listen_node
->ref_count
);
1493 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1497 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1502 * i40iw_add_hte_node - add a cm node to the hash table
1503 * @cm_core: cm's core
1504 * @cm_node: connection's node
1506 static void i40iw_add_hte_node(struct i40iw_cm_core
*cm_core
,
1507 struct i40iw_cm_node
*cm_node
)
1509 unsigned long flags
;
1511 if (!cm_node
|| !cm_core
) {
1512 i40iw_pr_err("cm_node or cm_core == NULL\n");
1516 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1517 list_add_tail(&cm_node
->list
, &cm_core
->non_accelerated_list
);
1518 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1522 * i40iw_find_port - find port that matches reference port
1523 * @hte: ptr to accelerated or non-accelerated list
1524 * @accelerated_list: flag for accelerated vs non-accelerated list
1526 static bool i40iw_find_port(struct list_head
*hte
, u16 port
)
1528 struct i40iw_cm_node
*cm_node
;
1530 list_for_each_entry(cm_node
, hte
, list
) {
1531 if (cm_node
->loc_port
== port
)
1538 * i40iw_port_in_use - determine if port is in use
1539 * @cm_core: cm's core
1540 * @port: port number
1542 bool i40iw_port_in_use(struct i40iw_cm_core
*cm_core
, u16 port
)
1544 struct i40iw_cm_listener
*listen_node
;
1545 unsigned long flags
;
1547 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1548 if (i40iw_find_port(&cm_core
->accelerated_list
, port
) ||
1549 i40iw_find_port(&cm_core
->non_accelerated_list
, port
)) {
1550 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1553 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1555 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
1556 list_for_each_entry(listen_node
, &cm_core
->listen_nodes
, list
) {
1557 if (listen_node
->loc_port
== port
) {
1558 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1562 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1568 * i40iw_del_multiple_qhash - Remove qhash and child listens
1569 * @iwdev: iWarp device
1570 * @cm_info: CM info for parent listen node
1571 * @cm_parent_listen_node: The parent listen node
1573 static enum i40iw_status_code
i40iw_del_multiple_qhash(
1574 struct i40iw_device
*iwdev
,
1575 struct i40iw_cm_info
*cm_info
,
1576 struct i40iw_cm_listener
*cm_parent_listen_node
)
1578 struct i40iw_cm_listener
*child_listen_node
;
1579 enum i40iw_status_code ret
= I40IW_ERR_CONFIG
;
1580 struct list_head
*pos
, *tpos
;
1581 unsigned long flags
;
1583 spin_lock_irqsave(&iwdev
->cm_core
.listen_list_lock
, flags
);
1584 list_for_each_safe(pos
, tpos
, &cm_parent_listen_node
->child_listen_list
) {
1585 child_listen_node
= list_entry(pos
, struct i40iw_cm_listener
, child_listen_list
);
1586 if (child_listen_node
->ipv4
)
1587 i40iw_debug(&iwdev
->sc_dev
,
1589 "removing child listen for IP=%pI4, port=%d, vlan=%d\n",
1590 child_listen_node
->loc_addr
,
1591 child_listen_node
->loc_port
,
1592 child_listen_node
->vlan_id
);
1594 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_CM
,
1595 "removing child listen for IP=%pI6, port=%d, vlan=%d\n",
1596 child_listen_node
->loc_addr
,
1597 child_listen_node
->loc_port
,
1598 child_listen_node
->vlan_id
);
1600 memcpy(cm_info
->loc_addr
, child_listen_node
->loc_addr
,
1601 sizeof(cm_info
->loc_addr
));
1602 cm_info
->vlan_id
= child_listen_node
->vlan_id
;
1603 if (child_listen_node
->qhash_set
) {
1604 ret
= i40iw_manage_qhash(iwdev
, cm_info
,
1605 I40IW_QHASH_TYPE_TCP_SYN
,
1606 I40IW_QHASH_MANAGE_TYPE_DELETE
,
1608 child_listen_node
->qhash_set
= false;
1610 ret
= I40IW_SUCCESS
;
1612 i40iw_debug(&iwdev
->sc_dev
,
1614 "freed pointer = %p\n",
1616 kfree(child_listen_node
);
1617 cm_parent_listen_node
->cm_core
->stats_listen_nodes_destroyed
++;
1619 spin_unlock_irqrestore(&iwdev
->cm_core
.listen_list_lock
, flags
);
1625 * i40iw_netdev_vlan_ipv6 - Gets the netdev and vlan
1626 * @addr: local IPv6 address
1627 * @vlan_id: vlan id for the given IPv6 address
1629 * Returns the net_device of the IPv6 address and also sets the
1630 * vlan id for that address.
1632 static struct net_device
*i40iw_netdev_vlan_ipv6(u32
*addr
, u16
*vlan_id
)
1634 struct net_device
*ip_dev
= NULL
;
1635 struct in6_addr laddr6
;
1637 if (!IS_ENABLED(CONFIG_IPV6
))
1639 i40iw_copy_ip_htonl(laddr6
.in6_u
.u6_addr32
, addr
);
1641 *vlan_id
= I40IW_NO_VLAN
;
1643 for_each_netdev_rcu(&init_net
, ip_dev
) {
1644 if (ipv6_chk_addr(&init_net
, &laddr6
, ip_dev
, 1)) {
1646 *vlan_id
= rdma_vlan_dev_vlan_id(ip_dev
);
1655 * i40iw_get_vlan_ipv4 - Returns the vlan_id for IPv4 address
1656 * @addr: local IPv4 address
1658 static u16
i40iw_get_vlan_ipv4(u32
*addr
)
1660 struct net_device
*netdev
;
1661 u16 vlan_id
= I40IW_NO_VLAN
;
1663 netdev
= ip_dev_find(&init_net
, htonl(addr
[0]));
1665 vlan_id
= rdma_vlan_dev_vlan_id(netdev
);
1672 * i40iw_add_mqh_6 - Adds multiple qhashes for IPv6
1673 * @iwdev: iWarp device
1674 * @cm_info: CM info for parent listen node
1675 * @cm_parent_listen_node: The parent listen node
1677 * Adds a qhash and a child listen node for every IPv6 address
1678 * on the adapter and adds the associated qhash filter
1680 static enum i40iw_status_code
i40iw_add_mqh_6(struct i40iw_device
*iwdev
,
1681 struct i40iw_cm_info
*cm_info
,
1682 struct i40iw_cm_listener
*cm_parent_listen_node
)
1684 struct net_device
*ip_dev
;
1685 struct inet6_dev
*idev
;
1686 struct inet6_ifaddr
*ifp
, *tmp
;
1687 enum i40iw_status_code ret
= 0;
1688 struct i40iw_cm_listener
*child_listen_node
;
1689 unsigned long flags
;
1692 for_each_netdev(&init_net
, ip_dev
) {
1693 if ((((rdma_vlan_dev_vlan_id(ip_dev
) < I40IW_NO_VLAN
) &&
1694 (rdma_vlan_dev_real_dev(ip_dev
) == iwdev
->netdev
)) ||
1695 (ip_dev
== iwdev
->netdev
)) && (ip_dev
->flags
& IFF_UP
)) {
1696 idev
= __in6_dev_get(ip_dev
);
1698 i40iw_pr_err("idev == NULL\n");
1701 list_for_each_entry_safe(ifp
, tmp
, &idev
->addr_list
, if_list
) {
1702 i40iw_debug(&iwdev
->sc_dev
,
1704 "IP=%pI6, vlan_id=%d, MAC=%pM\n",
1706 rdma_vlan_dev_vlan_id(ip_dev
),
1709 kzalloc(sizeof(*child_listen_node
), GFP_ATOMIC
);
1710 i40iw_debug(&iwdev
->sc_dev
,
1712 "Allocating child listener %p\n",
1714 if (!child_listen_node
) {
1715 ret
= I40IW_ERR_NO_MEMORY
;
1718 cm_info
->vlan_id
= rdma_vlan_dev_vlan_id(ip_dev
);
1719 cm_parent_listen_node
->vlan_id
= cm_info
->vlan_id
;
1721 memcpy(child_listen_node
, cm_parent_listen_node
,
1722 sizeof(*child_listen_node
));
1724 i40iw_copy_ip_ntohl(child_listen_node
->loc_addr
,
1725 ifp
->addr
.in6_u
.u6_addr32
);
1726 memcpy(cm_info
->loc_addr
, child_listen_node
->loc_addr
,
1727 sizeof(cm_info
->loc_addr
));
1729 ret
= i40iw_manage_qhash(iwdev
, cm_info
,
1730 I40IW_QHASH_TYPE_TCP_SYN
,
1731 I40IW_QHASH_MANAGE_TYPE_ADD
,
1734 child_listen_node
->qhash_set
= true;
1735 spin_lock_irqsave(&iwdev
->cm_core
.listen_list_lock
, flags
);
1736 list_add(&child_listen_node
->child_listen_list
,
1737 &cm_parent_listen_node
->child_listen_list
);
1738 spin_unlock_irqrestore(&iwdev
->cm_core
.listen_list_lock
, flags
);
1739 cm_parent_listen_node
->cm_core
->stats_listen_nodes_created
++;
1741 kfree(child_listen_node
);
1752 * i40iw_add_mqh_4 - Adds multiple qhashes for IPv4
1753 * @iwdev: iWarp device
1754 * @cm_info: CM info for parent listen node
1755 * @cm_parent_listen_node: The parent listen node
1757 * Adds a qhash and a child listen node for every IPv4 address
1758 * on the adapter and adds the associated qhash filter
1760 static enum i40iw_status_code
i40iw_add_mqh_4(
1761 struct i40iw_device
*iwdev
,
1762 struct i40iw_cm_info
*cm_info
,
1763 struct i40iw_cm_listener
*cm_parent_listen_node
)
1765 struct net_device
*dev
;
1766 struct in_device
*idev
;
1767 struct i40iw_cm_listener
*child_listen_node
;
1768 enum i40iw_status_code ret
= 0;
1769 unsigned long flags
;
1772 for_each_netdev(&init_net
, dev
) {
1773 if ((((rdma_vlan_dev_vlan_id(dev
) < I40IW_NO_VLAN
) &&
1774 (rdma_vlan_dev_real_dev(dev
) == iwdev
->netdev
)) ||
1775 (dev
== iwdev
->netdev
)) && (dev
->flags
& IFF_UP
)) {
1776 const struct in_ifaddr
*ifa
;
1778 idev
= in_dev_get(dev
);
1780 in_dev_for_each_ifa_rtnl(ifa
, idev
) {
1781 i40iw_debug(&iwdev
->sc_dev
,
1783 "Allocating child CM Listener forIP=%pI4, vlan_id=%d, MAC=%pM\n",
1785 rdma_vlan_dev_vlan_id(dev
),
1787 child_listen_node
= kzalloc(sizeof(*child_listen_node
), GFP_KERNEL
);
1788 cm_parent_listen_node
->cm_core
->stats_listen_nodes_created
++;
1789 i40iw_debug(&iwdev
->sc_dev
,
1791 "Allocating child listener %p\n",
1793 if (!child_listen_node
) {
1795 ret
= I40IW_ERR_NO_MEMORY
;
1798 cm_info
->vlan_id
= rdma_vlan_dev_vlan_id(dev
);
1799 cm_parent_listen_node
->vlan_id
= cm_info
->vlan_id
;
1800 memcpy(child_listen_node
,
1801 cm_parent_listen_node
,
1802 sizeof(*child_listen_node
));
1804 child_listen_node
->loc_addr
[0] = ntohl(ifa
->ifa_address
);
1805 memcpy(cm_info
->loc_addr
, child_listen_node
->loc_addr
,
1806 sizeof(cm_info
->loc_addr
));
1808 ret
= i40iw_manage_qhash(iwdev
,
1810 I40IW_QHASH_TYPE_TCP_SYN
,
1811 I40IW_QHASH_MANAGE_TYPE_ADD
,
1815 child_listen_node
->qhash_set
= true;
1816 spin_lock_irqsave(&iwdev
->cm_core
.listen_list_lock
, flags
);
1817 list_add(&child_listen_node
->child_listen_list
,
1818 &cm_parent_listen_node
->child_listen_list
);
1819 spin_unlock_irqrestore(&iwdev
->cm_core
.listen_list_lock
, flags
);
1821 kfree(child_listen_node
);
1822 cm_parent_listen_node
->cm_core
->stats_listen_nodes_created
--;
1835 * i40iw_dec_refcnt_listen - delete listener and associated cm nodes
1836 * @cm_core: cm's core
1837 * @free_hanging_nodes: to free associated cm_nodes
1838 * @apbvt_del: flag to delete the apbvt
1840 static int i40iw_dec_refcnt_listen(struct i40iw_cm_core
*cm_core
,
1841 struct i40iw_cm_listener
*listener
,
1842 int free_hanging_nodes
, bool apbvt_del
)
1846 struct list_head
*list_pos
;
1847 struct list_head
*list_temp
;
1848 struct i40iw_cm_node
*cm_node
;
1849 struct list_head reset_list
;
1850 struct i40iw_cm_info nfo
;
1851 struct i40iw_cm_node
*loopback
;
1852 enum i40iw_cm_node_state old_state
;
1853 unsigned long flags
;
1855 /* free non-accelerated child nodes for this listener */
1856 INIT_LIST_HEAD(&reset_list
);
1857 if (free_hanging_nodes
) {
1858 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
1859 list_for_each_safe(list_pos
,
1860 list_temp
, &cm_core
->non_accelerated_list
) {
1861 cm_node
= container_of(list_pos
, struct i40iw_cm_node
, list
);
1862 if ((cm_node
->listener
== listener
) &&
1863 !cm_node
->accelerated
) {
1864 atomic_inc(&cm_node
->ref_count
);
1865 list_add(&cm_node
->reset_entry
, &reset_list
);
1868 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
1871 list_for_each_safe(list_pos
, list_temp
, &reset_list
) {
1872 cm_node
= container_of(list_pos
, struct i40iw_cm_node
, reset_entry
);
1873 loopback
= cm_node
->loopbackpartner
;
1874 if (cm_node
->state
>= I40IW_CM_STATE_FIN_WAIT1
) {
1875 i40iw_rem_ref_cm_node(cm_node
);
1878 i40iw_cleanup_retrans_entry(cm_node
);
1879 err
= i40iw_send_reset(cm_node
);
1881 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
1882 i40iw_pr_err("send reset\n");
1884 old_state
= cm_node
->state
;
1885 cm_node
->state
= I40IW_CM_STATE_LISTENER_DESTROYED
;
1886 if (old_state
!= I40IW_CM_STATE_MPAREQ_RCVD
)
1887 i40iw_rem_ref_cm_node(cm_node
);
1890 struct i40iw_cm_event event
;
1892 event
.cm_node
= loopback
;
1893 memcpy(event
.cm_info
.rem_addr
,
1894 loopback
->rem_addr
, sizeof(event
.cm_info
.rem_addr
));
1895 memcpy(event
.cm_info
.loc_addr
,
1896 loopback
->loc_addr
, sizeof(event
.cm_info
.loc_addr
));
1897 event
.cm_info
.rem_port
= loopback
->rem_port
;
1898 event
.cm_info
.loc_port
= loopback
->loc_port
;
1899 event
.cm_info
.cm_id
= loopback
->cm_id
;
1900 event
.cm_info
.ipv4
= loopback
->ipv4
;
1901 atomic_inc(&loopback
->ref_count
);
1902 loopback
->state
= I40IW_CM_STATE_CLOSED
;
1903 i40iw_event_connect_error(&event
);
1904 cm_node
->state
= I40IW_CM_STATE_LISTENER_DESTROYED
;
1905 i40iw_rem_ref_cm_node(cm_node
);
1910 if (!atomic_dec_return(&listener
->ref_count
)) {
1911 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
1912 list_del(&listener
->list
);
1913 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
1915 if (listener
->iwdev
) {
1917 i40iw_manage_apbvt(listener
->iwdev
,
1919 I40IW_MANAGE_APBVT_DEL
);
1921 memcpy(nfo
.loc_addr
, listener
->loc_addr
, sizeof(nfo
.loc_addr
));
1922 nfo
.loc_port
= listener
->loc_port
;
1923 nfo
.ipv4
= listener
->ipv4
;
1924 nfo
.vlan_id
= listener
->vlan_id
;
1925 nfo
.user_pri
= listener
->user_pri
;
1927 if (!list_empty(&listener
->child_listen_list
)) {
1928 i40iw_del_multiple_qhash(listener
->iwdev
, &nfo
, listener
);
1930 if (listener
->qhash_set
)
1931 i40iw_manage_qhash(listener
->iwdev
,
1933 I40IW_QHASH_TYPE_TCP_SYN
,
1934 I40IW_QHASH_MANAGE_TYPE_DELETE
,
1940 cm_core
->stats_listen_destroyed
++;
1942 cm_core
->stats_listen_nodes_destroyed
++;
1948 if (atomic_read(&listener
->pend_accepts_cnt
) > 0)
1949 i40iw_debug(cm_core
->dev
,
1951 "%s: listener (%p) pending accepts=%u\n",
1954 atomic_read(&listener
->pend_accepts_cnt
));
1961 * i40iw_cm_del_listen - delete a linstener
1962 * @cm_core: cm's core
1963 * @listener: passive connection's listener
1964 * @apbvt_del: flag to delete apbvt
1966 static int i40iw_cm_del_listen(struct i40iw_cm_core
*cm_core
,
1967 struct i40iw_cm_listener
*listener
,
1970 listener
->listener_state
= I40IW_CM_LISTENER_PASSIVE_STATE
;
1971 listener
->cm_id
= NULL
; /* going to be destroyed pretty soon */
1972 return i40iw_dec_refcnt_listen(cm_core
, listener
, 1, apbvt_del
);
1976 * i40iw_addr_resolve_neigh - resolve neighbor address
1977 * @iwdev: iwarp device structure
1978 * @src_ip: local ip address
1979 * @dst_ip: remote ip address
1980 * @arpindex: if there is an arp entry
1982 static int i40iw_addr_resolve_neigh(struct i40iw_device
*iwdev
,
1988 struct neighbour
*neigh
;
1990 struct net_device
*netdev
= iwdev
->netdev
;
1991 __be32 dst_ipaddr
= htonl(dst_ip
);
1992 __be32 src_ipaddr
= htonl(src_ip
);
1994 rt
= ip_route_output(&init_net
, dst_ipaddr
, src_ipaddr
, 0, 0);
1996 i40iw_pr_err("ip_route_output\n");
2000 if (netif_is_bond_slave(netdev
))
2001 netdev
= netdev_master_upper_dev_get(netdev
);
2003 neigh
= dst_neigh_lookup(&rt
->dst
, &dst_ipaddr
);
2007 if (neigh
->nud_state
& NUD_VALID
) {
2008 if (arpindex
>= 0) {
2009 if (ether_addr_equal(iwdev
->arp_table
[arpindex
].mac_addr
,
2011 /* Mac address same as arp table */
2012 goto resolve_neigh_exit
;
2013 i40iw_manage_arp_cache(iwdev
,
2014 iwdev
->arp_table
[arpindex
].mac_addr
,
2020 i40iw_manage_arp_cache(iwdev
, neigh
->ha
, &dst_ip
, true, I40IW_ARP_ADD
);
2021 rc
= i40iw_arp_table(iwdev
, &dst_ip
, true, NULL
, I40IW_ARP_RESOLVE
);
2023 neigh_event_send(neigh
, NULL
);
2030 neigh_release(neigh
);
2037 * i40iw_get_dst_ipv6
2039 static struct dst_entry
*i40iw_get_dst_ipv6(struct sockaddr_in6
*src_addr
,
2040 struct sockaddr_in6
*dst_addr
)
2042 struct dst_entry
*dst
;
2045 memset(&fl6
, 0, sizeof(fl6
));
2046 fl6
.daddr
= dst_addr
->sin6_addr
;
2047 fl6
.saddr
= src_addr
->sin6_addr
;
2048 if (ipv6_addr_type(&fl6
.daddr
) & IPV6_ADDR_LINKLOCAL
)
2049 fl6
.flowi6_oif
= dst_addr
->sin6_scope_id
;
2051 dst
= ip6_route_output(&init_net
, NULL
, &fl6
);
2056 * i40iw_addr_resolve_neigh_ipv6 - resolve neighbor ipv6 address
2057 * @iwdev: iwarp device structure
2058 * @dst_ip: remote ip address
2059 * @arpindex: if there is an arp entry
2061 static int i40iw_addr_resolve_neigh_ipv6(struct i40iw_device
*iwdev
,
2066 struct neighbour
*neigh
;
2068 struct net_device
*netdev
= iwdev
->netdev
;
2069 struct dst_entry
*dst
;
2070 struct sockaddr_in6 dst_addr
;
2071 struct sockaddr_in6 src_addr
;
2073 memset(&dst_addr
, 0, sizeof(dst_addr
));
2074 dst_addr
.sin6_family
= AF_INET6
;
2075 i40iw_copy_ip_htonl(dst_addr
.sin6_addr
.in6_u
.u6_addr32
, dest
);
2076 memset(&src_addr
, 0, sizeof(src_addr
));
2077 src_addr
.sin6_family
= AF_INET6
;
2078 i40iw_copy_ip_htonl(src_addr
.sin6_addr
.in6_u
.u6_addr32
, src
);
2079 dst
= i40iw_get_dst_ipv6(&src_addr
, &dst_addr
);
2080 if (!dst
|| dst
->error
) {
2082 i40iw_pr_err("ip6_route_output returned dst->error = %d\n",
2089 if (netif_is_bond_slave(netdev
))
2090 netdev
= netdev_master_upper_dev_get(netdev
);
2092 neigh
= dst_neigh_lookup(dst
, dst_addr
.sin6_addr
.in6_u
.u6_addr32
);
2096 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_CM
, "dst_neigh_lookup MAC=%pM\n", neigh
->ha
);
2097 if (neigh
->nud_state
& NUD_VALID
) {
2098 if (arpindex
>= 0) {
2099 if (ether_addr_equal
2100 (iwdev
->arp_table
[arpindex
].mac_addr
,
2102 /* Mac address same as in arp table */
2103 goto resolve_neigh_exit6
;
2105 i40iw_manage_arp_cache(iwdev
,
2106 iwdev
->arp_table
[arpindex
].mac_addr
,
2111 i40iw_manage_arp_cache(iwdev
,
2116 rc
= i40iw_arp_table(iwdev
,
2122 neigh_event_send(neigh
, NULL
);
2126 resolve_neigh_exit6
:
2129 neigh_release(neigh
);
2135 * i40iw_ipv4_is_loopback - check if loopback
2136 * @loc_addr: local addr to compare
2137 * @rem_addr: remote address
2139 static bool i40iw_ipv4_is_loopback(u32 loc_addr
, u32 rem_addr
)
2141 return ipv4_is_loopback(htonl(rem_addr
)) || (loc_addr
== rem_addr
);
2145 * i40iw_ipv6_is_loopback - check if loopback
2146 * @loc_addr: local addr to compare
2147 * @rem_addr: remote address
2149 static bool i40iw_ipv6_is_loopback(u32
*loc_addr
, u32
*rem_addr
)
2151 struct in6_addr raddr6
;
2153 i40iw_copy_ip_htonl(raddr6
.in6_u
.u6_addr32
, rem_addr
);
2154 return !memcmp(loc_addr
, rem_addr
, 16) || ipv6_addr_loopback(&raddr6
);
2158 * i40iw_make_cm_node - create a new instance of a cm node
2159 * @cm_core: cm's core
2160 * @iwdev: iwarp device structure
2161 * @cm_info: quad info for connection
2162 * @listener: passive connection's listener
2164 static struct i40iw_cm_node
*i40iw_make_cm_node(
2165 struct i40iw_cm_core
*cm_core
,
2166 struct i40iw_device
*iwdev
,
2167 struct i40iw_cm_info
*cm_info
,
2168 struct i40iw_cm_listener
*listener
)
2170 struct i40iw_cm_node
*cm_node
;
2173 struct net_device
*netdev
= iwdev
->netdev
;
2175 /* create an hte and cm_node for this instance */
2176 cm_node
= kzalloc(sizeof(*cm_node
), GFP_ATOMIC
);
2180 /* set our node specific transport info */
2181 cm_node
->ipv4
= cm_info
->ipv4
;
2182 cm_node
->vlan_id
= cm_info
->vlan_id
;
2183 if ((cm_node
->vlan_id
== I40IW_NO_VLAN
) && iwdev
->dcb
)
2184 cm_node
->vlan_id
= 0;
2185 cm_node
->tos
= cm_info
->tos
;
2186 cm_node
->user_pri
= cm_info
->user_pri
;
2188 if (listener
->tos
!= cm_info
->tos
)
2189 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_DCB
,
2190 "application TOS[%d] and remote client TOS[%d] mismatch\n",
2191 listener
->tos
, cm_info
->tos
);
2192 cm_node
->tos
= max(listener
->tos
, cm_info
->tos
);
2193 cm_node
->user_pri
= rt_tos2priority(cm_node
->tos
);
2194 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_DCB
, "listener: TOS:[%d] UP:[%d]\n",
2195 cm_node
->tos
, cm_node
->user_pri
);
2197 memcpy(cm_node
->loc_addr
, cm_info
->loc_addr
, sizeof(cm_node
->loc_addr
));
2198 memcpy(cm_node
->rem_addr
, cm_info
->rem_addr
, sizeof(cm_node
->rem_addr
));
2199 cm_node
->loc_port
= cm_info
->loc_port
;
2200 cm_node
->rem_port
= cm_info
->rem_port
;
2202 cm_node
->mpa_frame_rev
= iwdev
->mpa_version
;
2203 cm_node
->send_rdma0_op
= SEND_RDMA_READ_ZERO
;
2204 cm_node
->ird_size
= I40IW_MAX_IRD_SIZE
;
2205 cm_node
->ord_size
= I40IW_MAX_ORD_SIZE
;
2207 cm_node
->listener
= listener
;
2208 cm_node
->cm_id
= cm_info
->cm_id
;
2209 ether_addr_copy(cm_node
->loc_mac
, netdev
->dev_addr
);
2210 spin_lock_init(&cm_node
->retrans_list_lock
);
2211 cm_node
->ack_rcvd
= false;
2213 atomic_set(&cm_node
->ref_count
, 1);
2214 /* associate our parent CM core */
2215 cm_node
->cm_core
= cm_core
;
2216 cm_node
->tcp_cntxt
.loc_id
= I40IW_CM_DEF_LOCAL_ID
;
2217 cm_node
->tcp_cntxt
.rcv_wscale
= I40IW_CM_DEFAULT_RCV_WND_SCALE
;
2218 cm_node
->tcp_cntxt
.rcv_wnd
=
2219 I40IW_CM_DEFAULT_RCV_WND_SCALED
>> I40IW_CM_DEFAULT_RCV_WND_SCALE
;
2220 if (cm_node
->ipv4
) {
2221 cm_node
->tcp_cntxt
.loc_seq_num
= secure_tcp_seq(htonl(cm_node
->loc_addr
[0]),
2222 htonl(cm_node
->rem_addr
[0]),
2223 htons(cm_node
->loc_port
),
2224 htons(cm_node
->rem_port
));
2225 cm_node
->tcp_cntxt
.mss
= iwdev
->vsi
.mtu
- I40IW_MTU_TO_MSS_IPV4
;
2226 } else if (IS_ENABLED(CONFIG_IPV6
)) {
2228 htonl(cm_node
->loc_addr
[0]), htonl(cm_node
->loc_addr
[1]),
2229 htonl(cm_node
->loc_addr
[2]), htonl(cm_node
->loc_addr
[3])
2232 htonl(cm_node
->rem_addr
[0]), htonl(cm_node
->rem_addr
[1]),
2233 htonl(cm_node
->rem_addr
[2]), htonl(cm_node
->rem_addr
[3])
2235 cm_node
->tcp_cntxt
.loc_seq_num
= secure_tcpv6_seq(loc
, rem
,
2236 htons(cm_node
->loc_port
),
2237 htons(cm_node
->rem_port
));
2238 cm_node
->tcp_cntxt
.mss
= iwdev
->vsi
.mtu
- I40IW_MTU_TO_MSS_IPV6
;
2241 cm_node
->iwdev
= iwdev
;
2242 cm_node
->dev
= &iwdev
->sc_dev
;
2244 if ((cm_node
->ipv4
&&
2245 i40iw_ipv4_is_loopback(cm_node
->loc_addr
[0], cm_node
->rem_addr
[0])) ||
2246 (!cm_node
->ipv4
&& i40iw_ipv6_is_loopback(cm_node
->loc_addr
,
2247 cm_node
->rem_addr
))) {
2248 arpindex
= i40iw_arp_table(iwdev
,
2254 oldarpindex
= i40iw_arp_table(iwdev
,
2260 arpindex
= i40iw_addr_resolve_neigh(iwdev
,
2261 cm_info
->loc_addr
[0],
2262 cm_info
->rem_addr
[0],
2264 else if (IS_ENABLED(CONFIG_IPV6
))
2265 arpindex
= i40iw_addr_resolve_neigh_ipv6(iwdev
,
2273 i40iw_pr_err("cm_node arpindex\n");
2277 ether_addr_copy(cm_node
->rem_mac
, iwdev
->arp_table
[arpindex
].mac_addr
);
2278 i40iw_add_hte_node(cm_core
, cm_node
);
2279 cm_core
->stats_nodes_created
++;
2284 * i40iw_rem_ref_cm_node - destroy an instance of a cm node
2285 * @cm_node: connection's node
2287 static void i40iw_rem_ref_cm_node(struct i40iw_cm_node
*cm_node
)
2289 struct i40iw_cm_core
*cm_core
= cm_node
->cm_core
;
2290 struct i40iw_qp
*iwqp
;
2291 struct i40iw_cm_info nfo
;
2292 unsigned long flags
;
2294 spin_lock_irqsave(&cm_node
->cm_core
->ht_lock
, flags
);
2295 if (atomic_dec_return(&cm_node
->ref_count
)) {
2296 spin_unlock_irqrestore(&cm_node
->cm_core
->ht_lock
, flags
);
2299 list_del(&cm_node
->list
);
2300 spin_unlock_irqrestore(&cm_node
->cm_core
->ht_lock
, flags
);
2302 /* if the node is destroyed before connection was accelerated */
2303 if (!cm_node
->accelerated
&& cm_node
->accept_pend
) {
2304 pr_err("node destroyed before established\n");
2305 atomic_dec(&cm_node
->listener
->pend_accepts_cnt
);
2307 if (cm_node
->close_entry
)
2308 i40iw_handle_close_entry(cm_node
, 0);
2309 if (cm_node
->listener
) {
2310 i40iw_dec_refcnt_listen(cm_core
, cm_node
->listener
, 0, true);
2312 if (cm_node
->apbvt_set
) {
2313 i40iw_manage_apbvt(cm_node
->iwdev
,
2315 I40IW_MANAGE_APBVT_DEL
);
2316 cm_node
->apbvt_set
= 0;
2318 i40iw_get_addr_info(cm_node
, &nfo
);
2319 if (cm_node
->qhash_set
) {
2320 i40iw_manage_qhash(cm_node
->iwdev
,
2322 I40IW_QHASH_TYPE_TCP_ESTABLISHED
,
2323 I40IW_QHASH_MANAGE_TYPE_DELETE
,
2326 cm_node
->qhash_set
= 0;
2330 iwqp
= cm_node
->iwqp
;
2332 iwqp
->cm_node
= NULL
;
2333 i40iw_rem_ref(&iwqp
->ibqp
);
2334 cm_node
->iwqp
= NULL
;
2335 } else if (cm_node
->qhash_set
) {
2336 i40iw_get_addr_info(cm_node
, &nfo
);
2337 i40iw_manage_qhash(cm_node
->iwdev
,
2339 I40IW_QHASH_TYPE_TCP_ESTABLISHED
,
2340 I40IW_QHASH_MANAGE_TYPE_DELETE
,
2343 cm_node
->qhash_set
= 0;
2346 cm_node
->cm_core
->stats_nodes_destroyed
++;
2351 * i40iw_handle_fin_pkt - FIN packet received
2352 * @cm_node: connection's node
2354 static void i40iw_handle_fin_pkt(struct i40iw_cm_node
*cm_node
)
2358 switch (cm_node
->state
) {
2359 case I40IW_CM_STATE_SYN_RCVD
:
2360 case I40IW_CM_STATE_SYN_SENT
:
2361 case I40IW_CM_STATE_ESTABLISHED
:
2362 case I40IW_CM_STATE_MPAREJ_RCVD
:
2363 cm_node
->tcp_cntxt
.rcv_nxt
++;
2364 i40iw_cleanup_retrans_entry(cm_node
);
2365 cm_node
->state
= I40IW_CM_STATE_LAST_ACK
;
2366 i40iw_send_fin(cm_node
);
2368 case I40IW_CM_STATE_MPAREQ_SENT
:
2369 i40iw_create_event(cm_node
, I40IW_CM_EVENT_ABORTED
);
2370 cm_node
->tcp_cntxt
.rcv_nxt
++;
2371 i40iw_cleanup_retrans_entry(cm_node
);
2372 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2373 atomic_inc(&cm_node
->ref_count
);
2374 i40iw_send_reset(cm_node
);
2376 case I40IW_CM_STATE_FIN_WAIT1
:
2377 cm_node
->tcp_cntxt
.rcv_nxt
++;
2378 i40iw_cleanup_retrans_entry(cm_node
);
2379 cm_node
->state
= I40IW_CM_STATE_CLOSING
;
2380 i40iw_send_ack(cm_node
);
2382 * Wait for ACK as this is simultaneous close.
2383 * After we receive ACK, do not send anything.
2387 case I40IW_CM_STATE_FIN_WAIT2
:
2388 cm_node
->tcp_cntxt
.rcv_nxt
++;
2389 i40iw_cleanup_retrans_entry(cm_node
);
2390 cm_node
->state
= I40IW_CM_STATE_TIME_WAIT
;
2391 i40iw_send_ack(cm_node
);
2393 i40iw_schedule_cm_timer(cm_node
, NULL
, I40IW_TIMER_TYPE_CLOSE
, 1, 0);
2395 i40iw_pr_err("node %p state = %d\n", cm_node
, cm_node
->state
);
2397 case I40IW_CM_STATE_TIME_WAIT
:
2398 cm_node
->tcp_cntxt
.rcv_nxt
++;
2399 i40iw_cleanup_retrans_entry(cm_node
);
2400 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2401 i40iw_rem_ref_cm_node(cm_node
);
2403 case I40IW_CM_STATE_OFFLOADED
:
2405 i40iw_pr_err("bad state node %p state = %d\n", cm_node
, cm_node
->state
);
2411 * i40iw_handle_rst_pkt - process received RST packet
2412 * @cm_node: connection's node
2413 * @rbuf: receive buffer
2415 static void i40iw_handle_rst_pkt(struct i40iw_cm_node
*cm_node
,
2416 struct i40iw_puda_buf
*rbuf
)
2418 i40iw_cleanup_retrans_entry(cm_node
);
2419 switch (cm_node
->state
) {
2420 case I40IW_CM_STATE_SYN_SENT
:
2421 case I40IW_CM_STATE_MPAREQ_SENT
:
2422 switch (cm_node
->mpa_frame_rev
) {
2424 cm_node
->mpa_frame_rev
= IETF_MPA_V1
;
2425 /* send a syn and goto syn sent state */
2426 cm_node
->state
= I40IW_CM_STATE_SYN_SENT
;
2427 if (i40iw_send_syn(cm_node
, 0))
2428 i40iw_active_open_err(cm_node
, false);
2432 i40iw_active_open_err(cm_node
, false);
2436 case I40IW_CM_STATE_MPAREQ_RCVD
:
2437 atomic_add_return(1, &cm_node
->passive_state
);
2439 case I40IW_CM_STATE_ESTABLISHED
:
2440 case I40IW_CM_STATE_SYN_RCVD
:
2441 case I40IW_CM_STATE_LISTENING
:
2442 i40iw_pr_err("Bad state state = %d\n", cm_node
->state
);
2443 i40iw_passive_open_err(cm_node
, false);
2445 case I40IW_CM_STATE_OFFLOADED
:
2446 i40iw_active_open_err(cm_node
, false);
2448 case I40IW_CM_STATE_CLOSED
:
2450 case I40IW_CM_STATE_FIN_WAIT2
:
2451 case I40IW_CM_STATE_FIN_WAIT1
:
2452 case I40IW_CM_STATE_LAST_ACK
:
2453 cm_node
->cm_id
->rem_ref(cm_node
->cm_id
);
2455 case I40IW_CM_STATE_TIME_WAIT
:
2456 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2457 i40iw_rem_ref_cm_node(cm_node
);
2465 * i40iw_handle_rcv_mpa - Process a recv'd mpa buffer
2466 * @cm_node: connection's node
2467 * @rbuf: receive buffer
2469 static void i40iw_handle_rcv_mpa(struct i40iw_cm_node
*cm_node
,
2470 struct i40iw_puda_buf
*rbuf
)
2473 int datasize
= rbuf
->datalen
;
2474 u8
*dataloc
= rbuf
->data
;
2476 enum i40iw_cm_event_type type
= I40IW_CM_EVENT_UNKNOWN
;
2479 ret
= i40iw_parse_mpa(cm_node
, dataloc
, &res_type
, datasize
);
2481 if (cm_node
->state
== I40IW_CM_STATE_MPAREQ_SENT
)
2482 i40iw_active_open_err(cm_node
, true);
2484 i40iw_passive_open_err(cm_node
, true);
2488 switch (cm_node
->state
) {
2489 case I40IW_CM_STATE_ESTABLISHED
:
2490 if (res_type
== I40IW_MPA_REQUEST_REJECT
)
2491 i40iw_pr_err("state for reject\n");
2492 cm_node
->state
= I40IW_CM_STATE_MPAREQ_RCVD
;
2493 type
= I40IW_CM_EVENT_MPA_REQ
;
2494 i40iw_send_ack(cm_node
); /* ACK received MPA request */
2495 atomic_set(&cm_node
->passive_state
,
2496 I40IW_PASSIVE_STATE_INDICATED
);
2498 case I40IW_CM_STATE_MPAREQ_SENT
:
2499 i40iw_cleanup_retrans_entry(cm_node
);
2500 if (res_type
== I40IW_MPA_REQUEST_REJECT
) {
2501 type
= I40IW_CM_EVENT_MPA_REJECT
;
2502 cm_node
->state
= I40IW_CM_STATE_MPAREJ_RCVD
;
2504 type
= I40IW_CM_EVENT_CONNECTED
;
2505 cm_node
->state
= I40IW_CM_STATE_OFFLOADED
;
2507 i40iw_send_ack(cm_node
);
2510 pr_err("%s wrong cm_node state =%d\n", __func__
, cm_node
->state
);
2513 i40iw_create_event(cm_node
, type
);
2517 * i40iw_indicate_pkt_err - Send up err event to cm
2518 * @cm_node: connection's node
2520 static void i40iw_indicate_pkt_err(struct i40iw_cm_node
*cm_node
)
2522 switch (cm_node
->state
) {
2523 case I40IW_CM_STATE_SYN_SENT
:
2524 case I40IW_CM_STATE_MPAREQ_SENT
:
2525 i40iw_active_open_err(cm_node
, true);
2527 case I40IW_CM_STATE_ESTABLISHED
:
2528 case I40IW_CM_STATE_SYN_RCVD
:
2529 i40iw_passive_open_err(cm_node
, true);
2531 case I40IW_CM_STATE_OFFLOADED
:
2538 * i40iw_check_syn - Check for error on received syn ack
2539 * @cm_node: connection's node
2540 * @tcph: pointer tcp header
2542 static int i40iw_check_syn(struct i40iw_cm_node
*cm_node
, struct tcphdr
*tcph
)
2546 if (ntohl(tcph
->ack_seq
) != cm_node
->tcp_cntxt
.loc_seq_num
) {
2548 i40iw_active_open_err(cm_node
, true);
2554 * i40iw_check_seq - check seq numbers if OK
2555 * @cm_node: connection's node
2556 * @tcph: pointer tcp header
2558 static int i40iw_check_seq(struct i40iw_cm_node
*cm_node
, struct tcphdr
*tcph
)
2563 u32 loc_seq_num
= cm_node
->tcp_cntxt
.loc_seq_num
;
2564 u32 rcv_nxt
= cm_node
->tcp_cntxt
.rcv_nxt
;
2567 seq
= ntohl(tcph
->seq
);
2568 ack_seq
= ntohl(tcph
->ack_seq
);
2569 rcv_wnd
= cm_node
->tcp_cntxt
.rcv_wnd
;
2570 if (ack_seq
!= loc_seq_num
)
2572 else if (!between(seq
, rcv_nxt
, (rcv_nxt
+ rcv_wnd
)))
2575 i40iw_pr_err("seq number\n");
2576 i40iw_indicate_pkt_err(cm_node
);
2582 * i40iw_handle_syn_pkt - is for Passive node
2583 * @cm_node: connection's node
2584 * @rbuf: receive buffer
2586 static void i40iw_handle_syn_pkt(struct i40iw_cm_node
*cm_node
,
2587 struct i40iw_puda_buf
*rbuf
)
2589 struct tcphdr
*tcph
= (struct tcphdr
*)rbuf
->tcph
;
2593 struct i40iw_cm_info nfo
;
2595 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2596 inc_sequence
= ntohl(tcph
->seq
);
2598 switch (cm_node
->state
) {
2599 case I40IW_CM_STATE_SYN_SENT
:
2600 case I40IW_CM_STATE_MPAREQ_SENT
:
2601 /* Rcvd syn on active open connection */
2602 i40iw_active_open_err(cm_node
, 1);
2604 case I40IW_CM_STATE_LISTENING
:
2606 if (atomic_read(&cm_node
->listener
->pend_accepts_cnt
) >
2607 cm_node
->listener
->backlog
) {
2608 cm_node
->cm_core
->stats_backlog_drops
++;
2609 i40iw_passive_open_err(cm_node
, false);
2612 ret
= i40iw_handle_tcp_options(cm_node
, tcph
, optionsize
, 1);
2614 i40iw_passive_open_err(cm_node
, false);
2618 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ 1;
2619 cm_node
->accept_pend
= 1;
2620 atomic_inc(&cm_node
->listener
->pend_accepts_cnt
);
2622 cm_node
->state
= I40IW_CM_STATE_SYN_RCVD
;
2623 i40iw_get_addr_info(cm_node
, &nfo
);
2624 ret
= i40iw_manage_qhash(cm_node
->iwdev
,
2626 I40IW_QHASH_TYPE_TCP_ESTABLISHED
,
2627 I40IW_QHASH_MANAGE_TYPE_ADD
,
2630 cm_node
->qhash_set
= true;
2632 case I40IW_CM_STATE_CLOSED
:
2633 i40iw_cleanup_retrans_entry(cm_node
);
2634 atomic_inc(&cm_node
->ref_count
);
2635 i40iw_send_reset(cm_node
);
2637 case I40IW_CM_STATE_OFFLOADED
:
2638 case I40IW_CM_STATE_ESTABLISHED
:
2639 case I40IW_CM_STATE_FIN_WAIT1
:
2640 case I40IW_CM_STATE_FIN_WAIT2
:
2641 case I40IW_CM_STATE_MPAREQ_RCVD
:
2642 case I40IW_CM_STATE_LAST_ACK
:
2643 case I40IW_CM_STATE_CLOSING
:
2644 case I40IW_CM_STATE_UNKNOWN
:
2651 * i40iw_handle_synack_pkt - Process SYN+ACK packet (active side)
2652 * @cm_node: connection's node
2653 * @rbuf: receive buffer
2655 static void i40iw_handle_synack_pkt(struct i40iw_cm_node
*cm_node
,
2656 struct i40iw_puda_buf
*rbuf
)
2658 struct tcphdr
*tcph
= (struct tcphdr
*)rbuf
->tcph
;
2663 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2664 inc_sequence
= ntohl(tcph
->seq
);
2665 switch (cm_node
->state
) {
2666 case I40IW_CM_STATE_SYN_SENT
:
2667 i40iw_cleanup_retrans_entry(cm_node
);
2669 if (i40iw_check_syn(cm_node
, tcph
)) {
2670 i40iw_pr_err("check syn fail\n");
2673 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2675 ret
= i40iw_handle_tcp_options(cm_node
, tcph
, optionsize
, 0);
2677 i40iw_debug(cm_node
->dev
,
2679 "cm_node=%p tcp_options failed\n",
2683 i40iw_cleanup_retrans_entry(cm_node
);
2684 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ 1;
2685 i40iw_send_ack(cm_node
); /* ACK for the syn_ack */
2686 ret
= i40iw_send_mpa_request(cm_node
);
2688 i40iw_debug(cm_node
->dev
,
2690 "cm_node=%p i40iw_send_mpa_request failed\n",
2694 cm_node
->state
= I40IW_CM_STATE_MPAREQ_SENT
;
2696 case I40IW_CM_STATE_MPAREQ_RCVD
:
2697 i40iw_passive_open_err(cm_node
, true);
2699 case I40IW_CM_STATE_LISTENING
:
2700 cm_node
->tcp_cntxt
.loc_seq_num
= ntohl(tcph
->ack_seq
);
2701 i40iw_cleanup_retrans_entry(cm_node
);
2702 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2703 i40iw_send_reset(cm_node
);
2705 case I40IW_CM_STATE_CLOSED
:
2706 cm_node
->tcp_cntxt
.loc_seq_num
= ntohl(tcph
->ack_seq
);
2707 i40iw_cleanup_retrans_entry(cm_node
);
2708 atomic_inc(&cm_node
->ref_count
);
2709 i40iw_send_reset(cm_node
);
2711 case I40IW_CM_STATE_ESTABLISHED
:
2712 case I40IW_CM_STATE_FIN_WAIT1
:
2713 case I40IW_CM_STATE_FIN_WAIT2
:
2714 case I40IW_CM_STATE_LAST_ACK
:
2715 case I40IW_CM_STATE_OFFLOADED
:
2716 case I40IW_CM_STATE_CLOSING
:
2717 case I40IW_CM_STATE_UNKNOWN
:
2718 case I40IW_CM_STATE_MPAREQ_SENT
:
2725 * i40iw_handle_ack_pkt - process packet with ACK
2726 * @cm_node: connection's node
2727 * @rbuf: receive buffer
2729 static int i40iw_handle_ack_pkt(struct i40iw_cm_node
*cm_node
,
2730 struct i40iw_puda_buf
*rbuf
)
2732 struct tcphdr
*tcph
= (struct tcphdr
*)rbuf
->tcph
;
2736 u32 datasize
= rbuf
->datalen
;
2738 optionsize
= (tcph
->doff
<< 2) - sizeof(struct tcphdr
);
2740 if (i40iw_check_seq(cm_node
, tcph
))
2743 inc_sequence
= ntohl(tcph
->seq
);
2744 switch (cm_node
->state
) {
2745 case I40IW_CM_STATE_SYN_RCVD
:
2746 i40iw_cleanup_retrans_entry(cm_node
);
2747 ret
= i40iw_handle_tcp_options(cm_node
, tcph
, optionsize
, 1);
2750 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2751 cm_node
->state
= I40IW_CM_STATE_ESTABLISHED
;
2753 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2754 i40iw_handle_rcv_mpa(cm_node
, rbuf
);
2757 case I40IW_CM_STATE_ESTABLISHED
:
2758 i40iw_cleanup_retrans_entry(cm_node
);
2760 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2761 i40iw_handle_rcv_mpa(cm_node
, rbuf
);
2764 case I40IW_CM_STATE_MPAREQ_SENT
:
2765 cm_node
->tcp_cntxt
.rem_ack_num
= ntohl(tcph
->ack_seq
);
2767 cm_node
->tcp_cntxt
.rcv_nxt
= inc_sequence
+ datasize
;
2768 cm_node
->ack_rcvd
= false;
2769 i40iw_handle_rcv_mpa(cm_node
, rbuf
);
2771 cm_node
->ack_rcvd
= true;
2774 case I40IW_CM_STATE_LISTENING
:
2775 i40iw_cleanup_retrans_entry(cm_node
);
2776 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2777 i40iw_send_reset(cm_node
);
2779 case I40IW_CM_STATE_CLOSED
:
2780 i40iw_cleanup_retrans_entry(cm_node
);
2781 atomic_inc(&cm_node
->ref_count
);
2782 i40iw_send_reset(cm_node
);
2784 case I40IW_CM_STATE_LAST_ACK
:
2785 case I40IW_CM_STATE_CLOSING
:
2786 i40iw_cleanup_retrans_entry(cm_node
);
2787 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
2788 if (!cm_node
->accept_pend
)
2789 cm_node
->cm_id
->rem_ref(cm_node
->cm_id
);
2790 i40iw_rem_ref_cm_node(cm_node
);
2792 case I40IW_CM_STATE_FIN_WAIT1
:
2793 i40iw_cleanup_retrans_entry(cm_node
);
2794 cm_node
->state
= I40IW_CM_STATE_FIN_WAIT2
;
2796 case I40IW_CM_STATE_SYN_SENT
:
2797 case I40IW_CM_STATE_FIN_WAIT2
:
2798 case I40IW_CM_STATE_OFFLOADED
:
2799 case I40IW_CM_STATE_MPAREQ_RCVD
:
2800 case I40IW_CM_STATE_UNKNOWN
:
2802 i40iw_cleanup_retrans_entry(cm_node
);
2809 * i40iw_process_packet - process cm packet
2810 * @cm_node: connection's node
2811 * @rbuf: receive buffer
2813 static void i40iw_process_packet(struct i40iw_cm_node
*cm_node
,
2814 struct i40iw_puda_buf
*rbuf
)
2816 enum i40iw_tcpip_pkt_type pkt_type
= I40IW_PKT_TYPE_UNKNOWN
;
2817 struct tcphdr
*tcph
= (struct tcphdr
*)rbuf
->tcph
;
2822 pkt_type
= I40IW_PKT_TYPE_RST
;
2823 } else if (tcph
->syn
) {
2824 pkt_type
= I40IW_PKT_TYPE_SYN
;
2826 pkt_type
= I40IW_PKT_TYPE_SYNACK
;
2827 } else if (tcph
->ack
) {
2828 pkt_type
= I40IW_PKT_TYPE_ACK
;
2834 case I40IW_PKT_TYPE_SYN
:
2835 i40iw_handle_syn_pkt(cm_node
, rbuf
);
2837 case I40IW_PKT_TYPE_SYNACK
:
2838 i40iw_handle_synack_pkt(cm_node
, rbuf
);
2840 case I40IW_PKT_TYPE_ACK
:
2841 ret
= i40iw_handle_ack_pkt(cm_node
, rbuf
);
2842 if (fin_set
&& !ret
)
2843 i40iw_handle_fin_pkt(cm_node
);
2845 case I40IW_PKT_TYPE_RST
:
2846 i40iw_handle_rst_pkt(cm_node
, rbuf
);
2850 (!i40iw_check_seq(cm_node
, (struct tcphdr
*)rbuf
->tcph
)))
2851 i40iw_handle_fin_pkt(cm_node
);
2857 * i40iw_make_listen_node - create a listen node with params
2858 * @cm_core: cm's core
2859 * @iwdev: iwarp device structure
2860 * @cm_info: quad info for connection
2862 static struct i40iw_cm_listener
*i40iw_make_listen_node(
2863 struct i40iw_cm_core
*cm_core
,
2864 struct i40iw_device
*iwdev
,
2865 struct i40iw_cm_info
*cm_info
)
2867 struct i40iw_cm_listener
*listener
;
2868 unsigned long flags
;
2870 /* cannot have multiple matching listeners */
2871 listener
= i40iw_find_listener(cm_core
, cm_info
->loc_addr
,
2874 I40IW_CM_LISTENER_EITHER_STATE
);
2876 (listener
->listener_state
== I40IW_CM_LISTENER_ACTIVE_STATE
)) {
2877 atomic_dec(&listener
->ref_count
);
2878 i40iw_debug(cm_core
->dev
,
2880 "Not creating listener since it already exists\n");
2885 /* create a CM listen node (1/2 node to compare incoming traffic to) */
2886 listener
= kzalloc(sizeof(*listener
), GFP_KERNEL
);
2889 cm_core
->stats_listen_nodes_created
++;
2890 memcpy(listener
->loc_addr
, cm_info
->loc_addr
, sizeof(listener
->loc_addr
));
2891 listener
->loc_port
= cm_info
->loc_port
;
2893 INIT_LIST_HEAD(&listener
->child_listen_list
);
2895 atomic_set(&listener
->ref_count
, 1);
2897 listener
->reused_node
= 1;
2900 listener
->cm_id
= cm_info
->cm_id
;
2901 listener
->ipv4
= cm_info
->ipv4
;
2902 listener
->vlan_id
= cm_info
->vlan_id
;
2903 atomic_set(&listener
->pend_accepts_cnt
, 0);
2904 listener
->cm_core
= cm_core
;
2905 listener
->iwdev
= iwdev
;
2907 listener
->backlog
= cm_info
->backlog
;
2908 listener
->listener_state
= I40IW_CM_LISTENER_ACTIVE_STATE
;
2910 if (!listener
->reused_node
) {
2911 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
2912 list_add(&listener
->list
, &cm_core
->listen_nodes
);
2913 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
2920 * i40iw_create_cm_node - make a connection node with params
2921 * @cm_core: cm's core
2922 * @iwdev: iwarp device structure
2923 * @conn_param: upper layer connection parameters
2924 * @cm_info: quad info for connection
2926 static struct i40iw_cm_node
*i40iw_create_cm_node(
2927 struct i40iw_cm_core
*cm_core
,
2928 struct i40iw_device
*iwdev
,
2929 struct iw_cm_conn_param
*conn_param
,
2930 struct i40iw_cm_info
*cm_info
)
2932 struct i40iw_cm_node
*cm_node
;
2933 struct i40iw_cm_listener
*loopback_remotelistener
;
2934 struct i40iw_cm_node
*loopback_remotenode
;
2935 struct i40iw_cm_info loopback_cm_info
;
2937 u16 private_data_len
= conn_param
->private_data_len
;
2938 const void *private_data
= conn_param
->private_data
;
2940 /* create a CM connection node */
2941 cm_node
= i40iw_make_cm_node(cm_core
, iwdev
, cm_info
, NULL
);
2943 return ERR_PTR(-ENOMEM
);
2944 /* set our node side to client (active) side */
2945 cm_node
->tcp_cntxt
.client
= 1;
2946 cm_node
->tcp_cntxt
.rcv_wscale
= I40IW_CM_DEFAULT_RCV_WND_SCALE
;
2948 i40iw_record_ird_ord(cm_node
, conn_param
->ird
, conn_param
->ord
);
2950 if (!memcmp(cm_info
->loc_addr
, cm_info
->rem_addr
, sizeof(cm_info
->loc_addr
))) {
2951 loopback_remotelistener
= i40iw_find_listener(
2956 I40IW_CM_LISTENER_ACTIVE_STATE
);
2957 if (!loopback_remotelistener
) {
2958 i40iw_rem_ref_cm_node(cm_node
);
2959 return ERR_PTR(-ECONNREFUSED
);
2961 loopback_cm_info
= *cm_info
;
2962 loopback_cm_info
.loc_port
= cm_info
->rem_port
;
2963 loopback_cm_info
.rem_port
= cm_info
->loc_port
;
2964 loopback_cm_info
.cm_id
= loopback_remotelistener
->cm_id
;
2965 loopback_cm_info
.ipv4
= cm_info
->ipv4
;
2966 loopback_remotenode
= i40iw_make_cm_node(cm_core
,
2969 loopback_remotelistener
);
2970 if (!loopback_remotenode
) {
2971 i40iw_rem_ref_cm_node(cm_node
);
2972 return ERR_PTR(-ENOMEM
);
2974 cm_core
->stats_loopbacks
++;
2975 loopback_remotenode
->loopbackpartner
= cm_node
;
2976 loopback_remotenode
->tcp_cntxt
.rcv_wscale
=
2977 I40IW_CM_DEFAULT_RCV_WND_SCALE
;
2978 cm_node
->loopbackpartner
= loopback_remotenode
;
2979 memcpy(loopback_remotenode
->pdata_buf
, private_data
,
2981 loopback_remotenode
->pdata
.size
= private_data_len
;
2983 if (loopback_remotenode
->ord_size
> cm_node
->ird_size
)
2984 loopback_remotenode
->ord_size
=
2987 cm_node
->state
= I40IW_CM_STATE_OFFLOADED
;
2988 cm_node
->tcp_cntxt
.rcv_nxt
=
2989 loopback_remotenode
->tcp_cntxt
.loc_seq_num
;
2990 loopback_remotenode
->tcp_cntxt
.rcv_nxt
=
2991 cm_node
->tcp_cntxt
.loc_seq_num
;
2992 cm_node
->tcp_cntxt
.max_snd_wnd
=
2993 loopback_remotenode
->tcp_cntxt
.rcv_wnd
;
2994 loopback_remotenode
->tcp_cntxt
.max_snd_wnd
= cm_node
->tcp_cntxt
.rcv_wnd
;
2995 cm_node
->tcp_cntxt
.snd_wnd
= loopback_remotenode
->tcp_cntxt
.rcv_wnd
;
2996 loopback_remotenode
->tcp_cntxt
.snd_wnd
= cm_node
->tcp_cntxt
.rcv_wnd
;
2997 cm_node
->tcp_cntxt
.snd_wscale
= loopback_remotenode
->tcp_cntxt
.rcv_wscale
;
2998 loopback_remotenode
->tcp_cntxt
.snd_wscale
= cm_node
->tcp_cntxt
.rcv_wscale
;
3003 cm_node
->pdata
.size
= private_data_len
;
3004 cm_node
->pdata
.addr
= cm_node
->pdata_buf
;
3006 memcpy(cm_node
->pdata_buf
, private_data
, private_data_len
);
3008 cm_node
->state
= I40IW_CM_STATE_SYN_SENT
;
3013 * i40iw_cm_reject - reject and teardown a connection
3014 * @cm_node: connection's node
3015 * @pdate: ptr to private data for reject
3016 * @plen: size of private data
3018 static int i40iw_cm_reject(struct i40iw_cm_node
*cm_node
, const void *pdata
, u8 plen
)
3023 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
3024 struct i40iw_cm_node
*loopback
= cm_node
->loopbackpartner
;
3026 if (cm_node
->tcp_cntxt
.client
)
3028 i40iw_cleanup_retrans_entry(cm_node
);
3031 passive_state
= atomic_add_return(1, &cm_node
->passive_state
);
3032 if (passive_state
== I40IW_SEND_RESET_EVENT
) {
3033 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
3034 i40iw_rem_ref_cm_node(cm_node
);
3036 if (cm_node
->state
== I40IW_CM_STATE_LISTENER_DESTROYED
) {
3037 i40iw_rem_ref_cm_node(cm_node
);
3039 ret
= i40iw_send_mpa_reject(cm_node
, pdata
, plen
);
3041 cm_node
->state
= I40IW_CM_STATE_CLOSED
;
3042 err
= i40iw_send_reset(cm_node
);
3044 i40iw_pr_err("send reset failed\n");
3046 cm_id
->add_ref(cm_id
);
3051 cm_node
->cm_id
= NULL
;
3052 if (cm_node
->state
== I40IW_CM_STATE_LISTENER_DESTROYED
) {
3053 i40iw_rem_ref_cm_node(cm_node
);
3054 i40iw_rem_ref_cm_node(loopback
);
3056 ret
= i40iw_send_cm_event(loopback
,
3058 IW_CM_EVENT_CONNECT_REPLY
,
3060 i40iw_rem_ref_cm_node(cm_node
);
3061 loopback
->state
= I40IW_CM_STATE_CLOSING
;
3063 cm_id
= loopback
->cm_id
;
3064 i40iw_rem_ref_cm_node(loopback
);
3065 cm_id
->rem_ref(cm_id
);
3073 * i40iw_cm_close - close of cm connection
3074 * @cm_node: connection's node
3076 static int i40iw_cm_close(struct i40iw_cm_node
*cm_node
)
3083 switch (cm_node
->state
) {
3084 case I40IW_CM_STATE_SYN_RCVD
:
3085 case I40IW_CM_STATE_SYN_SENT
:
3086 case I40IW_CM_STATE_ONE_SIDE_ESTABLISHED
:
3087 case I40IW_CM_STATE_ESTABLISHED
:
3088 case I40IW_CM_STATE_ACCEPTING
:
3089 case I40IW_CM_STATE_MPAREQ_SENT
:
3090 case I40IW_CM_STATE_MPAREQ_RCVD
:
3091 i40iw_cleanup_retrans_entry(cm_node
);
3092 i40iw_send_reset(cm_node
);
3094 case I40IW_CM_STATE_CLOSE_WAIT
:
3095 cm_node
->state
= I40IW_CM_STATE_LAST_ACK
;
3096 i40iw_send_fin(cm_node
);
3098 case I40IW_CM_STATE_FIN_WAIT1
:
3099 case I40IW_CM_STATE_FIN_WAIT2
:
3100 case I40IW_CM_STATE_LAST_ACK
:
3101 case I40IW_CM_STATE_TIME_WAIT
:
3102 case I40IW_CM_STATE_CLOSING
:
3105 case I40IW_CM_STATE_LISTENING
:
3106 i40iw_cleanup_retrans_entry(cm_node
);
3107 i40iw_send_reset(cm_node
);
3109 case I40IW_CM_STATE_MPAREJ_RCVD
:
3110 case I40IW_CM_STATE_UNKNOWN
:
3111 case I40IW_CM_STATE_INITED
:
3112 case I40IW_CM_STATE_CLOSED
:
3113 case I40IW_CM_STATE_LISTENER_DESTROYED
:
3114 i40iw_rem_ref_cm_node(cm_node
);
3116 case I40IW_CM_STATE_OFFLOADED
:
3117 if (cm_node
->send_entry
)
3118 i40iw_pr_err("send_entry\n");
3119 i40iw_rem_ref_cm_node(cm_node
);
3126 * i40iw_receive_ilq - recv an ETHERNET packet, and process it
3128 * @vsi: pointer to the vsi structure
3129 * @rbuf: receive buffer
3131 void i40iw_receive_ilq(struct i40iw_sc_vsi
*vsi
, struct i40iw_puda_buf
*rbuf
)
3133 struct i40iw_cm_node
*cm_node
;
3134 struct i40iw_cm_listener
*listener
;
3136 struct ipv6hdr
*ip6h
;
3137 struct tcphdr
*tcph
;
3138 struct i40iw_cm_info cm_info
;
3139 struct i40iw_sc_dev
*dev
= vsi
->dev
;
3140 struct i40iw_device
*iwdev
= (struct i40iw_device
*)dev
->back_dev
;
3141 struct i40iw_cm_core
*cm_core
= &iwdev
->cm_core
;
3142 struct vlan_ethhdr
*ethh
;
3145 /* if vlan, then maclen = 18 else 14 */
3146 iph
= (struct iphdr
*)rbuf
->iph
;
3147 memset(&cm_info
, 0, sizeof(cm_info
));
3149 i40iw_debug_buf(dev
,
3151 "RECEIVE ILQ BUFFER",
3154 ethh
= (struct vlan_ethhdr
*)rbuf
->mem
.va
;
3156 if (ethh
->h_vlan_proto
== htons(ETH_P_8021Q
)) {
3157 vtag
= ntohs(ethh
->h_vlan_TCI
);
3158 cm_info
.user_pri
= (vtag
& VLAN_PRIO_MASK
) >> VLAN_PRIO_SHIFT
;
3159 cm_info
.vlan_id
= vtag
& VLAN_VID_MASK
;
3160 i40iw_debug(cm_core
->dev
,
3166 cm_info
.vlan_id
= I40IW_NO_VLAN
;
3168 tcph
= (struct tcphdr
*)rbuf
->tcph
;
3171 cm_info
.loc_addr
[0] = ntohl(iph
->daddr
);
3172 cm_info
.rem_addr
[0] = ntohl(iph
->saddr
);
3173 cm_info
.ipv4
= true;
3174 cm_info
.tos
= iph
->tos
;
3176 ip6h
= (struct ipv6hdr
*)rbuf
->iph
;
3177 i40iw_copy_ip_ntohl(cm_info
.loc_addr
,
3178 ip6h
->daddr
.in6_u
.u6_addr32
);
3179 i40iw_copy_ip_ntohl(cm_info
.rem_addr
,
3180 ip6h
->saddr
.in6_u
.u6_addr32
);
3181 cm_info
.ipv4
= false;
3182 cm_info
.tos
= (ip6h
->priority
<< 4) | (ip6h
->flow_lbl
[0] >> 4);
3184 cm_info
.loc_port
= ntohs(tcph
->dest
);
3185 cm_info
.rem_port
= ntohs(tcph
->source
);
3186 cm_node
= i40iw_find_node(cm_core
,
3195 /* Only type of packet accepted are for */
3196 /* the PASSIVE open (syn only) */
3197 if (!tcph
->syn
|| tcph
->ack
)
3200 i40iw_find_listener(cm_core
,
3204 I40IW_CM_LISTENER_ACTIVE_STATE
);
3206 cm_info
.cm_id
= NULL
;
3207 i40iw_debug(cm_core
->dev
,
3209 "%s no listener found\n",
3213 cm_info
.cm_id
= listener
->cm_id
;
3214 cm_node
= i40iw_make_cm_node(cm_core
, iwdev
, &cm_info
, listener
);
3216 i40iw_debug(cm_core
->dev
,
3218 "%s allocate node failed\n",
3220 atomic_dec(&listener
->ref_count
);
3223 if (!tcph
->rst
&& !tcph
->fin
) {
3224 cm_node
->state
= I40IW_CM_STATE_LISTENING
;
3226 i40iw_rem_ref_cm_node(cm_node
);
3229 atomic_inc(&cm_node
->ref_count
);
3230 } else if (cm_node
->state
== I40IW_CM_STATE_OFFLOADED
) {
3231 i40iw_rem_ref_cm_node(cm_node
);
3234 i40iw_process_packet(cm_node
, rbuf
);
3235 i40iw_rem_ref_cm_node(cm_node
);
3239 * i40iw_setup_cm_core - allocate a top level instance of a cm
3241 * @iwdev: iwarp device structure
3243 int i40iw_setup_cm_core(struct i40iw_device
*iwdev
)
3245 struct i40iw_cm_core
*cm_core
= &iwdev
->cm_core
;
3247 cm_core
->iwdev
= iwdev
;
3248 cm_core
->dev
= &iwdev
->sc_dev
;
3250 INIT_LIST_HEAD(&cm_core
->accelerated_list
);
3251 INIT_LIST_HEAD(&cm_core
->non_accelerated_list
);
3252 INIT_LIST_HEAD(&cm_core
->listen_nodes
);
3254 timer_setup(&cm_core
->tcp_timer
, i40iw_cm_timer_tick
, 0);
3256 spin_lock_init(&cm_core
->ht_lock
);
3257 spin_lock_init(&cm_core
->listen_list_lock
);
3258 spin_lock_init(&cm_core
->apbvt_lock
);
3260 cm_core
->event_wq
= alloc_ordered_workqueue("iwewq",
3262 if (!cm_core
->event_wq
)
3265 cm_core
->disconn_wq
= alloc_ordered_workqueue("iwdwq",
3267 if (!cm_core
->disconn_wq
)
3272 i40iw_cleanup_cm_core(&iwdev
->cm_core
);
3278 * i40iw_cleanup_cm_core - deallocate a top level instance of a
3280 * @cm_core: cm's core
3282 void i40iw_cleanup_cm_core(struct i40iw_cm_core
*cm_core
)
3284 unsigned long flags
;
3289 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
3290 if (timer_pending(&cm_core
->tcp_timer
))
3291 del_timer_sync(&cm_core
->tcp_timer
);
3292 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
3294 if (cm_core
->event_wq
)
3295 destroy_workqueue(cm_core
->event_wq
);
3296 if (cm_core
->disconn_wq
)
3297 destroy_workqueue(cm_core
->disconn_wq
);
3301 * i40iw_init_tcp_ctx - setup qp context
3302 * @cm_node: connection's node
3303 * @tcp_info: offload info for tcp
3304 * @iwqp: associate qp for the connection
3306 static void i40iw_init_tcp_ctx(struct i40iw_cm_node
*cm_node
,
3307 struct i40iw_tcp_offload_info
*tcp_info
,
3308 struct i40iw_qp
*iwqp
)
3310 tcp_info
->ipv4
= cm_node
->ipv4
;
3311 tcp_info
->drop_ooo_seg
= true;
3312 tcp_info
->wscale
= true;
3313 tcp_info
->ignore_tcp_opt
= true;
3314 tcp_info
->ignore_tcp_uns_opt
= true;
3315 tcp_info
->no_nagle
= false;
3317 tcp_info
->ttl
= I40IW_DEFAULT_TTL
;
3318 tcp_info
->rtt_var
= cpu_to_le32(I40IW_DEFAULT_RTT_VAR
);
3319 tcp_info
->ss_thresh
= cpu_to_le32(I40IW_DEFAULT_SS_THRESH
);
3320 tcp_info
->rexmit_thresh
= I40IW_DEFAULT_REXMIT_THRESH
;
3322 tcp_info
->tcp_state
= I40IW_TCP_STATE_ESTABLISHED
;
3323 tcp_info
->snd_wscale
= cm_node
->tcp_cntxt
.snd_wscale
;
3324 tcp_info
->rcv_wscale
= cm_node
->tcp_cntxt
.rcv_wscale
;
3326 tcp_info
->snd_nxt
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
3327 tcp_info
->snd_wnd
= cpu_to_le32(cm_node
->tcp_cntxt
.snd_wnd
);
3328 tcp_info
->rcv_nxt
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_nxt
);
3329 tcp_info
->snd_max
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
3331 tcp_info
->snd_una
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
3332 tcp_info
->cwnd
= cpu_to_le32(2 * cm_node
->tcp_cntxt
.mss
);
3333 tcp_info
->snd_wl1
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_nxt
);
3334 tcp_info
->snd_wl2
= cpu_to_le32(cm_node
->tcp_cntxt
.loc_seq_num
);
3335 tcp_info
->max_snd_window
= cpu_to_le32(cm_node
->tcp_cntxt
.max_snd_wnd
);
3336 tcp_info
->rcv_wnd
= cpu_to_le32(cm_node
->tcp_cntxt
.rcv_wnd
<<
3337 cm_node
->tcp_cntxt
.rcv_wscale
);
3339 tcp_info
->flow_label
= 0;
3340 tcp_info
->snd_mss
= cpu_to_le32(((u32
)cm_node
->tcp_cntxt
.mss
));
3341 if (cm_node
->vlan_id
<= VLAN_VID_MASK
) {
3342 tcp_info
->insert_vlan_tag
= true;
3343 tcp_info
->vlan_tag
= cpu_to_le16(((u16
)cm_node
->user_pri
<< I40IW_VLAN_PRIO_SHIFT
) |
3346 if (cm_node
->ipv4
) {
3347 tcp_info
->src_port
= cpu_to_le16(cm_node
->loc_port
);
3348 tcp_info
->dst_port
= cpu_to_le16(cm_node
->rem_port
);
3350 tcp_info
->dest_ip_addr3
= cpu_to_le32(cm_node
->rem_addr
[0]);
3351 tcp_info
->local_ipaddr3
= cpu_to_le32(cm_node
->loc_addr
[0]);
3353 cpu_to_le16((u16
)i40iw_arp_table(
3355 &tcp_info
->dest_ip_addr3
,
3358 I40IW_ARP_RESOLVE
));
3360 tcp_info
->src_port
= cpu_to_le16(cm_node
->loc_port
);
3361 tcp_info
->dst_port
= cpu_to_le16(cm_node
->rem_port
);
3362 tcp_info
->dest_ip_addr0
= cpu_to_le32(cm_node
->rem_addr
[0]);
3363 tcp_info
->dest_ip_addr1
= cpu_to_le32(cm_node
->rem_addr
[1]);
3364 tcp_info
->dest_ip_addr2
= cpu_to_le32(cm_node
->rem_addr
[2]);
3365 tcp_info
->dest_ip_addr3
= cpu_to_le32(cm_node
->rem_addr
[3]);
3366 tcp_info
->local_ipaddr0
= cpu_to_le32(cm_node
->loc_addr
[0]);
3367 tcp_info
->local_ipaddr1
= cpu_to_le32(cm_node
->loc_addr
[1]);
3368 tcp_info
->local_ipaddr2
= cpu_to_le32(cm_node
->loc_addr
[2]);
3369 tcp_info
->local_ipaddr3
= cpu_to_le32(cm_node
->loc_addr
[3]);
3371 cpu_to_le16((u16
)i40iw_arp_table(
3373 &tcp_info
->dest_ip_addr0
,
3376 I40IW_ARP_RESOLVE
));
3381 * i40iw_cm_init_tsa_conn - setup qp for RTS
3382 * @iwqp: associate qp for the connection
3383 * @cm_node: connection's node
3385 static void i40iw_cm_init_tsa_conn(struct i40iw_qp
*iwqp
,
3386 struct i40iw_cm_node
*cm_node
)
3388 struct i40iw_tcp_offload_info tcp_info
;
3389 struct i40iwarp_offload_info
*iwarp_info
;
3390 struct i40iw_qp_host_ctx_info
*ctx_info
;
3391 struct i40iw_device
*iwdev
= iwqp
->iwdev
;
3392 struct i40iw_sc_dev
*dev
= &iwqp
->iwdev
->sc_dev
;
3394 memset(&tcp_info
, 0x00, sizeof(struct i40iw_tcp_offload_info
));
3395 iwarp_info
= &iwqp
->iwarp_info
;
3396 ctx_info
= &iwqp
->ctx_info
;
3398 ctx_info
->tcp_info
= &tcp_info
;
3399 ctx_info
->send_cq_num
= iwqp
->iwscq
->sc_cq
.cq_uk
.cq_id
;
3400 ctx_info
->rcv_cq_num
= iwqp
->iwrcq
->sc_cq
.cq_uk
.cq_id
;
3402 iwarp_info
->ord_size
= cm_node
->ord_size
;
3403 iwarp_info
->ird_size
= i40iw_derive_hw_ird_setting(cm_node
->ird_size
);
3405 if (iwarp_info
->ord_size
== 1)
3406 iwarp_info
->ord_size
= 2;
3408 iwarp_info
->rd_enable
= true;
3409 iwarp_info
->rdmap_ver
= 1;
3410 iwarp_info
->ddp_ver
= 1;
3412 iwarp_info
->pd_id
= iwqp
->iwpd
->sc_pd
.pd_id
;
3414 ctx_info
->tcp_info_valid
= true;
3415 ctx_info
->iwarp_info_valid
= true;
3416 ctx_info
->add_to_qoslist
= true;
3417 ctx_info
->user_pri
= cm_node
->user_pri
;
3419 i40iw_init_tcp_ctx(cm_node
, &tcp_info
, iwqp
);
3420 if (cm_node
->snd_mark_en
) {
3421 iwarp_info
->snd_mark_en
= true;
3422 iwarp_info
->snd_mark_offset
= (tcp_info
.snd_nxt
&
3423 SNDMARKER_SEQNMASK
) + cm_node
->lsmm_size
;
3426 cm_node
->state
= I40IW_CM_STATE_OFFLOADED
;
3427 tcp_info
.tcp_state
= I40IW_TCP_STATE_ESTABLISHED
;
3428 tcp_info
.src_mac_addr_idx
= iwdev
->mac_ip_table_idx
;
3429 tcp_info
.tos
= cm_node
->tos
;
3431 dev
->iw_priv_qp_ops
->qp_setctx(&iwqp
->sc_qp
, (u64
*)(iwqp
->host_ctx
.va
), ctx_info
);
3433 /* once tcp_info is set, no need to do it again */
3434 ctx_info
->tcp_info_valid
= false;
3435 ctx_info
->iwarp_info_valid
= false;
3436 ctx_info
->add_to_qoslist
= false;
3440 * i40iw_cm_disconn - when a connection is being closed
3441 * @iwqp: associate qp for the connection
3443 void i40iw_cm_disconn(struct i40iw_qp
*iwqp
)
3445 struct disconn_work
*work
;
3446 struct i40iw_device
*iwdev
= iwqp
->iwdev
;
3447 struct i40iw_cm_core
*cm_core
= &iwdev
->cm_core
;
3448 unsigned long flags
;
3450 work
= kzalloc(sizeof(*work
), GFP_ATOMIC
);
3452 return; /* Timer will clean up */
3454 spin_lock_irqsave(&iwdev
->qptable_lock
, flags
);
3455 if (!iwdev
->qp_table
[iwqp
->ibqp
.qp_num
]) {
3456 spin_unlock_irqrestore(&iwdev
->qptable_lock
, flags
);
3457 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_CM
,
3458 "%s qp_id %d is already freed\n",
3459 __func__
, iwqp
->ibqp
.qp_num
);
3463 i40iw_add_ref(&iwqp
->ibqp
);
3464 spin_unlock_irqrestore(&iwdev
->qptable_lock
, flags
);
3467 INIT_WORK(&work
->work
, i40iw_disconnect_worker
);
3468 queue_work(cm_core
->disconn_wq
, &work
->work
);
3473 * i40iw_qp_disconnect - free qp and close cm
3474 * @iwqp: associate qp for the connection
3476 static void i40iw_qp_disconnect(struct i40iw_qp
*iwqp
)
3478 struct i40iw_device
*iwdev
;
3479 struct i40iw_ib_device
*iwibdev
;
3481 iwdev
= to_iwdev(iwqp
->ibqp
.device
);
3483 i40iw_pr_err("iwdev == NULL\n");
3487 iwibdev
= iwdev
->iwibdev
;
3489 if (iwqp
->active_conn
) {
3490 /* indicate this connection is NOT active */
3491 iwqp
->active_conn
= 0;
3493 /* Need to free the Last Streaming Mode Message */
3494 if (iwqp
->ietf_mem
.va
) {
3496 iwibdev
->ibdev
.ops
.dereg_mr(iwqp
->lsmm_mr
,
3498 i40iw_free_dma_mem(iwdev
->sc_dev
.hw
, &iwqp
->ietf_mem
);
3502 /* close the CM node down if it is still active */
3503 if (iwqp
->cm_node
) {
3504 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_CM
, "%s Call close API\n", __func__
);
3505 i40iw_cm_close(iwqp
->cm_node
);
3510 * i40iw_cm_disconn_true - called by worker thread to disconnect qp
3511 * @iwqp: associate qp for the connection
3513 static void i40iw_cm_disconn_true(struct i40iw_qp
*iwqp
)
3515 struct iw_cm_id
*cm_id
;
3516 struct i40iw_device
*iwdev
;
3517 struct i40iw_sc_qp
*qp
= &iwqp
->sc_qp
;
3519 u8 original_hw_tcp_state
;
3520 u8 original_ibqp_state
;
3521 int disconn_status
= 0;
3522 int issue_disconn
= 0;
3523 int issue_close
= 0;
3524 int issue_flush
= 0;
3525 struct ib_event ibevent
;
3526 unsigned long flags
;
3530 i40iw_pr_err("iwqp == NULL\n");
3534 spin_lock_irqsave(&iwqp
->lock
, flags
);
3535 cm_id
= iwqp
->cm_id
;
3536 /* make sure we havent already closed this connection */
3538 spin_unlock_irqrestore(&iwqp
->lock
, flags
);
3542 iwdev
= to_iwdev(iwqp
->ibqp
.device
);
3544 original_hw_tcp_state
= iwqp
->hw_tcp_state
;
3545 original_ibqp_state
= iwqp
->ibqp_state
;
3546 last_ae
= iwqp
->last_aeq
;
3548 if (qp
->term_flags
) {
3552 /*When term timer expires after cm_timer, don't want
3553 *terminate-handler to issue cm_disconn which can re-free
3554 *a QP even after its refcnt=0.
3556 i40iw_terminate_del_timer(qp
);
3557 if (!iwqp
->flush_issued
) {
3558 iwqp
->flush_issued
= 1;
3561 } else if ((original_hw_tcp_state
== I40IW_TCP_STATE_CLOSE_WAIT
) ||
3562 ((original_ibqp_state
== IB_QPS_RTS
) &&
3563 (last_ae
== I40IW_AE_LLP_CONNECTION_RESET
))) {
3565 if (last_ae
== I40IW_AE_LLP_CONNECTION_RESET
)
3566 disconn_status
= -ECONNRESET
;
3569 if (((original_hw_tcp_state
== I40IW_TCP_STATE_CLOSED
) ||
3570 (original_hw_tcp_state
== I40IW_TCP_STATE_TIME_WAIT
) ||
3571 (last_ae
== I40IW_AE_RDMAP_ROE_BAD_LLP_CLOSE
) ||
3572 (last_ae
== I40IW_AE_LLP_CONNECTION_RESET
) ||
3576 if (!iwqp
->flush_issued
) {
3577 iwqp
->flush_issued
= 1;
3582 spin_unlock_irqrestore(&iwqp
->lock
, flags
);
3583 if (issue_flush
&& !iwqp
->destroyed
) {
3584 /* Flush the queues */
3585 i40iw_flush_wqes(iwdev
, iwqp
);
3587 if (qp
->term_flags
&& iwqp
->ibqp
.event_handler
) {
3588 ibevent
.device
= iwqp
->ibqp
.device
;
3589 ibevent
.event
= (qp
->eventtype
== TERM_EVENT_QP_FATAL
) ?
3590 IB_EVENT_QP_FATAL
: IB_EVENT_QP_ACCESS_ERR
;
3591 ibevent
.element
.qp
= &iwqp
->ibqp
;
3592 iwqp
->ibqp
.event_handler(&ibevent
, iwqp
->ibqp
.qp_context
);
3596 if (cm_id
&& cm_id
->event_handler
) {
3597 if (issue_disconn
) {
3598 ret
= i40iw_send_cm_event(NULL
,
3600 IW_CM_EVENT_DISCONNECT
,
3604 i40iw_debug(&iwdev
->sc_dev
,
3606 "disconnect event failed %s: - cm_id = %p\n",
3610 i40iw_qp_disconnect(iwqp
);
3611 cm_id
->provider_data
= iwqp
;
3612 ret
= i40iw_send_cm_event(NULL
, cm_id
, IW_CM_EVENT_CLOSE
, 0);
3614 i40iw_debug(&iwdev
->sc_dev
,
3616 "close event failed %s: - cm_id = %p\n",
3618 cm_id
->rem_ref(cm_id
);
3624 * i40iw_disconnect_worker - worker for connection close
3625 * @work: points or disconn structure
3627 static void i40iw_disconnect_worker(struct work_struct
*work
)
3629 struct disconn_work
*dwork
= container_of(work
, struct disconn_work
, work
);
3630 struct i40iw_qp
*iwqp
= dwork
->iwqp
;
3633 i40iw_cm_disconn_true(iwqp
);
3634 i40iw_rem_ref(&iwqp
->ibqp
);
3638 * i40iw_accept - registered call for connection to be accepted
3639 * @cm_id: cm information for passive connection
3640 * @conn_param: accept parameters
3642 int i40iw_accept(struct iw_cm_id
*cm_id
, struct iw_cm_conn_param
*conn_param
)
3645 struct i40iw_qp
*iwqp
;
3646 struct i40iw_device
*iwdev
;
3647 struct i40iw_sc_dev
*dev
;
3648 struct i40iw_cm_core
*cm_core
;
3649 struct i40iw_cm_node
*cm_node
;
3650 struct ib_qp_attr attr
;
3653 struct i40iw_pd
*iwpd
;
3655 struct i40iw_kmem_info accept
;
3656 enum i40iw_status_code status
;
3658 unsigned long flags
;
3660 memset(&attr
, 0, sizeof(attr
));
3661 ibqp
= i40iw_get_qp(cm_id
->device
, conn_param
->qpn
);
3665 iwqp
= to_iwqp(ibqp
);
3666 iwdev
= iwqp
->iwdev
;
3667 dev
= &iwdev
->sc_dev
;
3668 cm_core
= &iwdev
->cm_core
;
3669 cm_node
= (struct i40iw_cm_node
*)cm_id
->provider_data
;
3671 if (((struct sockaddr_in
*)&cm_id
->local_addr
)->sin_family
== AF_INET
) {
3672 cm_node
->ipv4
= true;
3673 cm_node
->vlan_id
= i40iw_get_vlan_ipv4(cm_node
->loc_addr
);
3675 cm_node
->ipv4
= false;
3676 i40iw_netdev_vlan_ipv6(cm_node
->loc_addr
, &cm_node
->vlan_id
);
3678 i40iw_debug(cm_node
->dev
,
3680 "Accept vlan_id=%d\n",
3682 if (cm_node
->state
== I40IW_CM_STATE_LISTENER_DESTROYED
) {
3683 if (cm_node
->loopbackpartner
)
3684 i40iw_rem_ref_cm_node(cm_node
->loopbackpartner
);
3685 i40iw_rem_ref_cm_node(cm_node
);
3689 passive_state
= atomic_add_return(1, &cm_node
->passive_state
);
3690 if (passive_state
== I40IW_SEND_RESET_EVENT
) {
3691 i40iw_rem_ref_cm_node(cm_node
);
3695 cm_node
->cm_core
->stats_accepts
++;
3696 iwqp
->cm_node
= (void *)cm_node
;
3697 cm_node
->iwqp
= iwqp
;
3699 buf_len
= conn_param
->private_data_len
+ I40IW_MAX_IETF_SIZE
;
3701 status
= i40iw_allocate_dma_mem(dev
->hw
, &iwqp
->ietf_mem
, buf_len
, 1);
3705 cm_node
->pdata
.size
= conn_param
->private_data_len
;
3706 accept
.addr
= iwqp
->ietf_mem
.va
;
3707 accept
.size
= i40iw_cm_build_mpa_frame(cm_node
, &accept
, MPA_KEY_REPLY
);
3708 memcpy(accept
.addr
+ accept
.size
, conn_param
->private_data
,
3709 conn_param
->private_data_len
);
3711 /* setup our first outgoing iWarp send WQE (the IETF frame response) */
3712 if ((cm_node
->ipv4
&&
3713 !i40iw_ipv4_is_loopback(cm_node
->loc_addr
[0], cm_node
->rem_addr
[0])) ||
3715 !i40iw_ipv6_is_loopback(cm_node
->loc_addr
, cm_node
->rem_addr
))) {
3717 tagged_offset
= (uintptr_t)iwqp
->ietf_mem
.va
;
3718 ibmr
= i40iw_reg_phys_mr(&iwpd
->ibpd
,
3721 IB_ACCESS_LOCAL_WRITE
,
3724 i40iw_free_dma_mem(dev
->hw
, &iwqp
->ietf_mem
);
3728 ibmr
->pd
= &iwpd
->ibpd
;
3729 ibmr
->device
= iwpd
->ibpd
.device
;
3730 iwqp
->lsmm_mr
= ibmr
;
3732 iwqp
->sc_qp
.qp_uk
.sq_base
= kmap(iwqp
->page
);
3733 dev
->iw_priv_qp_ops
->qp_send_lsmm(&iwqp
->sc_qp
,
3735 (accept
.size
+ conn_param
->private_data_len
),
3740 iwqp
->sc_qp
.qp_uk
.sq_base
= kmap(iwqp
->page
);
3741 dev
->iw_priv_qp_ops
->qp_send_lsmm(&iwqp
->sc_qp
, NULL
, 0, 0);
3747 iwqp
->cm_id
= cm_id
;
3748 cm_node
->cm_id
= cm_id
;
3750 cm_id
->provider_data
= (void *)iwqp
;
3751 iwqp
->active_conn
= 0;
3753 cm_node
->lsmm_size
= accept
.size
+ conn_param
->private_data_len
;
3754 i40iw_cm_init_tsa_conn(iwqp
, cm_node
);
3755 cm_id
->add_ref(cm_id
);
3756 i40iw_add_ref(&iwqp
->ibqp
);
3758 attr
.qp_state
= IB_QPS_RTS
;
3759 cm_node
->qhash_set
= false;
3760 i40iw_modify_qp(&iwqp
->ibqp
, &attr
, IB_QP_STATE
, NULL
);
3762 cm_node
->accelerated
= true;
3763 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
3764 list_move_tail(&cm_node
->list
, &cm_core
->accelerated_list
);
3765 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
3768 i40iw_send_cm_event(cm_node
, cm_id
, IW_CM_EVENT_ESTABLISHED
, 0);
3770 i40iw_debug(dev
, I40IW_DEBUG_CM
, "error sending cm event - ESTABLISHED\n");
3772 if (cm_node
->loopbackpartner
) {
3773 cm_node
->loopbackpartner
->pdata
.size
= conn_param
->private_data_len
;
3775 /* copy the private data into the loopback partner's pdata buffer */
3776 memcpy(cm_node
->loopbackpartner
->pdata_buf
,
3777 conn_param
->private_data
,
3778 conn_param
->private_data_len
);
3779 i40iw_create_event(cm_node
->loopbackpartner
, I40IW_CM_EVENT_CONNECTED
);
3782 if (cm_node
->accept_pend
) {
3783 atomic_dec(&cm_node
->listener
->pend_accepts_cnt
);
3784 cm_node
->accept_pend
= 0;
3790 * i40iw_reject - registered call for connection to be rejected
3791 * @cm_id: cm information for passive connection
3792 * @pdata: private data to be sent
3793 * @pdata_len: private data length
3795 int i40iw_reject(struct iw_cm_id
*cm_id
, const void *pdata
, u8 pdata_len
)
3797 struct i40iw_device
*iwdev
;
3798 struct i40iw_cm_node
*cm_node
;
3799 struct i40iw_cm_node
*loopback
;
3801 cm_node
= (struct i40iw_cm_node
*)cm_id
->provider_data
;
3802 loopback
= cm_node
->loopbackpartner
;
3803 cm_node
->cm_id
= cm_id
;
3804 cm_node
->pdata
.size
= pdata_len
;
3806 iwdev
= to_iwdev(cm_id
->device
);
3809 cm_node
->cm_core
->stats_rejects
++;
3811 if (pdata_len
+ sizeof(struct ietf_mpa_v2
) > MAX_CM_BUFFER
)
3815 memcpy(&loopback
->pdata_buf
, pdata
, pdata_len
);
3816 loopback
->pdata
.size
= pdata_len
;
3819 return i40iw_cm_reject(cm_node
, pdata
, pdata_len
);
3823 * i40iw_connect - registered call for connection to be established
3824 * @cm_id: cm information for active connection
3825 * @conn_param: Information about the connection
3827 int i40iw_connect(struct iw_cm_id
*cm_id
, struct iw_cm_conn_param
*conn_param
)
3830 struct i40iw_qp
*iwqp
;
3831 struct i40iw_device
*iwdev
;
3832 struct i40iw_cm_node
*cm_node
;
3833 struct i40iw_cm_info cm_info
;
3834 struct sockaddr_in
*laddr
;
3835 struct sockaddr_in
*raddr
;
3836 struct sockaddr_in6
*laddr6
;
3837 struct sockaddr_in6
*raddr6
;
3840 ibqp
= i40iw_get_qp(cm_id
->device
, conn_param
->qpn
);
3843 iwqp
= to_iwqp(ibqp
);
3846 iwdev
= to_iwdev(iwqp
->ibqp
.device
);
3850 laddr
= (struct sockaddr_in
*)&cm_id
->m_local_addr
;
3851 raddr
= (struct sockaddr_in
*)&cm_id
->m_remote_addr
;
3852 laddr6
= (struct sockaddr_in6
*)&cm_id
->m_local_addr
;
3853 raddr6
= (struct sockaddr_in6
*)&cm_id
->m_remote_addr
;
3855 if (!(laddr
->sin_port
) || !(raddr
->sin_port
))
3858 iwqp
->active_conn
= 1;
3860 cm_id
->provider_data
= iwqp
;
3862 /* set up the connection params for the node */
3863 if (cm_id
->remote_addr
.ss_family
== AF_INET
) {
3864 cm_info
.ipv4
= true;
3865 memset(cm_info
.loc_addr
, 0, sizeof(cm_info
.loc_addr
));
3866 memset(cm_info
.rem_addr
, 0, sizeof(cm_info
.rem_addr
));
3867 cm_info
.loc_addr
[0] = ntohl(laddr
->sin_addr
.s_addr
);
3868 cm_info
.rem_addr
[0] = ntohl(raddr
->sin_addr
.s_addr
);
3869 cm_info
.loc_port
= ntohs(laddr
->sin_port
);
3870 cm_info
.rem_port
= ntohs(raddr
->sin_port
);
3871 cm_info
.vlan_id
= i40iw_get_vlan_ipv4(cm_info
.loc_addr
);
3873 cm_info
.ipv4
= false;
3874 i40iw_copy_ip_ntohl(cm_info
.loc_addr
,
3875 laddr6
->sin6_addr
.in6_u
.u6_addr32
);
3876 i40iw_copy_ip_ntohl(cm_info
.rem_addr
,
3877 raddr6
->sin6_addr
.in6_u
.u6_addr32
);
3878 cm_info
.loc_port
= ntohs(laddr6
->sin6_port
);
3879 cm_info
.rem_port
= ntohs(raddr6
->sin6_port
);
3880 i40iw_netdev_vlan_ipv6(cm_info
.loc_addr
, &cm_info
.vlan_id
);
3882 cm_info
.cm_id
= cm_id
;
3883 cm_info
.tos
= cm_id
->tos
;
3884 cm_info
.user_pri
= rt_tos2priority(cm_id
->tos
);
3885 i40iw_debug(&iwdev
->sc_dev
, I40IW_DEBUG_DCB
, "%s TOS:[%d] UP:[%d]\n",
3886 __func__
, cm_id
->tos
, cm_info
.user_pri
);
3887 cm_id
->add_ref(cm_id
);
3888 cm_node
= i40iw_create_cm_node(&iwdev
->cm_core
, iwdev
,
3889 conn_param
, &cm_info
);
3891 if (IS_ERR(cm_node
)) {
3892 ret
= PTR_ERR(cm_node
);
3893 cm_id
->rem_ref(cm_id
);
3897 if ((cm_info
.ipv4
&& (laddr
->sin_addr
.s_addr
!= raddr
->sin_addr
.s_addr
)) ||
3898 (!cm_info
.ipv4
&& memcmp(laddr6
->sin6_addr
.in6_u
.u6_addr32
,
3899 raddr6
->sin6_addr
.in6_u
.u6_addr32
,
3900 sizeof(laddr6
->sin6_addr
.in6_u
.u6_addr32
)))) {
3901 if (i40iw_manage_qhash(iwdev
, &cm_info
, I40IW_QHASH_TYPE_TCP_ESTABLISHED
,
3902 I40IW_QHASH_MANAGE_TYPE_ADD
, NULL
, true)) {
3906 cm_node
->qhash_set
= true;
3909 if (i40iw_manage_apbvt(iwdev
, cm_info
.loc_port
,
3910 I40IW_MANAGE_APBVT_ADD
)) {
3915 cm_node
->apbvt_set
= true;
3916 iwqp
->cm_node
= cm_node
;
3917 cm_node
->iwqp
= iwqp
;
3918 iwqp
->cm_id
= cm_id
;
3919 i40iw_add_ref(&iwqp
->ibqp
);
3921 if (cm_node
->state
!= I40IW_CM_STATE_OFFLOADED
) {
3922 cm_node
->state
= I40IW_CM_STATE_SYN_SENT
;
3923 ret
= i40iw_send_syn(cm_node
, 0);
3928 if (cm_node
->loopbackpartner
) {
3929 cm_node
->loopbackpartner
->state
= I40IW_CM_STATE_MPAREQ_RCVD
;
3930 i40iw_create_event(cm_node
->loopbackpartner
,
3931 I40IW_CM_EVENT_MPA_REQ
);
3934 i40iw_debug(cm_node
->dev
,
3936 "Api - connect(): port=0x%04x, cm_node=%p, cm_id = %p.\n",
3945 i40iw_debug(&iwdev
->sc_dev
,
3947 "Api - connect() FAILED: dest addr=%pI4",
3950 i40iw_debug(&iwdev
->sc_dev
,
3952 "Api - connect() FAILED: dest addr=%pI6",
3955 i40iw_rem_ref_cm_node(cm_node
);
3956 cm_id
->rem_ref(cm_id
);
3957 iwdev
->cm_core
.stats_connect_errs
++;
3962 * i40iw_create_listen - registered call creating listener
3963 * @cm_id: cm information for passive connection
3964 * @backlog: max accept pending count
3966 int i40iw_create_listen(struct iw_cm_id
*cm_id
, int backlog
)
3968 struct i40iw_device
*iwdev
;
3969 struct i40iw_cm_listener
*cm_listen_node
;
3970 struct i40iw_cm_info cm_info
;
3971 enum i40iw_status_code ret
;
3972 struct sockaddr_in
*laddr
;
3973 struct sockaddr_in6
*laddr6
;
3974 bool wildcard
= false;
3976 iwdev
= to_iwdev(cm_id
->device
);
3980 laddr
= (struct sockaddr_in
*)&cm_id
->m_local_addr
;
3981 laddr6
= (struct sockaddr_in6
*)&cm_id
->m_local_addr
;
3982 memset(&cm_info
, 0, sizeof(cm_info
));
3983 if (laddr
->sin_family
== AF_INET
) {
3984 cm_info
.ipv4
= true;
3985 cm_info
.loc_addr
[0] = ntohl(laddr
->sin_addr
.s_addr
);
3986 cm_info
.loc_port
= ntohs(laddr
->sin_port
);
3988 if (laddr
->sin_addr
.s_addr
!= INADDR_ANY
)
3989 cm_info
.vlan_id
= i40iw_get_vlan_ipv4(cm_info
.loc_addr
);
3994 cm_info
.ipv4
= false;
3995 i40iw_copy_ip_ntohl(cm_info
.loc_addr
,
3996 laddr6
->sin6_addr
.in6_u
.u6_addr32
);
3997 cm_info
.loc_port
= ntohs(laddr6
->sin6_port
);
3998 if (ipv6_addr_type(&laddr6
->sin6_addr
) != IPV6_ADDR_ANY
)
3999 i40iw_netdev_vlan_ipv6(cm_info
.loc_addr
,
4004 cm_info
.backlog
= backlog
;
4005 cm_info
.cm_id
= cm_id
;
4007 cm_listen_node
= i40iw_make_listen_node(&iwdev
->cm_core
, iwdev
, &cm_info
);
4008 if (!cm_listen_node
) {
4009 i40iw_pr_err("cm_listen_node == NULL\n");
4013 cm_id
->provider_data
= cm_listen_node
;
4015 cm_listen_node
->tos
= cm_id
->tos
;
4016 cm_listen_node
->user_pri
= rt_tos2priority(cm_id
->tos
);
4017 cm_info
.user_pri
= cm_listen_node
->user_pri
;
4019 if (!cm_listen_node
->reused_node
) {
4022 ret
= i40iw_add_mqh_4(iwdev
,
4026 ret
= i40iw_add_mqh_6(iwdev
,
4032 ret
= i40iw_manage_apbvt(iwdev
,
4034 I40IW_MANAGE_APBVT_ADD
);
4039 ret
= i40iw_manage_qhash(iwdev
,
4041 I40IW_QHASH_TYPE_TCP_SYN
,
4042 I40IW_QHASH_MANAGE_TYPE_ADD
,
4047 cm_listen_node
->qhash_set
= true;
4048 ret
= i40iw_manage_apbvt(iwdev
,
4050 I40IW_MANAGE_APBVT_ADD
);
4055 cm_id
->add_ref(cm_id
);
4056 cm_listen_node
->cm_core
->stats_listen_created
++;
4059 i40iw_cm_del_listen(&iwdev
->cm_core
, (void *)cm_listen_node
, false);
4064 * i40iw_destroy_listen - registered call to destroy listener
4065 * @cm_id: cm information for passive connection
4067 int i40iw_destroy_listen(struct iw_cm_id
*cm_id
)
4069 struct i40iw_device
*iwdev
;
4071 iwdev
= to_iwdev(cm_id
->device
);
4072 if (cm_id
->provider_data
)
4073 i40iw_cm_del_listen(&iwdev
->cm_core
, cm_id
->provider_data
, true);
4075 i40iw_pr_err("cm_id->provider_data was NULL\n");
4077 cm_id
->rem_ref(cm_id
);
4083 * i40iw_cm_event_connected - handle connected active node
4084 * @event: the info for cm_node of connection
4086 static void i40iw_cm_event_connected(struct i40iw_cm_event
*event
)
4088 struct i40iw_qp
*iwqp
;
4089 struct i40iw_device
*iwdev
;
4090 struct i40iw_cm_core
*cm_core
;
4091 struct i40iw_cm_node
*cm_node
;
4092 struct i40iw_sc_dev
*dev
;
4093 struct ib_qp_attr attr
;
4094 struct iw_cm_id
*cm_id
;
4095 unsigned long flags
;
4099 cm_node
= event
->cm_node
;
4100 cm_id
= cm_node
->cm_id
;
4101 iwqp
= (struct i40iw_qp
*)cm_id
->provider_data
;
4102 iwdev
= to_iwdev(iwqp
->ibqp
.device
);
4103 dev
= &iwdev
->sc_dev
;
4104 cm_core
= &iwdev
->cm_core
;
4106 if (iwqp
->destroyed
) {
4107 status
= -ETIMEDOUT
;
4110 i40iw_cm_init_tsa_conn(iwqp
, cm_node
);
4111 read0
= (cm_node
->send_rdma0_op
== SEND_RDMA_READ_ZERO
);
4113 iwqp
->sc_qp
.qp_uk
.sq_base
= kmap(iwqp
->page
);
4114 dev
->iw_priv_qp_ops
->qp_send_rtt(&iwqp
->sc_qp
, read0
);
4118 memset(&attr
, 0, sizeof(attr
));
4119 attr
.qp_state
= IB_QPS_RTS
;
4120 cm_node
->qhash_set
= false;
4121 i40iw_modify_qp(&iwqp
->ibqp
, &attr
, IB_QP_STATE
, NULL
);
4123 cm_node
->accelerated
= true;
4124 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
4125 list_move_tail(&cm_node
->list
, &cm_core
->accelerated_list
);
4126 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
4127 status
= i40iw_send_cm_event(cm_node
, cm_id
, IW_CM_EVENT_CONNECT_REPLY
,
4130 i40iw_debug(dev
, I40IW_DEBUG_CM
, "error sending cm event - CONNECT_REPLY\n");
4136 cm_id
->provider_data
= NULL
;
4137 i40iw_send_cm_event(event
->cm_node
,
4139 IW_CM_EVENT_CONNECT_REPLY
,
4141 cm_id
->rem_ref(cm_id
);
4142 i40iw_rem_ref_cm_node(event
->cm_node
);
4146 * i40iw_cm_event_reset - handle reset
4147 * @event: the info for cm_node of connection
4149 static void i40iw_cm_event_reset(struct i40iw_cm_event
*event
)
4151 struct i40iw_cm_node
*cm_node
= event
->cm_node
;
4152 struct iw_cm_id
*cm_id
= cm_node
->cm_id
;
4153 struct i40iw_qp
*iwqp
;
4158 iwqp
= cm_id
->provider_data
;
4162 i40iw_debug(cm_node
->dev
,
4164 "reset event %p - cm_id = %p\n",
4165 event
->cm_node
, cm_id
);
4168 i40iw_send_cm_event(cm_node
, cm_node
->cm_id
, IW_CM_EVENT_DISCONNECT
, -ECONNRESET
);
4169 i40iw_send_cm_event(cm_node
, cm_node
->cm_id
, IW_CM_EVENT_CLOSE
, 0);
4173 * i40iw_cm_event_handler - worker thread callback to send event to cm upper layer
4174 * @work: pointer of cm event info.
4176 static void i40iw_cm_event_handler(struct work_struct
*work
)
4178 struct i40iw_cm_event
*event
= container_of(work
,
4179 struct i40iw_cm_event
,
4181 struct i40iw_cm_node
*cm_node
;
4183 if (!event
|| !event
->cm_node
|| !event
->cm_node
->cm_core
)
4186 cm_node
= event
->cm_node
;
4188 switch (event
->type
) {
4189 case I40IW_CM_EVENT_MPA_REQ
:
4190 i40iw_send_cm_event(cm_node
,
4192 IW_CM_EVENT_CONNECT_REQUEST
,
4195 case I40IW_CM_EVENT_RESET
:
4196 i40iw_cm_event_reset(event
);
4198 case I40IW_CM_EVENT_CONNECTED
:
4199 if (!event
->cm_node
->cm_id
||
4200 (event
->cm_node
->state
!= I40IW_CM_STATE_OFFLOADED
))
4202 i40iw_cm_event_connected(event
);
4204 case I40IW_CM_EVENT_MPA_REJECT
:
4205 if (!event
->cm_node
->cm_id
||
4206 (cm_node
->state
== I40IW_CM_STATE_OFFLOADED
))
4208 i40iw_send_cm_event(cm_node
,
4210 IW_CM_EVENT_CONNECT_REPLY
,
4213 case I40IW_CM_EVENT_ABORTED
:
4214 if (!event
->cm_node
->cm_id
||
4215 (event
->cm_node
->state
== I40IW_CM_STATE_OFFLOADED
))
4217 i40iw_event_connect_error(event
);
4220 i40iw_pr_err("event type = %d\n", event
->type
);
4224 event
->cm_info
.cm_id
->rem_ref(event
->cm_info
.cm_id
);
4225 i40iw_rem_ref_cm_node(event
->cm_node
);
4230 * i40iw_cm_post_event - queue event request for worker thread
4231 * @event: cm node's info for up event call
4233 static void i40iw_cm_post_event(struct i40iw_cm_event
*event
)
4235 atomic_inc(&event
->cm_node
->ref_count
);
4236 event
->cm_info
.cm_id
->add_ref(event
->cm_info
.cm_id
);
4237 INIT_WORK(&event
->event_work
, i40iw_cm_event_handler
);
4239 queue_work(event
->cm_node
->cm_core
->event_wq
, &event
->event_work
);
4243 * i40iw_qhash_ctrl - enable/disable qhash for list
4244 * @iwdev: device pointer
4245 * @parent_listen_node: parent listen node
4246 * @nfo: cm info node
4247 * @ipaddr: Pointer to IPv4 or IPv6 address
4248 * @ipv4: flag indicating IPv4 when true
4249 * @ifup: flag indicating interface up when true
4251 * Enables or disables the qhash for the node in the child
4252 * listen list that matches ipaddr. If no matching IP was found
4253 * it will allocate and add a new child listen node to the
4254 * parent listen node. The listen_list_lock is assumed to be
4257 static void i40iw_qhash_ctrl(struct i40iw_device
*iwdev
,
4258 struct i40iw_cm_listener
*parent_listen_node
,
4259 struct i40iw_cm_info
*nfo
,
4260 u32
*ipaddr
, bool ipv4
, bool ifup
)
4262 struct list_head
*child_listen_list
= &parent_listen_node
->child_listen_list
;
4263 struct i40iw_cm_listener
*child_listen_node
;
4264 struct list_head
*pos
, *tpos
;
4265 enum i40iw_status_code ret
;
4266 bool node_allocated
= false;
4267 enum i40iw_quad_hash_manage_type op
=
4268 ifup
? I40IW_QHASH_MANAGE_TYPE_ADD
: I40IW_QHASH_MANAGE_TYPE_DELETE
;
4270 list_for_each_safe(pos
, tpos
, child_listen_list
) {
4273 struct i40iw_cm_listener
,
4275 if (!memcmp(child_listen_node
->loc_addr
, ipaddr
, ipv4
? 4 : 16))
4279 /* if not found then add a child listener if interface is going up */
4282 child_listen_node
= kmemdup(parent_listen_node
,
4283 sizeof(*child_listen_node
), GFP_ATOMIC
);
4284 if (!child_listen_node
)
4286 node_allocated
= true;
4288 memcpy(child_listen_node
->loc_addr
, ipaddr
, ipv4
? 4 : 16);
4291 memcpy(nfo
->loc_addr
,
4292 child_listen_node
->loc_addr
,
4293 sizeof(nfo
->loc_addr
));
4294 nfo
->vlan_id
= child_listen_node
->vlan_id
;
4295 ret
= i40iw_manage_qhash(iwdev
, nfo
,
4296 I40IW_QHASH_TYPE_TCP_SYN
,
4300 child_listen_node
->qhash_set
= ifup
;
4302 list_add(&child_listen_node
->child_listen_list
,
4303 &parent_listen_node
->child_listen_list
);
4304 } else if (node_allocated
) {
4305 kfree(child_listen_node
);
4310 * i40iw_cm_teardown_connections - teardown QPs
4311 * @iwdev: device pointer
4312 * @ipaddr: Pointer to IPv4 or IPv6 address
4313 * @nfo: cm info node; supplies the vlan_id and ipv4 flag used for matching
4314 * @disconnect_all: flag indicating disconnect all QPs
4315 * teardown QPs where source or destination addr matches ip addr
4317 void i40iw_cm_teardown_connections(struct i40iw_device
*iwdev
, u32
*ipaddr
,
4318 struct i40iw_cm_info
*nfo
,
4319 bool disconnect_all
)
4321 struct i40iw_cm_core
*cm_core
= &iwdev
->cm_core
;
4322 struct list_head
*list_core_temp
;
4323 struct list_head
*list_node
;
4324 struct i40iw_cm_node
*cm_node
;
4325 unsigned long flags
;
4326 struct list_head teardown_list
;
4327 struct ib_qp_attr attr
;
4329 INIT_LIST_HEAD(&teardown_list
);
4330 spin_lock_irqsave(&cm_core
->ht_lock
, flags
);
4331 list_for_each_safe(list_node
, list_core_temp
,
4332 &cm_core
->accelerated_list
) {
4333 cm_node
= container_of(list_node
, struct i40iw_cm_node
, list
);
4334 if (disconnect_all
||
4335 (nfo
->vlan_id
== cm_node
->vlan_id
&&
4336 (!memcmp(cm_node
->loc_addr
, ipaddr
, nfo
->ipv4
? 4 : 16) ||
4337 !memcmp(cm_node
->rem_addr
, ipaddr
, nfo
->ipv4
? 4 : 16)))) {
4338 atomic_inc(&cm_node
->ref_count
);
4339 list_add(&cm_node
->teardown_entry
, &teardown_list
);
4342 list_for_each_safe(list_node
, list_core_temp
,
4343 &cm_core
->non_accelerated_list
) {
4344 cm_node
= container_of(list_node
, struct i40iw_cm_node
, list
);
4345 if (disconnect_all
||
4346 (nfo
->vlan_id
== cm_node
->vlan_id
&&
4347 (!memcmp(cm_node
->loc_addr
, ipaddr
, nfo
->ipv4
? 4 : 16) ||
4348 !memcmp(cm_node
->rem_addr
, ipaddr
, nfo
->ipv4
? 4 : 16)))) {
4349 atomic_inc(&cm_node
->ref_count
);
4350 list_add(&cm_node
->teardown_entry
, &teardown_list
);
4353 spin_unlock_irqrestore(&cm_core
->ht_lock
, flags
);
4355 list_for_each_safe(list_node
, list_core_temp
, &teardown_list
) {
4356 cm_node
= container_of(list_node
, struct i40iw_cm_node
,
4358 attr
.qp_state
= IB_QPS_ERR
;
4359 i40iw_modify_qp(&cm_node
->iwqp
->ibqp
, &attr
, IB_QP_STATE
, NULL
);
4361 i40iw_cm_disconn(cm_node
->iwqp
);
4362 i40iw_rem_ref_cm_node(cm_node
);
4367 * i40iw_if_notify - process an ifup or ifdown on an interface
4368 * @iwdev: device pointer
4369 * @ipaddr: Pointer to IPv4 or IPv6 address
4370 * @ipv4: flag indicating IPv4 when true
4371 * @ifup: flag indicating interface up when true
4373 void i40iw_if_notify(struct i40iw_device
*iwdev
, struct net_device
*netdev
,
4374 u32
*ipaddr
, bool ipv4
, bool ifup
)
4376 struct i40iw_cm_core
*cm_core
= &iwdev
->cm_core
;
4377 unsigned long flags
;
4378 struct i40iw_cm_listener
*listen_node
;
4379 static const u32 ip_zero
[4] = { 0, 0, 0, 0 };
4380 struct i40iw_cm_info nfo
;
4381 u16 vlan_id
= rdma_vlan_dev_vlan_id(netdev
);
4382 enum i40iw_status_code ret
;
4383 enum i40iw_quad_hash_manage_type op
=
4384 ifup
? I40IW_QHASH_MANAGE_TYPE_ADD
: I40IW_QHASH_MANAGE_TYPE_DELETE
;
4386 nfo
.vlan_id
= vlan_id
;
4389 /* Disable or enable qhash for listeners */
4390 spin_lock_irqsave(&cm_core
->listen_list_lock
, flags
);
4391 list_for_each_entry(listen_node
, &cm_core
->listen_nodes
, list
) {
4392 if (vlan_id
== listen_node
->vlan_id
&&
4393 (!memcmp(listen_node
->loc_addr
, ipaddr
, ipv4
? 4 : 16) ||
4394 !memcmp(listen_node
->loc_addr
, ip_zero
, ipv4
? 4 : 16))) {
4395 memcpy(nfo
.loc_addr
, listen_node
->loc_addr
,
4396 sizeof(nfo
.loc_addr
));
4397 nfo
.loc_port
= listen_node
->loc_port
;
4398 nfo
.user_pri
= listen_node
->user_pri
;
4399 if (!list_empty(&listen_node
->child_listen_list
)) {
4400 i40iw_qhash_ctrl(iwdev
,
4403 ipaddr
, ipv4
, ifup
);
4404 } else if (memcmp(listen_node
->loc_addr
, ip_zero
,
4406 ret
= i40iw_manage_qhash(iwdev
,
4408 I40IW_QHASH_TYPE_TCP_SYN
,
4413 listen_node
->qhash_set
= ifup
;
4417 spin_unlock_irqrestore(&cm_core
->listen_list_lock
, flags
);
4419 /* teardown connected qp's on ifdown */
4421 i40iw_cm_teardown_connections(iwdev
, ipaddr
, &nfo
, false);