Merge tag 'block-5.11-2021-01-10' of git://git.kernel.dk/linux-block
[linux/fpc-iii.git] / drivers / infiniband / hw / i40iw / i40iw_cm.c
blob9acc0ecc9a43e42154e81546ced7858b14d7bb0a
1 /*******************************************************************************
3 * Copyright (c) 2015-2016 Intel Corporation. All rights reserved.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenFabrics.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
33 *******************************************************************************/
35 #include <linux/atomic.h>
36 #include <linux/ip.h>
37 #include <linux/tcp.h>
38 #include <linux/init.h>
39 #include <linux/if_arp.h>
40 #include <linux/if_vlan.h>
41 #include <linux/notifier.h>
42 #include <linux/net.h>
43 #include <linux/types.h>
44 #include <linux/timer.h>
45 #include <linux/time.h>
46 #include <linux/delay.h>
47 #include <linux/etherdevice.h>
48 #include <linux/netdevice.h>
49 #include <linux/random.h>
50 #include <linux/list.h>
51 #include <linux/threads.h>
52 #include <linux/highmem.h>
53 #include <net/arp.h>
54 #include <net/ndisc.h>
55 #include <net/neighbour.h>
56 #include <net/route.h>
57 #include <net/addrconf.h>
58 #include <net/ip6_route.h>
59 #include <net/ip_fib.h>
60 #include <net/secure_seq.h>
61 #include <net/tcp.h>
62 #include <asm/checksum.h>
64 #include "i40iw.h"
66 static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *);
67 static void i40iw_cm_post_event(struct i40iw_cm_event *event);
68 static void i40iw_disconnect_worker(struct work_struct *work);
70 /**
71 * i40iw_free_sqbuf - put back puda buffer if refcount = 0
72 * @vsi: pointer to vsi structure
73 * @buf: puda buffer to free
75 void i40iw_free_sqbuf(struct i40iw_sc_vsi *vsi, void *bufp)
77 struct i40iw_puda_buf *buf = (struct i40iw_puda_buf *)bufp;
78 struct i40iw_puda_rsrc *ilq = vsi->ilq;
80 if (!atomic_dec_return(&buf->refcount))
81 i40iw_puda_ret_bufpool(ilq, buf);
84 /**
85 * i40iw_derive_hw_ird_setting - Calculate IRD
87 * @cm_ird: IRD of connection's node
89 * The ird from the connection is rounded to a supported HW
90 * setting (2,8,32,64) and then encoded for ird_size field of
91 * qp_ctx
93 static u8 i40iw_derive_hw_ird_setting(u16 cm_ird)
95 u8 encoded_ird_size;
97 /* ird_size field is encoded in qp_ctx */
98 switch (cm_ird ? roundup_pow_of_two(cm_ird) : 0) {
99 case I40IW_HW_IRD_SETTING_64:
100 encoded_ird_size = 3;
101 break;
102 case I40IW_HW_IRD_SETTING_32:
103 case I40IW_HW_IRD_SETTING_16:
104 encoded_ird_size = 2;
105 break;
106 case I40IW_HW_IRD_SETTING_8:
107 case I40IW_HW_IRD_SETTING_4:
108 encoded_ird_size = 1;
109 break;
110 case I40IW_HW_IRD_SETTING_2:
111 default:
112 encoded_ird_size = 0;
113 break;
115 return encoded_ird_size;
119 * i40iw_record_ird_ord - Record IRD/ORD passed in
120 * @cm_node: connection's node
121 * @conn_ird: connection IRD
122 * @conn_ord: connection ORD
124 static void i40iw_record_ird_ord(struct i40iw_cm_node *cm_node, u32 conn_ird,
125 u32 conn_ord)
127 if (conn_ird > I40IW_MAX_IRD_SIZE)
128 conn_ird = I40IW_MAX_IRD_SIZE;
130 if (conn_ord > I40IW_MAX_ORD_SIZE)
131 conn_ord = I40IW_MAX_ORD_SIZE;
132 else if (!conn_ord && cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO)
133 conn_ord = 1;
135 cm_node->ird_size = conn_ird;
136 cm_node->ord_size = conn_ord;
140 * i40iw_copy_ip_ntohl - change network to host ip
141 * @dst: host ip
142 * @src: big endian
144 void i40iw_copy_ip_ntohl(u32 *dst, __be32 *src)
146 *dst++ = ntohl(*src++);
147 *dst++ = ntohl(*src++);
148 *dst++ = ntohl(*src++);
149 *dst = ntohl(*src);
153 * i40iw_copy_ip_htonl - change host addr to network ip
154 * @dst: host ip
155 * @src: little endian
157 static inline void i40iw_copy_ip_htonl(__be32 *dst, u32 *src)
159 *dst++ = htonl(*src++);
160 *dst++ = htonl(*src++);
161 *dst++ = htonl(*src++);
162 *dst = htonl(*src);
166 * i40iw_fill_sockaddr4 - get addr info for passive connection
167 * @cm_node: connection's node
168 * @event: upper layer's cm event
170 static inline void i40iw_fill_sockaddr4(struct i40iw_cm_node *cm_node,
171 struct iw_cm_event *event)
173 struct sockaddr_in *laddr = (struct sockaddr_in *)&event->local_addr;
174 struct sockaddr_in *raddr = (struct sockaddr_in *)&event->remote_addr;
176 laddr->sin_family = AF_INET;
177 raddr->sin_family = AF_INET;
179 laddr->sin_port = htons(cm_node->loc_port);
180 raddr->sin_port = htons(cm_node->rem_port);
182 laddr->sin_addr.s_addr = htonl(cm_node->loc_addr[0]);
183 raddr->sin_addr.s_addr = htonl(cm_node->rem_addr[0]);
187 * i40iw_fill_sockaddr6 - get ipv6 addr info for passive side
188 * @cm_node: connection's node
189 * @event: upper layer's cm event
191 static inline void i40iw_fill_sockaddr6(struct i40iw_cm_node *cm_node,
192 struct iw_cm_event *event)
194 struct sockaddr_in6 *laddr6 = (struct sockaddr_in6 *)&event->local_addr;
195 struct sockaddr_in6 *raddr6 = (struct sockaddr_in6 *)&event->remote_addr;
197 laddr6->sin6_family = AF_INET6;
198 raddr6->sin6_family = AF_INET6;
200 laddr6->sin6_port = htons(cm_node->loc_port);
201 raddr6->sin6_port = htons(cm_node->rem_port);
203 i40iw_copy_ip_htonl(laddr6->sin6_addr.in6_u.u6_addr32,
204 cm_node->loc_addr);
205 i40iw_copy_ip_htonl(raddr6->sin6_addr.in6_u.u6_addr32,
206 cm_node->rem_addr);
210 * i40iw_get_addr_info
211 * @cm_node: contains ip/tcp info
212 * @cm_info: to get a copy of the cm_node ip/tcp info
214 static void i40iw_get_addr_info(struct i40iw_cm_node *cm_node,
215 struct i40iw_cm_info *cm_info)
217 cm_info->ipv4 = cm_node->ipv4;
218 cm_info->vlan_id = cm_node->vlan_id;
219 memcpy(cm_info->loc_addr, cm_node->loc_addr, sizeof(cm_info->loc_addr));
220 memcpy(cm_info->rem_addr, cm_node->rem_addr, sizeof(cm_info->rem_addr));
221 cm_info->loc_port = cm_node->loc_port;
222 cm_info->rem_port = cm_node->rem_port;
223 cm_info->user_pri = cm_node->user_pri;
227 * i40iw_get_cmevent_info - for cm event upcall
228 * @cm_node: connection's node
229 * @cm_id: upper layers cm struct for the event
230 * @event: upper layer's cm event
232 static inline void i40iw_get_cmevent_info(struct i40iw_cm_node *cm_node,
233 struct iw_cm_id *cm_id,
234 struct iw_cm_event *event)
236 memcpy(&event->local_addr, &cm_id->m_local_addr,
237 sizeof(event->local_addr));
238 memcpy(&event->remote_addr, &cm_id->m_remote_addr,
239 sizeof(event->remote_addr));
240 if (cm_node) {
241 event->private_data = (void *)cm_node->pdata_buf;
242 event->private_data_len = (u8)cm_node->pdata.size;
243 event->ird = cm_node->ird_size;
244 event->ord = cm_node->ord_size;
249 * i40iw_send_cm_event - upcall cm's event handler
250 * @cm_node: connection's node
251 * @cm_id: upper layer's cm info struct
252 * @type: Event type to indicate
253 * @status: status for the event type
255 static int i40iw_send_cm_event(struct i40iw_cm_node *cm_node,
256 struct iw_cm_id *cm_id,
257 enum iw_cm_event_type type,
258 int status)
260 struct iw_cm_event event;
262 memset(&event, 0, sizeof(event));
263 event.event = type;
264 event.status = status;
265 switch (type) {
266 case IW_CM_EVENT_CONNECT_REQUEST:
267 if (cm_node->ipv4)
268 i40iw_fill_sockaddr4(cm_node, &event);
269 else
270 i40iw_fill_sockaddr6(cm_node, &event);
271 event.provider_data = (void *)cm_node;
272 event.private_data = (void *)cm_node->pdata_buf;
273 event.private_data_len = (u8)cm_node->pdata.size;
274 event.ird = cm_node->ird_size;
275 break;
276 case IW_CM_EVENT_CONNECT_REPLY:
277 i40iw_get_cmevent_info(cm_node, cm_id, &event);
278 break;
279 case IW_CM_EVENT_ESTABLISHED:
280 event.ird = cm_node->ird_size;
281 event.ord = cm_node->ord_size;
282 break;
283 case IW_CM_EVENT_DISCONNECT:
284 break;
285 case IW_CM_EVENT_CLOSE:
286 break;
287 default:
288 i40iw_pr_err("event type received type = %d\n", type);
289 return -1;
291 return cm_id->event_handler(cm_id, &event);
295 * i40iw_create_event - create cm event
296 * @cm_node: connection's node
297 * @type: Event type to generate
299 static struct i40iw_cm_event *i40iw_create_event(struct i40iw_cm_node *cm_node,
300 enum i40iw_cm_event_type type)
302 struct i40iw_cm_event *event;
304 if (!cm_node->cm_id)
305 return NULL;
307 event = kzalloc(sizeof(*event), GFP_ATOMIC);
309 if (!event)
310 return NULL;
312 event->type = type;
313 event->cm_node = cm_node;
314 memcpy(event->cm_info.rem_addr, cm_node->rem_addr, sizeof(event->cm_info.rem_addr));
315 memcpy(event->cm_info.loc_addr, cm_node->loc_addr, sizeof(event->cm_info.loc_addr));
316 event->cm_info.rem_port = cm_node->rem_port;
317 event->cm_info.loc_port = cm_node->loc_port;
318 event->cm_info.cm_id = cm_node->cm_id;
320 i40iw_debug(cm_node->dev,
321 I40IW_DEBUG_CM,
322 "node=%p event=%p type=%u dst=%pI4 src=%pI4\n",
323 cm_node,
324 event,
325 type,
326 event->cm_info.loc_addr,
327 event->cm_info.rem_addr);
329 i40iw_cm_post_event(event);
330 return event;
334 * i40iw_free_retrans_entry - free send entry
335 * @cm_node: connection's node
337 static void i40iw_free_retrans_entry(struct i40iw_cm_node *cm_node)
339 struct i40iw_device *iwdev = cm_node->iwdev;
340 struct i40iw_timer_entry *send_entry;
342 send_entry = cm_node->send_entry;
343 if (send_entry) {
344 cm_node->send_entry = NULL;
345 i40iw_free_sqbuf(&iwdev->vsi, (void *)send_entry->sqbuf);
346 kfree(send_entry);
347 atomic_dec(&cm_node->ref_count);
352 * i40iw_cleanup_retrans_entry - free send entry with lock
353 * @cm_node: connection's node
355 static void i40iw_cleanup_retrans_entry(struct i40iw_cm_node *cm_node)
357 unsigned long flags;
359 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
360 i40iw_free_retrans_entry(cm_node);
361 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
365 * i40iw_form_cm_frame - get a free packet and build frame
366 * @cm_node: connection's node ionfo to use in frame
367 * @options: pointer to options info
368 * @hdr: pointer mpa header
369 * @pdata: pointer to private data
370 * @flags: indicates FIN or ACK
372 static struct i40iw_puda_buf *i40iw_form_cm_frame(struct i40iw_cm_node *cm_node,
373 struct i40iw_kmem_info *options,
374 struct i40iw_kmem_info *hdr,
375 struct i40iw_kmem_info *pdata,
376 u8 flags)
378 struct i40iw_puda_buf *sqbuf;
379 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
380 u8 *buf;
382 struct tcphdr *tcph;
383 struct iphdr *iph;
384 struct ipv6hdr *ip6h;
385 struct ethhdr *ethh;
386 u16 packetsize;
387 u16 eth_hlen = ETH_HLEN;
388 u32 opts_len = 0;
389 u32 pd_len = 0;
390 u32 hdr_len = 0;
391 u16 vtag;
393 sqbuf = i40iw_puda_get_bufpool(vsi->ilq);
394 if (!sqbuf)
395 return NULL;
396 buf = sqbuf->mem.va;
398 if (options)
399 opts_len = (u32)options->size;
401 if (hdr)
402 hdr_len = hdr->size;
404 if (pdata)
405 pd_len = pdata->size;
407 if (cm_node->vlan_id <= VLAN_VID_MASK)
408 eth_hlen += 4;
410 if (cm_node->ipv4)
411 packetsize = sizeof(*iph) + sizeof(*tcph);
412 else
413 packetsize = sizeof(*ip6h) + sizeof(*tcph);
414 packetsize += opts_len + hdr_len + pd_len;
416 memset(buf, 0x00, eth_hlen + packetsize);
418 sqbuf->totallen = packetsize + eth_hlen;
419 sqbuf->maclen = eth_hlen;
420 sqbuf->tcphlen = sizeof(*tcph) + opts_len;
421 sqbuf->scratch = (void *)cm_node;
423 ethh = (struct ethhdr *)buf;
424 buf += eth_hlen;
426 if (cm_node->ipv4) {
427 sqbuf->ipv4 = true;
429 iph = (struct iphdr *)buf;
430 buf += sizeof(*iph);
431 tcph = (struct tcphdr *)buf;
432 buf += sizeof(*tcph);
434 ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
435 ether_addr_copy(ethh->h_source, cm_node->loc_mac);
436 if (cm_node->vlan_id <= VLAN_VID_MASK) {
437 ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
438 vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
439 ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
441 ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IP);
442 } else {
443 ethh->h_proto = htons(ETH_P_IP);
446 iph->version = IPVERSION;
447 iph->ihl = 5; /* 5 * 4Byte words, IP headr len */
448 iph->tos = cm_node->tos;
449 iph->tot_len = htons(packetsize);
450 iph->id = htons(++cm_node->tcp_cntxt.loc_id);
452 iph->frag_off = htons(0x4000);
453 iph->ttl = 0x40;
454 iph->protocol = IPPROTO_TCP;
455 iph->saddr = htonl(cm_node->loc_addr[0]);
456 iph->daddr = htonl(cm_node->rem_addr[0]);
457 } else {
458 sqbuf->ipv4 = false;
459 ip6h = (struct ipv6hdr *)buf;
460 buf += sizeof(*ip6h);
461 tcph = (struct tcphdr *)buf;
462 buf += sizeof(*tcph);
464 ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
465 ether_addr_copy(ethh->h_source, cm_node->loc_mac);
466 if (cm_node->vlan_id <= VLAN_VID_MASK) {
467 ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
468 vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
469 ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
470 ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IPV6);
471 } else {
472 ethh->h_proto = htons(ETH_P_IPV6);
474 ip6h->version = 6;
475 ip6h->priority = cm_node->tos >> 4;
476 ip6h->flow_lbl[0] = cm_node->tos << 4;
477 ip6h->flow_lbl[1] = 0;
478 ip6h->flow_lbl[2] = 0;
479 ip6h->payload_len = htons(packetsize - sizeof(*ip6h));
480 ip6h->nexthdr = 6;
481 ip6h->hop_limit = 128;
482 i40iw_copy_ip_htonl(ip6h->saddr.in6_u.u6_addr32,
483 cm_node->loc_addr);
484 i40iw_copy_ip_htonl(ip6h->daddr.in6_u.u6_addr32,
485 cm_node->rem_addr);
488 tcph->source = htons(cm_node->loc_port);
489 tcph->dest = htons(cm_node->rem_port);
491 tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
493 if (flags & SET_ACK) {
494 cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
495 tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
496 tcph->ack = 1;
497 } else {
498 tcph->ack_seq = 0;
501 if (flags & SET_SYN) {
502 cm_node->tcp_cntxt.loc_seq_num++;
503 tcph->syn = 1;
504 } else {
505 cm_node->tcp_cntxt.loc_seq_num += hdr_len + pd_len;
508 if (flags & SET_FIN) {
509 cm_node->tcp_cntxt.loc_seq_num++;
510 tcph->fin = 1;
513 if (flags & SET_RST)
514 tcph->rst = 1;
516 tcph->doff = (u16)((sizeof(*tcph) + opts_len + 3) >> 2);
517 sqbuf->tcphlen = tcph->doff << 2;
518 tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
519 tcph->urg_ptr = 0;
521 if (opts_len) {
522 memcpy(buf, options->addr, opts_len);
523 buf += opts_len;
526 if (hdr_len) {
527 memcpy(buf, hdr->addr, hdr_len);
528 buf += hdr_len;
531 if (pdata && pdata->addr)
532 memcpy(buf, pdata->addr, pdata->size);
534 atomic_set(&sqbuf->refcount, 1);
536 return sqbuf;
540 * i40iw_send_reset - Send RST packet
541 * @cm_node: connection's node
543 int i40iw_send_reset(struct i40iw_cm_node *cm_node)
545 struct i40iw_puda_buf *sqbuf;
546 int flags = SET_RST | SET_ACK;
548 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, flags);
549 if (!sqbuf) {
550 i40iw_pr_err("no sqbuf\n");
551 return -1;
554 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 0, 1);
558 * i40iw_active_open_err - send event for active side cm error
559 * @cm_node: connection's node
560 * @reset: Flag to send reset or not
562 static void i40iw_active_open_err(struct i40iw_cm_node *cm_node, bool reset)
564 i40iw_cleanup_retrans_entry(cm_node);
565 cm_node->cm_core->stats_connect_errs++;
566 if (reset) {
567 i40iw_debug(cm_node->dev,
568 I40IW_DEBUG_CM,
569 "%s cm_node=%p state=%d\n",
570 __func__,
571 cm_node,
572 cm_node->state);
573 atomic_inc(&cm_node->ref_count);
574 i40iw_send_reset(cm_node);
577 cm_node->state = I40IW_CM_STATE_CLOSED;
578 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
582 * i40iw_passive_open_err - handle passive side cm error
583 * @cm_node: connection's node
584 * @reset: send reset or just free cm_node
586 static void i40iw_passive_open_err(struct i40iw_cm_node *cm_node, bool reset)
588 i40iw_cleanup_retrans_entry(cm_node);
589 cm_node->cm_core->stats_passive_errs++;
590 cm_node->state = I40IW_CM_STATE_CLOSED;
591 i40iw_debug(cm_node->dev,
592 I40IW_DEBUG_CM,
593 "%s cm_node=%p state =%d\n",
594 __func__,
595 cm_node,
596 cm_node->state);
597 if (reset)
598 i40iw_send_reset(cm_node);
599 else
600 i40iw_rem_ref_cm_node(cm_node);
604 * i40iw_event_connect_error - to create connect error event
605 * @event: cm information for connect event
607 static void i40iw_event_connect_error(struct i40iw_cm_event *event)
609 struct i40iw_qp *iwqp;
610 struct iw_cm_id *cm_id;
612 cm_id = event->cm_node->cm_id;
613 if (!cm_id)
614 return;
616 iwqp = cm_id->provider_data;
618 if (!iwqp || !iwqp->iwdev)
619 return;
621 iwqp->cm_id = NULL;
622 cm_id->provider_data = NULL;
623 i40iw_send_cm_event(event->cm_node, cm_id,
624 IW_CM_EVENT_CONNECT_REPLY,
625 -ECONNRESET);
626 cm_id->rem_ref(cm_id);
627 i40iw_rem_ref_cm_node(event->cm_node);
631 * i40iw_process_options
632 * @cm_node: connection's node
633 * @optionsloc: point to start of options
634 * @optionsize: size of all options
635 * @syn_packet: flag if syn packet
637 static int i40iw_process_options(struct i40iw_cm_node *cm_node,
638 u8 *optionsloc,
639 u32 optionsize,
640 u32 syn_packet)
642 u32 tmp;
643 u32 offset = 0;
644 union all_known_options *all_options;
645 char got_mss_option = 0;
647 while (offset < optionsize) {
648 all_options = (union all_known_options *)(optionsloc + offset);
649 switch (all_options->as_base.optionnum) {
650 case OPTION_NUMBER_END:
651 offset = optionsize;
652 break;
653 case OPTION_NUMBER_NONE:
654 offset += 1;
655 continue;
656 case OPTION_NUMBER_MSS:
657 i40iw_debug(cm_node->dev,
658 I40IW_DEBUG_CM,
659 "%s: MSS Length: %d Offset: %d Size: %d\n",
660 __func__,
661 all_options->as_mss.length,
662 offset,
663 optionsize);
664 got_mss_option = 1;
665 if (all_options->as_mss.length != 4)
666 return -1;
667 tmp = ntohs(all_options->as_mss.mss);
668 if (tmp > 0 && tmp < cm_node->tcp_cntxt.mss)
669 cm_node->tcp_cntxt.mss = tmp;
670 break;
671 case OPTION_NUMBER_WINDOW_SCALE:
672 cm_node->tcp_cntxt.snd_wscale =
673 all_options->as_windowscale.shiftcount;
674 break;
675 default:
676 i40iw_debug(cm_node->dev,
677 I40IW_DEBUG_CM,
678 "TCP Option not understood: %x\n",
679 all_options->as_base.optionnum);
680 break;
682 offset += all_options->as_base.length;
684 if (!got_mss_option && syn_packet)
685 cm_node->tcp_cntxt.mss = I40IW_CM_DEFAULT_MSS;
686 return 0;
690 * i40iw_handle_tcp_options -
691 * @cm_node: connection's node
692 * @tcph: pointer tcp header
693 * @optionsize: size of options rcvd
694 * @passive: active or passive flag
696 static int i40iw_handle_tcp_options(struct i40iw_cm_node *cm_node,
697 struct tcphdr *tcph,
698 int optionsize,
699 int passive)
701 u8 *optionsloc = (u8 *)&tcph[1];
703 if (optionsize) {
704 if (i40iw_process_options(cm_node,
705 optionsloc,
706 optionsize,
707 (u32)tcph->syn)) {
708 i40iw_debug(cm_node->dev,
709 I40IW_DEBUG_CM,
710 "%s: Node %p, Sending RESET\n",
711 __func__,
712 cm_node);
713 if (passive)
714 i40iw_passive_open_err(cm_node, true);
715 else
716 i40iw_active_open_err(cm_node, true);
717 return -1;
721 cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
722 cm_node->tcp_cntxt.snd_wscale;
724 if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
725 cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
726 return 0;
730 * i40iw_build_mpa_v1 - build a MPA V1 frame
731 * @cm_node: connection's node
732 * @mpa_key: to do read0 or write0
734 static void i40iw_build_mpa_v1(struct i40iw_cm_node *cm_node,
735 void *start_addr,
736 u8 mpa_key)
738 struct ietf_mpa_v1 *mpa_frame = (struct ietf_mpa_v1 *)start_addr;
740 switch (mpa_key) {
741 case MPA_KEY_REQUEST:
742 memcpy(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE);
743 break;
744 case MPA_KEY_REPLY:
745 memcpy(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
746 break;
747 default:
748 break;
750 mpa_frame->flags = IETF_MPA_FLAGS_CRC;
751 mpa_frame->rev = cm_node->mpa_frame_rev;
752 mpa_frame->priv_data_len = htons(cm_node->pdata.size);
756 * i40iw_build_mpa_v2 - build a MPA V2 frame
757 * @cm_node: connection's node
758 * @start_addr: buffer start address
759 * @mpa_key: to do read0 or write0
761 static void i40iw_build_mpa_v2(struct i40iw_cm_node *cm_node,
762 void *start_addr,
763 u8 mpa_key)
765 struct ietf_mpa_v2 *mpa_frame = (struct ietf_mpa_v2 *)start_addr;
766 struct ietf_rtr_msg *rtr_msg = &mpa_frame->rtr_msg;
767 u16 ctrl_ird, ctrl_ord;
769 /* initialize the upper 5 bytes of the frame */
770 i40iw_build_mpa_v1(cm_node, start_addr, mpa_key);
771 mpa_frame->flags |= IETF_MPA_V2_FLAG;
772 mpa_frame->priv_data_len += htons(IETF_RTR_MSG_SIZE);
774 /* initialize RTR msg */
775 if (cm_node->mpav2_ird_ord == IETF_NO_IRD_ORD) {
776 ctrl_ird = IETF_NO_IRD_ORD;
777 ctrl_ord = IETF_NO_IRD_ORD;
778 } else {
779 ctrl_ird = (cm_node->ird_size > IETF_NO_IRD_ORD) ?
780 IETF_NO_IRD_ORD : cm_node->ird_size;
781 ctrl_ord = (cm_node->ord_size > IETF_NO_IRD_ORD) ?
782 IETF_NO_IRD_ORD : cm_node->ord_size;
785 ctrl_ird |= IETF_PEER_TO_PEER;
787 switch (mpa_key) {
788 case MPA_KEY_REQUEST:
789 ctrl_ord |= IETF_RDMA0_WRITE;
790 ctrl_ord |= IETF_RDMA0_READ;
791 break;
792 case MPA_KEY_REPLY:
793 switch (cm_node->send_rdma0_op) {
794 case SEND_RDMA_WRITE_ZERO:
795 ctrl_ord |= IETF_RDMA0_WRITE;
796 break;
797 case SEND_RDMA_READ_ZERO:
798 ctrl_ord |= IETF_RDMA0_READ;
799 break;
801 break;
802 default:
803 break;
805 rtr_msg->ctrl_ird = htons(ctrl_ird);
806 rtr_msg->ctrl_ord = htons(ctrl_ord);
810 * i40iw_cm_build_mpa_frame - build mpa frame for mpa version 1 or version 2
811 * @cm_node: connection's node
812 * @mpa: mpa: data buffer
813 * @mpa_key: to do read0 or write0
815 static int i40iw_cm_build_mpa_frame(struct i40iw_cm_node *cm_node,
816 struct i40iw_kmem_info *mpa,
817 u8 mpa_key)
819 int hdr_len = 0;
821 switch (cm_node->mpa_frame_rev) {
822 case IETF_MPA_V1:
823 hdr_len = sizeof(struct ietf_mpa_v1);
824 i40iw_build_mpa_v1(cm_node, mpa->addr, mpa_key);
825 break;
826 case IETF_MPA_V2:
827 hdr_len = sizeof(struct ietf_mpa_v2);
828 i40iw_build_mpa_v2(cm_node, mpa->addr, mpa_key);
829 break;
830 default:
831 break;
834 return hdr_len;
838 * i40iw_send_mpa_request - active node send mpa request to passive node
839 * @cm_node: connection's node
841 static int i40iw_send_mpa_request(struct i40iw_cm_node *cm_node)
843 struct i40iw_puda_buf *sqbuf;
845 if (!cm_node) {
846 i40iw_pr_err("cm_node == NULL\n");
847 return -1;
850 cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
851 cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
852 &cm_node->mpa_hdr,
853 MPA_KEY_REQUEST);
854 if (!cm_node->mpa_hdr.size) {
855 i40iw_pr_err("mpa size = %d\n", cm_node->mpa_hdr.size);
856 return -1;
859 sqbuf = i40iw_form_cm_frame(cm_node,
860 NULL,
861 &cm_node->mpa_hdr,
862 &cm_node->pdata,
863 SET_ACK);
864 if (!sqbuf) {
865 i40iw_pr_err("sq_buf == NULL\n");
866 return -1;
868 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
872 * i40iw_send_mpa_reject -
873 * @cm_node: connection's node
874 * @pdata: reject data for connection
875 * @plen: length of reject data
877 static int i40iw_send_mpa_reject(struct i40iw_cm_node *cm_node,
878 const void *pdata,
879 u8 plen)
881 struct i40iw_puda_buf *sqbuf;
882 struct i40iw_kmem_info priv_info;
884 cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
885 cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
886 &cm_node->mpa_hdr,
887 MPA_KEY_REPLY);
889 cm_node->mpa_frame.flags |= IETF_MPA_FLAGS_REJECT;
890 priv_info.addr = (void *)pdata;
891 priv_info.size = plen;
893 sqbuf = i40iw_form_cm_frame(cm_node,
894 NULL,
895 &cm_node->mpa_hdr,
896 &priv_info,
897 SET_ACK | SET_FIN);
898 if (!sqbuf) {
899 i40iw_pr_err("no sqbuf\n");
900 return -ENOMEM;
902 cm_node->state = I40IW_CM_STATE_FIN_WAIT1;
903 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
907 * recv_mpa - process an IETF MPA frame
908 * @cm_node: connection's node
909 * @buffer: Data pointer
910 * @type: to return accept or reject
911 * @len: Len of mpa buffer
913 static int i40iw_parse_mpa(struct i40iw_cm_node *cm_node, u8 *buffer, u32 *type, u32 len)
915 struct ietf_mpa_v1 *mpa_frame;
916 struct ietf_mpa_v2 *mpa_v2_frame;
917 struct ietf_rtr_msg *rtr_msg;
918 int mpa_hdr_len;
919 int priv_data_len;
921 *type = I40IW_MPA_REQUEST_ACCEPT;
923 if (len < sizeof(struct ietf_mpa_v1)) {
924 i40iw_pr_err("ietf buffer small (%x)\n", len);
925 return -1;
928 mpa_frame = (struct ietf_mpa_v1 *)buffer;
929 mpa_hdr_len = sizeof(struct ietf_mpa_v1);
930 priv_data_len = ntohs(mpa_frame->priv_data_len);
932 if (priv_data_len > IETF_MAX_PRIV_DATA_LEN) {
933 i40iw_pr_err("large pri_data %d\n", priv_data_len);
934 return -1;
936 if (mpa_frame->rev != IETF_MPA_V1 && mpa_frame->rev != IETF_MPA_V2) {
937 i40iw_pr_err("unsupported mpa rev = %d\n", mpa_frame->rev);
938 return -1;
940 if (mpa_frame->rev > cm_node->mpa_frame_rev) {
941 i40iw_pr_err("rev %d\n", mpa_frame->rev);
942 return -1;
944 cm_node->mpa_frame_rev = mpa_frame->rev;
946 if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
947 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE)) {
948 i40iw_pr_err("Unexpected MPA Key received\n");
949 return -1;
951 } else {
952 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE)) {
953 i40iw_pr_err("Unexpected MPA Key received\n");
954 return -1;
958 if (priv_data_len + mpa_hdr_len > len) {
959 i40iw_pr_err("ietf buffer len(%x + %x != %x)\n",
960 priv_data_len, mpa_hdr_len, len);
961 return -1;
963 if (len > MAX_CM_BUFFER) {
964 i40iw_pr_err("ietf buffer large len = %d\n", len);
965 return -1;
968 switch (mpa_frame->rev) {
969 case IETF_MPA_V2:{
970 u16 ird_size;
971 u16 ord_size;
972 u16 ctrl_ord;
973 u16 ctrl_ird;
975 mpa_v2_frame = (struct ietf_mpa_v2 *)buffer;
976 mpa_hdr_len += IETF_RTR_MSG_SIZE;
977 rtr_msg = &mpa_v2_frame->rtr_msg;
979 /* parse rtr message */
980 ctrl_ord = ntohs(rtr_msg->ctrl_ord);
981 ctrl_ird = ntohs(rtr_msg->ctrl_ird);
982 ird_size = ctrl_ird & IETF_NO_IRD_ORD;
983 ord_size = ctrl_ord & IETF_NO_IRD_ORD;
985 if (!(ctrl_ird & IETF_PEER_TO_PEER))
986 return -1;
988 if (ird_size == IETF_NO_IRD_ORD || ord_size == IETF_NO_IRD_ORD) {
989 cm_node->mpav2_ird_ord = IETF_NO_IRD_ORD;
990 goto negotiate_done;
993 if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
994 /* responder */
995 if (!ord_size && (ctrl_ord & IETF_RDMA0_READ))
996 cm_node->ird_size = 1;
997 if (cm_node->ord_size > ird_size)
998 cm_node->ord_size = ird_size;
999 } else {
1000 /* initiator */
1001 if (!ird_size && (ctrl_ord & IETF_RDMA0_READ))
1002 return -1;
1003 if (cm_node->ord_size > ird_size)
1004 cm_node->ord_size = ird_size;
1006 if (cm_node->ird_size < ord_size)
1007 /* no resources available */
1008 return -1;
1011 negotiate_done:
1012 if (ctrl_ord & IETF_RDMA0_READ)
1013 cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
1014 else if (ctrl_ord & IETF_RDMA0_WRITE)
1015 cm_node->send_rdma0_op = SEND_RDMA_WRITE_ZERO;
1016 else /* Not supported RDMA0 operation */
1017 return -1;
1018 i40iw_debug(cm_node->dev, I40IW_DEBUG_CM,
1019 "MPAV2: Negotiated ORD: %d, IRD: %d\n",
1020 cm_node->ord_size, cm_node->ird_size);
1021 break;
1023 break;
1024 case IETF_MPA_V1:
1025 default:
1026 break;
1029 memcpy(cm_node->pdata_buf, buffer + mpa_hdr_len, priv_data_len);
1030 cm_node->pdata.size = priv_data_len;
1032 if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
1033 *type = I40IW_MPA_REQUEST_REJECT;
1035 if (mpa_frame->flags & IETF_MPA_FLAGS_MARKERS)
1036 cm_node->snd_mark_en = true;
1038 return 0;
1042 * i40iw_schedule_cm_timer
1043 * @@cm_node: connection's node
1044 * @sqbuf: buffer to send
1045 * @type: if it is send or close
1046 * @send_retrans: if rexmits to be done
1047 * @close_when_complete: is cm_node to be removed
1049 * note - cm_node needs to be protected before calling this. Encase in:
1050 * i40iw_rem_ref_cm_node(cm_core, cm_node);
1051 * i40iw_schedule_cm_timer(...)
1052 * atomic_inc(&cm_node->ref_count);
1054 int i40iw_schedule_cm_timer(struct i40iw_cm_node *cm_node,
1055 struct i40iw_puda_buf *sqbuf,
1056 enum i40iw_timer_type type,
1057 int send_retrans,
1058 int close_when_complete)
1060 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1061 struct i40iw_cm_core *cm_core = cm_node->cm_core;
1062 struct i40iw_timer_entry *new_send;
1063 int ret = 0;
1064 u32 was_timer_set;
1065 unsigned long flags;
1067 new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
1068 if (!new_send) {
1069 if (type != I40IW_TIMER_TYPE_CLOSE)
1070 i40iw_free_sqbuf(vsi, (void *)sqbuf);
1071 return -ENOMEM;
1073 new_send->retrycount = I40IW_DEFAULT_RETRYS;
1074 new_send->retranscount = I40IW_DEFAULT_RETRANS;
1075 new_send->sqbuf = sqbuf;
1076 new_send->timetosend = jiffies;
1077 new_send->type = type;
1078 new_send->send_retrans = send_retrans;
1079 new_send->close_when_complete = close_when_complete;
1081 if (type == I40IW_TIMER_TYPE_CLOSE) {
1082 new_send->timetosend += (HZ / 10);
1083 if (cm_node->close_entry) {
1084 kfree(new_send);
1085 i40iw_pr_err("already close entry\n");
1086 return -EINVAL;
1088 cm_node->close_entry = new_send;
1091 if (type == I40IW_TIMER_TYPE_SEND) {
1092 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1093 cm_node->send_entry = new_send;
1094 atomic_inc(&cm_node->ref_count);
1095 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1096 new_send->timetosend = jiffies + I40IW_RETRY_TIMEOUT;
1098 atomic_inc(&sqbuf->refcount);
1099 i40iw_puda_send_buf(vsi->ilq, sqbuf);
1100 if (!send_retrans) {
1101 i40iw_cleanup_retrans_entry(cm_node);
1102 if (close_when_complete)
1103 i40iw_rem_ref_cm_node(cm_node);
1104 return ret;
1108 spin_lock_irqsave(&cm_core->ht_lock, flags);
1109 was_timer_set = timer_pending(&cm_core->tcp_timer);
1111 if (!was_timer_set) {
1112 cm_core->tcp_timer.expires = new_send->timetosend;
1113 add_timer(&cm_core->tcp_timer);
1115 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1117 return ret;
1121 * i40iw_retrans_expired - Could not rexmit the packet
1122 * @cm_node: connection's node
1124 static void i40iw_retrans_expired(struct i40iw_cm_node *cm_node)
1126 struct iw_cm_id *cm_id = cm_node->cm_id;
1127 enum i40iw_cm_node_state state = cm_node->state;
1129 cm_node->state = I40IW_CM_STATE_CLOSED;
1130 switch (state) {
1131 case I40IW_CM_STATE_SYN_RCVD:
1132 case I40IW_CM_STATE_CLOSING:
1133 i40iw_rem_ref_cm_node(cm_node);
1134 break;
1135 case I40IW_CM_STATE_FIN_WAIT1:
1136 case I40IW_CM_STATE_LAST_ACK:
1137 if (cm_node->cm_id)
1138 cm_id->rem_ref(cm_id);
1139 i40iw_send_reset(cm_node);
1140 break;
1141 default:
1142 atomic_inc(&cm_node->ref_count);
1143 i40iw_send_reset(cm_node);
1144 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
1145 break;
1150 * i40iw_handle_close_entry - for handling retry/timeouts
1151 * @cm_node: connection's node
1152 * @rem_node: flag for remove cm_node
1154 static void i40iw_handle_close_entry(struct i40iw_cm_node *cm_node, u32 rem_node)
1156 struct i40iw_timer_entry *close_entry = cm_node->close_entry;
1157 struct iw_cm_id *cm_id = cm_node->cm_id;
1158 struct i40iw_qp *iwqp;
1159 unsigned long flags;
1161 if (!close_entry)
1162 return;
1163 iwqp = (struct i40iw_qp *)close_entry->sqbuf;
1164 if (iwqp) {
1165 spin_lock_irqsave(&iwqp->lock, flags);
1166 if (iwqp->cm_id) {
1167 iwqp->hw_tcp_state = I40IW_TCP_STATE_CLOSED;
1168 iwqp->hw_iwarp_state = I40IW_QP_STATE_ERROR;
1169 iwqp->last_aeq = I40IW_AE_RESET_SENT;
1170 iwqp->ibqp_state = IB_QPS_ERR;
1171 spin_unlock_irqrestore(&iwqp->lock, flags);
1172 i40iw_cm_disconn(iwqp);
1173 } else {
1174 spin_unlock_irqrestore(&iwqp->lock, flags);
1176 } else if (rem_node) {
1177 /* TIME_WAIT state */
1178 i40iw_rem_ref_cm_node(cm_node);
1180 if (cm_id)
1181 cm_id->rem_ref(cm_id);
1182 kfree(close_entry);
1183 cm_node->close_entry = NULL;
1187 * i40iw_build_timer_list - Add cm_nodes to timer list
1188 * @timer_list: ptr to timer list
1189 * @hte: ptr to accelerated or non-accelerated list
1191 static void i40iw_build_timer_list(struct list_head *timer_list,
1192 struct list_head *hte)
1194 struct i40iw_cm_node *cm_node;
1195 struct list_head *list_core_temp, *list_node;
1197 list_for_each_safe(list_node, list_core_temp, hte) {
1198 cm_node = container_of(list_node, struct i40iw_cm_node, list);
1199 if (cm_node->close_entry || cm_node->send_entry) {
1200 atomic_inc(&cm_node->ref_count);
1201 list_add(&cm_node->timer_entry, timer_list);
1207 * i40iw_cm_timer_tick - system's timer expired callback
1208 * @pass: Pointing to cm_core
1210 static void i40iw_cm_timer_tick(struct timer_list *t)
1212 unsigned long nexttimeout = jiffies + I40IW_LONG_TIME;
1213 struct i40iw_cm_node *cm_node;
1214 struct i40iw_timer_entry *send_entry, *close_entry;
1215 struct list_head *list_core_temp;
1216 struct i40iw_sc_vsi *vsi;
1217 struct list_head *list_node;
1218 struct i40iw_cm_core *cm_core = from_timer(cm_core, t, tcp_timer);
1219 u32 settimer = 0;
1220 unsigned long timetosend;
1221 unsigned long flags;
1223 struct list_head timer_list;
1225 INIT_LIST_HEAD(&timer_list);
1227 spin_lock_irqsave(&cm_core->ht_lock, flags);
1228 i40iw_build_timer_list(&timer_list, &cm_core->non_accelerated_list);
1229 i40iw_build_timer_list(&timer_list, &cm_core->accelerated_list);
1230 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1232 list_for_each_safe(list_node, list_core_temp, &timer_list) {
1233 cm_node = container_of(list_node,
1234 struct i40iw_cm_node,
1235 timer_entry);
1236 close_entry = cm_node->close_entry;
1238 if (close_entry) {
1239 if (time_after(close_entry->timetosend, jiffies)) {
1240 if (nexttimeout > close_entry->timetosend ||
1241 !settimer) {
1242 nexttimeout = close_entry->timetosend;
1243 settimer = 1;
1245 } else {
1246 i40iw_handle_close_entry(cm_node, 1);
1250 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1252 send_entry = cm_node->send_entry;
1253 if (!send_entry)
1254 goto done;
1255 if (time_after(send_entry->timetosend, jiffies)) {
1256 if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
1257 if ((nexttimeout > send_entry->timetosend) ||
1258 !settimer) {
1259 nexttimeout = send_entry->timetosend;
1260 settimer = 1;
1262 } else {
1263 i40iw_free_retrans_entry(cm_node);
1265 goto done;
1268 if ((cm_node->state == I40IW_CM_STATE_OFFLOADED) ||
1269 (cm_node->state == I40IW_CM_STATE_CLOSED)) {
1270 i40iw_free_retrans_entry(cm_node);
1271 goto done;
1274 if (!send_entry->retranscount || !send_entry->retrycount) {
1275 i40iw_free_retrans_entry(cm_node);
1277 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1278 i40iw_retrans_expired(cm_node);
1279 cm_node->state = I40IW_CM_STATE_CLOSED;
1280 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1281 goto done;
1283 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1285 vsi = &cm_node->iwdev->vsi;
1287 if (!cm_node->ack_rcvd) {
1288 atomic_inc(&send_entry->sqbuf->refcount);
1289 i40iw_puda_send_buf(vsi->ilq, send_entry->sqbuf);
1290 cm_node->cm_core->stats_pkt_retrans++;
1292 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1293 if (send_entry->send_retrans) {
1294 send_entry->retranscount--;
1295 timetosend = (I40IW_RETRY_TIMEOUT <<
1296 (I40IW_DEFAULT_RETRANS -
1297 send_entry->retranscount));
1299 send_entry->timetosend = jiffies +
1300 min(timetosend, I40IW_MAX_TIMEOUT);
1301 if (nexttimeout > send_entry->timetosend || !settimer) {
1302 nexttimeout = send_entry->timetosend;
1303 settimer = 1;
1305 } else {
1306 int close_when_complete;
1308 close_when_complete = send_entry->close_when_complete;
1309 i40iw_debug(cm_node->dev,
1310 I40IW_DEBUG_CM,
1311 "cm_node=%p state=%d\n",
1312 cm_node,
1313 cm_node->state);
1314 i40iw_free_retrans_entry(cm_node);
1315 if (close_when_complete)
1316 i40iw_rem_ref_cm_node(cm_node);
1318 done:
1319 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1320 i40iw_rem_ref_cm_node(cm_node);
1323 if (settimer) {
1324 spin_lock_irqsave(&cm_core->ht_lock, flags);
1325 if (!timer_pending(&cm_core->tcp_timer)) {
1326 cm_core->tcp_timer.expires = nexttimeout;
1327 add_timer(&cm_core->tcp_timer);
1329 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1334 * i40iw_send_syn - send SYN packet
1335 * @cm_node: connection's node
1336 * @sendack: flag to set ACK bit or not
1338 int i40iw_send_syn(struct i40iw_cm_node *cm_node, u32 sendack)
1340 struct i40iw_puda_buf *sqbuf;
1341 int flags = SET_SYN;
1342 char optionsbuffer[sizeof(struct option_mss) +
1343 sizeof(struct option_windowscale) +
1344 sizeof(struct option_base) + TCP_OPTIONS_PADDING];
1345 struct i40iw_kmem_info opts;
1347 int optionssize = 0;
1348 /* Sending MSS option */
1349 union all_known_options *options;
1351 opts.addr = optionsbuffer;
1352 if (!cm_node) {
1353 i40iw_pr_err("no cm_node\n");
1354 return -EINVAL;
1357 options = (union all_known_options *)&optionsbuffer[optionssize];
1358 options->as_mss.optionnum = OPTION_NUMBER_MSS;
1359 options->as_mss.length = sizeof(struct option_mss);
1360 options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
1361 optionssize += sizeof(struct option_mss);
1363 options = (union all_known_options *)&optionsbuffer[optionssize];
1364 options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
1365 options->as_windowscale.length = sizeof(struct option_windowscale);
1366 options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
1367 optionssize += sizeof(struct option_windowscale);
1368 options = (union all_known_options *)&optionsbuffer[optionssize];
1369 options->as_end = OPTION_NUMBER_END;
1370 optionssize += 1;
1372 if (sendack)
1373 flags |= SET_ACK;
1375 opts.size = optionssize;
1377 sqbuf = i40iw_form_cm_frame(cm_node, &opts, NULL, NULL, flags);
1378 if (!sqbuf) {
1379 i40iw_pr_err("no sqbuf\n");
1380 return -1;
1382 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1386 * i40iw_send_ack - Send ACK packet
1387 * @cm_node: connection's node
1389 static void i40iw_send_ack(struct i40iw_cm_node *cm_node)
1391 struct i40iw_puda_buf *sqbuf;
1392 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1394 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK);
1395 if (sqbuf)
1396 i40iw_puda_send_buf(vsi->ilq, sqbuf);
1397 else
1398 i40iw_pr_err("no sqbuf\n");
1402 * i40iw_send_fin - Send FIN pkt
1403 * @cm_node: connection's node
1405 static int i40iw_send_fin(struct i40iw_cm_node *cm_node)
1407 struct i40iw_puda_buf *sqbuf;
1409 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK | SET_FIN);
1410 if (!sqbuf) {
1411 i40iw_pr_err("no sqbuf\n");
1412 return -1;
1414 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1418 * i40iw_find_node - find a cm node that matches the reference cm node
1419 * @cm_core: cm's core
1420 * @rem_port: remote tcp port num
1421 * @rem_addr: remote ip addr
1422 * @loc_port: local tcp port num
1423 * @loc_addr: loc ip addr
1424 * @add_refcnt: flag to increment refcount of cm_node
1425 * @accelerated_list: flag for accelerated vs non-accelerated list to search
1427 struct i40iw_cm_node *i40iw_find_node(struct i40iw_cm_core *cm_core,
1428 u16 rem_port,
1429 u32 *rem_addr,
1430 u16 loc_port,
1431 u32 *loc_addr,
1432 bool add_refcnt,
1433 bool accelerated_list)
1435 struct list_head *hte;
1436 struct i40iw_cm_node *cm_node;
1437 unsigned long flags;
1439 hte = accelerated_list ?
1440 &cm_core->accelerated_list : &cm_core->non_accelerated_list;
1442 /* walk list and find cm_node associated with this session ID */
1443 spin_lock_irqsave(&cm_core->ht_lock, flags);
1444 list_for_each_entry(cm_node, hte, list) {
1445 if (!memcmp(cm_node->loc_addr, loc_addr, sizeof(cm_node->loc_addr)) &&
1446 (cm_node->loc_port == loc_port) &&
1447 !memcmp(cm_node->rem_addr, rem_addr, sizeof(cm_node->rem_addr)) &&
1448 (cm_node->rem_port == rem_port)) {
1449 if (add_refcnt)
1450 atomic_inc(&cm_node->ref_count);
1451 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1452 return cm_node;
1455 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1457 /* no owner node */
1458 return NULL;
1462 * i40iw_find_listener - find a cm node listening on this addr-port pair
1463 * @cm_core: cm's core
1464 * @dst_port: listener tcp port num
1465 * @dst_addr: listener ip addr
1466 * @listener_state: state to match with listen node's
1468 static struct i40iw_cm_listener *i40iw_find_listener(
1469 struct i40iw_cm_core *cm_core,
1470 u32 *dst_addr,
1471 u16 dst_port,
1472 u16 vlan_id,
1473 enum i40iw_cm_listener_state
1474 listener_state)
1476 struct i40iw_cm_listener *listen_node;
1477 static const u32 ip_zero[4] = { 0, 0, 0, 0 };
1478 u32 listen_addr[4];
1479 u16 listen_port;
1480 unsigned long flags;
1482 /* walk list and find cm_node associated with this session ID */
1483 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1484 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1485 memcpy(listen_addr, listen_node->loc_addr, sizeof(listen_addr));
1486 listen_port = listen_node->loc_port;
1487 /* compare node pair, return node handle if a match */
1488 if ((!memcmp(listen_addr, dst_addr, sizeof(listen_addr)) ||
1489 !memcmp(listen_addr, ip_zero, sizeof(listen_addr))) &&
1490 (listen_port == dst_port) &&
1491 (listener_state & listen_node->listener_state)) {
1492 atomic_inc(&listen_node->ref_count);
1493 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1494 return listen_node;
1497 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1498 return NULL;
1502 * i40iw_add_hte_node - add a cm node to the hash table
1503 * @cm_core: cm's core
1504 * @cm_node: connection's node
1506 static void i40iw_add_hte_node(struct i40iw_cm_core *cm_core,
1507 struct i40iw_cm_node *cm_node)
1509 unsigned long flags;
1511 if (!cm_node || !cm_core) {
1512 i40iw_pr_err("cm_node or cm_core == NULL\n");
1513 return;
1516 spin_lock_irqsave(&cm_core->ht_lock, flags);
1517 list_add_tail(&cm_node->list, &cm_core->non_accelerated_list);
1518 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1522 * i40iw_find_port - find port that matches reference port
1523 * @hte: ptr to accelerated or non-accelerated list
1524 * @accelerated_list: flag for accelerated vs non-accelerated list
1526 static bool i40iw_find_port(struct list_head *hte, u16 port)
1528 struct i40iw_cm_node *cm_node;
1530 list_for_each_entry(cm_node, hte, list) {
1531 if (cm_node->loc_port == port)
1532 return true;
1534 return false;
1538 * i40iw_port_in_use - determine if port is in use
1539 * @cm_core: cm's core
1540 * @port: port number
1542 bool i40iw_port_in_use(struct i40iw_cm_core *cm_core, u16 port)
1544 struct i40iw_cm_listener *listen_node;
1545 unsigned long flags;
1547 spin_lock_irqsave(&cm_core->ht_lock, flags);
1548 if (i40iw_find_port(&cm_core->accelerated_list, port) ||
1549 i40iw_find_port(&cm_core->non_accelerated_list, port)) {
1550 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1551 return true;
1553 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1555 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1556 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1557 if (listen_node->loc_port == port) {
1558 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1559 return true;
1562 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1564 return false;
1568 * i40iw_del_multiple_qhash - Remove qhash and child listens
1569 * @iwdev: iWarp device
1570 * @cm_info: CM info for parent listen node
1571 * @cm_parent_listen_node: The parent listen node
1573 static enum i40iw_status_code i40iw_del_multiple_qhash(
1574 struct i40iw_device *iwdev,
1575 struct i40iw_cm_info *cm_info,
1576 struct i40iw_cm_listener *cm_parent_listen_node)
1578 struct i40iw_cm_listener *child_listen_node;
1579 enum i40iw_status_code ret = I40IW_ERR_CONFIG;
1580 struct list_head *pos, *tpos;
1581 unsigned long flags;
1583 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1584 list_for_each_safe(pos, tpos, &cm_parent_listen_node->child_listen_list) {
1585 child_listen_node = list_entry(pos, struct i40iw_cm_listener, child_listen_list);
1586 if (child_listen_node->ipv4)
1587 i40iw_debug(&iwdev->sc_dev,
1588 I40IW_DEBUG_CM,
1589 "removing child listen for IP=%pI4, port=%d, vlan=%d\n",
1590 child_listen_node->loc_addr,
1591 child_listen_node->loc_port,
1592 child_listen_node->vlan_id);
1593 else
1594 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
1595 "removing child listen for IP=%pI6, port=%d, vlan=%d\n",
1596 child_listen_node->loc_addr,
1597 child_listen_node->loc_port,
1598 child_listen_node->vlan_id);
1599 list_del(pos);
1600 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1601 sizeof(cm_info->loc_addr));
1602 cm_info->vlan_id = child_listen_node->vlan_id;
1603 if (child_listen_node->qhash_set) {
1604 ret = i40iw_manage_qhash(iwdev, cm_info,
1605 I40IW_QHASH_TYPE_TCP_SYN,
1606 I40IW_QHASH_MANAGE_TYPE_DELETE,
1607 NULL, false);
1608 child_listen_node->qhash_set = false;
1609 } else {
1610 ret = I40IW_SUCCESS;
1612 i40iw_debug(&iwdev->sc_dev,
1613 I40IW_DEBUG_CM,
1614 "freed pointer = %p\n",
1615 child_listen_node);
1616 kfree(child_listen_node);
1617 cm_parent_listen_node->cm_core->stats_listen_nodes_destroyed++;
1619 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1621 return ret;
1625 * i40iw_netdev_vlan_ipv6 - Gets the netdev and vlan
1626 * @addr: local IPv6 address
1627 * @vlan_id: vlan id for the given IPv6 address
1629 * Returns the net_device of the IPv6 address and also sets the
1630 * vlan id for that address.
1632 static struct net_device *i40iw_netdev_vlan_ipv6(u32 *addr, u16 *vlan_id)
1634 struct net_device *ip_dev = NULL;
1635 struct in6_addr laddr6;
1637 if (!IS_ENABLED(CONFIG_IPV6))
1638 return NULL;
1639 i40iw_copy_ip_htonl(laddr6.in6_u.u6_addr32, addr);
1640 if (vlan_id)
1641 *vlan_id = I40IW_NO_VLAN;
1642 rcu_read_lock();
1643 for_each_netdev_rcu(&init_net, ip_dev) {
1644 if (ipv6_chk_addr(&init_net, &laddr6, ip_dev, 1)) {
1645 if (vlan_id)
1646 *vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1647 break;
1650 rcu_read_unlock();
1651 return ip_dev;
1655 * i40iw_get_vlan_ipv4 - Returns the vlan_id for IPv4 address
1656 * @addr: local IPv4 address
1658 static u16 i40iw_get_vlan_ipv4(u32 *addr)
1660 struct net_device *netdev;
1661 u16 vlan_id = I40IW_NO_VLAN;
1663 netdev = ip_dev_find(&init_net, htonl(addr[0]));
1664 if (netdev) {
1665 vlan_id = rdma_vlan_dev_vlan_id(netdev);
1666 dev_put(netdev);
1668 return vlan_id;
1672 * i40iw_add_mqh_6 - Adds multiple qhashes for IPv6
1673 * @iwdev: iWarp device
1674 * @cm_info: CM info for parent listen node
1675 * @cm_parent_listen_node: The parent listen node
1677 * Adds a qhash and a child listen node for every IPv6 address
1678 * on the adapter and adds the associated qhash filter
1680 static enum i40iw_status_code i40iw_add_mqh_6(struct i40iw_device *iwdev,
1681 struct i40iw_cm_info *cm_info,
1682 struct i40iw_cm_listener *cm_parent_listen_node)
1684 struct net_device *ip_dev;
1685 struct inet6_dev *idev;
1686 struct inet6_ifaddr *ifp, *tmp;
1687 enum i40iw_status_code ret = 0;
1688 struct i40iw_cm_listener *child_listen_node;
1689 unsigned long flags;
1691 rtnl_lock();
1692 for_each_netdev(&init_net, ip_dev) {
1693 if ((((rdma_vlan_dev_vlan_id(ip_dev) < I40IW_NO_VLAN) &&
1694 (rdma_vlan_dev_real_dev(ip_dev) == iwdev->netdev)) ||
1695 (ip_dev == iwdev->netdev)) && (ip_dev->flags & IFF_UP)) {
1696 idev = __in6_dev_get(ip_dev);
1697 if (!idev) {
1698 i40iw_pr_err("idev == NULL\n");
1699 break;
1701 list_for_each_entry_safe(ifp, tmp, &idev->addr_list, if_list) {
1702 i40iw_debug(&iwdev->sc_dev,
1703 I40IW_DEBUG_CM,
1704 "IP=%pI6, vlan_id=%d, MAC=%pM\n",
1705 &ifp->addr,
1706 rdma_vlan_dev_vlan_id(ip_dev),
1707 ip_dev->dev_addr);
1708 child_listen_node =
1709 kzalloc(sizeof(*child_listen_node), GFP_ATOMIC);
1710 i40iw_debug(&iwdev->sc_dev,
1711 I40IW_DEBUG_CM,
1712 "Allocating child listener %p\n",
1713 child_listen_node);
1714 if (!child_listen_node) {
1715 ret = I40IW_ERR_NO_MEMORY;
1716 goto exit;
1718 cm_info->vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1719 cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1721 memcpy(child_listen_node, cm_parent_listen_node,
1722 sizeof(*child_listen_node));
1724 i40iw_copy_ip_ntohl(child_listen_node->loc_addr,
1725 ifp->addr.in6_u.u6_addr32);
1726 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1727 sizeof(cm_info->loc_addr));
1729 ret = i40iw_manage_qhash(iwdev, cm_info,
1730 I40IW_QHASH_TYPE_TCP_SYN,
1731 I40IW_QHASH_MANAGE_TYPE_ADD,
1732 NULL, true);
1733 if (!ret) {
1734 child_listen_node->qhash_set = true;
1735 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1736 list_add(&child_listen_node->child_listen_list,
1737 &cm_parent_listen_node->child_listen_list);
1738 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1739 cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1740 } else {
1741 kfree(child_listen_node);
1746 exit:
1747 rtnl_unlock();
1748 return ret;
1752 * i40iw_add_mqh_4 - Adds multiple qhashes for IPv4
1753 * @iwdev: iWarp device
1754 * @cm_info: CM info for parent listen node
1755 * @cm_parent_listen_node: The parent listen node
1757 * Adds a qhash and a child listen node for every IPv4 address
1758 * on the adapter and adds the associated qhash filter
1760 static enum i40iw_status_code i40iw_add_mqh_4(
1761 struct i40iw_device *iwdev,
1762 struct i40iw_cm_info *cm_info,
1763 struct i40iw_cm_listener *cm_parent_listen_node)
1765 struct net_device *dev;
1766 struct in_device *idev;
1767 struct i40iw_cm_listener *child_listen_node;
1768 enum i40iw_status_code ret = 0;
1769 unsigned long flags;
1771 rtnl_lock();
1772 for_each_netdev(&init_net, dev) {
1773 if ((((rdma_vlan_dev_vlan_id(dev) < I40IW_NO_VLAN) &&
1774 (rdma_vlan_dev_real_dev(dev) == iwdev->netdev)) ||
1775 (dev == iwdev->netdev)) && (dev->flags & IFF_UP)) {
1776 const struct in_ifaddr *ifa;
1778 idev = in_dev_get(dev);
1780 in_dev_for_each_ifa_rtnl(ifa, idev) {
1781 i40iw_debug(&iwdev->sc_dev,
1782 I40IW_DEBUG_CM,
1783 "Allocating child CM Listener forIP=%pI4, vlan_id=%d, MAC=%pM\n",
1784 &ifa->ifa_address,
1785 rdma_vlan_dev_vlan_id(dev),
1786 dev->dev_addr);
1787 child_listen_node = kzalloc(sizeof(*child_listen_node), GFP_KERNEL);
1788 cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1789 i40iw_debug(&iwdev->sc_dev,
1790 I40IW_DEBUG_CM,
1791 "Allocating child listener %p\n",
1792 child_listen_node);
1793 if (!child_listen_node) {
1794 in_dev_put(idev);
1795 ret = I40IW_ERR_NO_MEMORY;
1796 goto exit;
1798 cm_info->vlan_id = rdma_vlan_dev_vlan_id(dev);
1799 cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1800 memcpy(child_listen_node,
1801 cm_parent_listen_node,
1802 sizeof(*child_listen_node));
1804 child_listen_node->loc_addr[0] = ntohl(ifa->ifa_address);
1805 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1806 sizeof(cm_info->loc_addr));
1808 ret = i40iw_manage_qhash(iwdev,
1809 cm_info,
1810 I40IW_QHASH_TYPE_TCP_SYN,
1811 I40IW_QHASH_MANAGE_TYPE_ADD,
1812 NULL,
1813 true);
1814 if (!ret) {
1815 child_listen_node->qhash_set = true;
1816 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1817 list_add(&child_listen_node->child_listen_list,
1818 &cm_parent_listen_node->child_listen_list);
1819 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1820 } else {
1821 kfree(child_listen_node);
1822 cm_parent_listen_node->cm_core->stats_listen_nodes_created--;
1826 in_dev_put(idev);
1829 exit:
1830 rtnl_unlock();
1831 return ret;
1835 * i40iw_dec_refcnt_listen - delete listener and associated cm nodes
1836 * @cm_core: cm's core
1837 * @free_hanging_nodes: to free associated cm_nodes
1838 * @apbvt_del: flag to delete the apbvt
1840 static int i40iw_dec_refcnt_listen(struct i40iw_cm_core *cm_core,
1841 struct i40iw_cm_listener *listener,
1842 int free_hanging_nodes, bool apbvt_del)
1844 int ret = -EINVAL;
1845 int err = 0;
1846 struct list_head *list_pos;
1847 struct list_head *list_temp;
1848 struct i40iw_cm_node *cm_node;
1849 struct list_head reset_list;
1850 struct i40iw_cm_info nfo;
1851 struct i40iw_cm_node *loopback;
1852 enum i40iw_cm_node_state old_state;
1853 unsigned long flags;
1855 /* free non-accelerated child nodes for this listener */
1856 INIT_LIST_HEAD(&reset_list);
1857 if (free_hanging_nodes) {
1858 spin_lock_irqsave(&cm_core->ht_lock, flags);
1859 list_for_each_safe(list_pos,
1860 list_temp, &cm_core->non_accelerated_list) {
1861 cm_node = container_of(list_pos, struct i40iw_cm_node, list);
1862 if ((cm_node->listener == listener) &&
1863 !cm_node->accelerated) {
1864 atomic_inc(&cm_node->ref_count);
1865 list_add(&cm_node->reset_entry, &reset_list);
1868 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1871 list_for_each_safe(list_pos, list_temp, &reset_list) {
1872 cm_node = container_of(list_pos, struct i40iw_cm_node, reset_entry);
1873 loopback = cm_node->loopbackpartner;
1874 if (cm_node->state >= I40IW_CM_STATE_FIN_WAIT1) {
1875 i40iw_rem_ref_cm_node(cm_node);
1876 } else {
1877 if (!loopback) {
1878 i40iw_cleanup_retrans_entry(cm_node);
1879 err = i40iw_send_reset(cm_node);
1880 if (err) {
1881 cm_node->state = I40IW_CM_STATE_CLOSED;
1882 i40iw_pr_err("send reset\n");
1883 } else {
1884 old_state = cm_node->state;
1885 cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1886 if (old_state != I40IW_CM_STATE_MPAREQ_RCVD)
1887 i40iw_rem_ref_cm_node(cm_node);
1889 } else {
1890 struct i40iw_cm_event event;
1892 event.cm_node = loopback;
1893 memcpy(event.cm_info.rem_addr,
1894 loopback->rem_addr, sizeof(event.cm_info.rem_addr));
1895 memcpy(event.cm_info.loc_addr,
1896 loopback->loc_addr, sizeof(event.cm_info.loc_addr));
1897 event.cm_info.rem_port = loopback->rem_port;
1898 event.cm_info.loc_port = loopback->loc_port;
1899 event.cm_info.cm_id = loopback->cm_id;
1900 event.cm_info.ipv4 = loopback->ipv4;
1901 atomic_inc(&loopback->ref_count);
1902 loopback->state = I40IW_CM_STATE_CLOSED;
1903 i40iw_event_connect_error(&event);
1904 cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1905 i40iw_rem_ref_cm_node(cm_node);
1910 if (!atomic_dec_return(&listener->ref_count)) {
1911 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1912 list_del(&listener->list);
1913 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1915 if (listener->iwdev) {
1916 if (apbvt_del)
1917 i40iw_manage_apbvt(listener->iwdev,
1918 listener->loc_port,
1919 I40IW_MANAGE_APBVT_DEL);
1921 memcpy(nfo.loc_addr, listener->loc_addr, sizeof(nfo.loc_addr));
1922 nfo.loc_port = listener->loc_port;
1923 nfo.ipv4 = listener->ipv4;
1924 nfo.vlan_id = listener->vlan_id;
1925 nfo.user_pri = listener->user_pri;
1927 if (!list_empty(&listener->child_listen_list)) {
1928 i40iw_del_multiple_qhash(listener->iwdev, &nfo, listener);
1929 } else {
1930 if (listener->qhash_set)
1931 i40iw_manage_qhash(listener->iwdev,
1932 &nfo,
1933 I40IW_QHASH_TYPE_TCP_SYN,
1934 I40IW_QHASH_MANAGE_TYPE_DELETE,
1935 NULL,
1936 false);
1940 cm_core->stats_listen_destroyed++;
1941 kfree(listener);
1942 cm_core->stats_listen_nodes_destroyed++;
1943 listener = NULL;
1944 ret = 0;
1947 if (listener) {
1948 if (atomic_read(&listener->pend_accepts_cnt) > 0)
1949 i40iw_debug(cm_core->dev,
1950 I40IW_DEBUG_CM,
1951 "%s: listener (%p) pending accepts=%u\n",
1952 __func__,
1953 listener,
1954 atomic_read(&listener->pend_accepts_cnt));
1957 return ret;
1961 * i40iw_cm_del_listen - delete a linstener
1962 * @cm_core: cm's core
1963 * @listener: passive connection's listener
1964 * @apbvt_del: flag to delete apbvt
1966 static int i40iw_cm_del_listen(struct i40iw_cm_core *cm_core,
1967 struct i40iw_cm_listener *listener,
1968 bool apbvt_del)
1970 listener->listener_state = I40IW_CM_LISTENER_PASSIVE_STATE;
1971 listener->cm_id = NULL; /* going to be destroyed pretty soon */
1972 return i40iw_dec_refcnt_listen(cm_core, listener, 1, apbvt_del);
1976 * i40iw_addr_resolve_neigh - resolve neighbor address
1977 * @iwdev: iwarp device structure
1978 * @src_ip: local ip address
1979 * @dst_ip: remote ip address
1980 * @arpindex: if there is an arp entry
1982 static int i40iw_addr_resolve_neigh(struct i40iw_device *iwdev,
1983 u32 src_ip,
1984 u32 dst_ip,
1985 int arpindex)
1987 struct rtable *rt;
1988 struct neighbour *neigh;
1989 int rc = arpindex;
1990 __be32 dst_ipaddr = htonl(dst_ip);
1991 __be32 src_ipaddr = htonl(src_ip);
1993 rt = ip_route_output(&init_net, dst_ipaddr, src_ipaddr, 0, 0);
1994 if (IS_ERR(rt)) {
1995 i40iw_pr_err("ip_route_output\n");
1996 return rc;
1999 neigh = dst_neigh_lookup(&rt->dst, &dst_ipaddr);
2001 rcu_read_lock();
2002 if (neigh) {
2003 if (neigh->nud_state & NUD_VALID) {
2004 if (arpindex >= 0) {
2005 if (ether_addr_equal(iwdev->arp_table[arpindex].mac_addr,
2006 neigh->ha))
2007 /* Mac address same as arp table */
2008 goto resolve_neigh_exit;
2009 i40iw_manage_arp_cache(iwdev,
2010 iwdev->arp_table[arpindex].mac_addr,
2011 &dst_ip,
2012 true,
2013 I40IW_ARP_DELETE);
2016 i40iw_manage_arp_cache(iwdev, neigh->ha, &dst_ip, true, I40IW_ARP_ADD);
2017 rc = i40iw_arp_table(iwdev, &dst_ip, true, NULL, I40IW_ARP_RESOLVE);
2018 } else {
2019 neigh_event_send(neigh, NULL);
2022 resolve_neigh_exit:
2024 rcu_read_unlock();
2025 if (neigh)
2026 neigh_release(neigh);
2028 ip_rt_put(rt);
2029 return rc;
2033 * i40iw_get_dst_ipv6
2035 static struct dst_entry *i40iw_get_dst_ipv6(struct sockaddr_in6 *src_addr,
2036 struct sockaddr_in6 *dst_addr)
2038 struct dst_entry *dst;
2039 struct flowi6 fl6;
2041 memset(&fl6, 0, sizeof(fl6));
2042 fl6.daddr = dst_addr->sin6_addr;
2043 fl6.saddr = src_addr->sin6_addr;
2044 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
2045 fl6.flowi6_oif = dst_addr->sin6_scope_id;
2047 dst = ip6_route_output(&init_net, NULL, &fl6);
2048 return dst;
2052 * i40iw_addr_resolve_neigh_ipv6 - resolve neighbor ipv6 address
2053 * @iwdev: iwarp device structure
2054 * @dst_ip: remote ip address
2055 * @arpindex: if there is an arp entry
2057 static int i40iw_addr_resolve_neigh_ipv6(struct i40iw_device *iwdev,
2058 u32 *src,
2059 u32 *dest,
2060 int arpindex)
2062 struct neighbour *neigh;
2063 int rc = arpindex;
2064 struct dst_entry *dst;
2065 struct sockaddr_in6 dst_addr;
2066 struct sockaddr_in6 src_addr;
2068 memset(&dst_addr, 0, sizeof(dst_addr));
2069 dst_addr.sin6_family = AF_INET6;
2070 i40iw_copy_ip_htonl(dst_addr.sin6_addr.in6_u.u6_addr32, dest);
2071 memset(&src_addr, 0, sizeof(src_addr));
2072 src_addr.sin6_family = AF_INET6;
2073 i40iw_copy_ip_htonl(src_addr.sin6_addr.in6_u.u6_addr32, src);
2074 dst = i40iw_get_dst_ipv6(&src_addr, &dst_addr);
2075 if (!dst || dst->error) {
2076 if (dst) {
2077 i40iw_pr_err("ip6_route_output returned dst->error = %d\n",
2078 dst->error);
2079 dst_release(dst);
2081 return rc;
2084 neigh = dst_neigh_lookup(dst, dst_addr.sin6_addr.in6_u.u6_addr32);
2086 rcu_read_lock();
2087 if (neigh) {
2088 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "dst_neigh_lookup MAC=%pM\n", neigh->ha);
2089 if (neigh->nud_state & NUD_VALID) {
2090 if (arpindex >= 0) {
2091 if (ether_addr_equal
2092 (iwdev->arp_table[arpindex].mac_addr,
2093 neigh->ha)) {
2094 /* Mac address same as in arp table */
2095 goto resolve_neigh_exit6;
2097 i40iw_manage_arp_cache(iwdev,
2098 iwdev->arp_table[arpindex].mac_addr,
2099 dest,
2100 false,
2101 I40IW_ARP_DELETE);
2103 i40iw_manage_arp_cache(iwdev,
2104 neigh->ha,
2105 dest,
2106 false,
2107 I40IW_ARP_ADD);
2108 rc = i40iw_arp_table(iwdev,
2109 dest,
2110 false,
2111 NULL,
2112 I40IW_ARP_RESOLVE);
2113 } else {
2114 neigh_event_send(neigh, NULL);
2118 resolve_neigh_exit6:
2119 rcu_read_unlock();
2120 if (neigh)
2121 neigh_release(neigh);
2122 dst_release(dst);
2123 return rc;
2127 * i40iw_ipv4_is_loopback - check if loopback
2128 * @loc_addr: local addr to compare
2129 * @rem_addr: remote address
2131 static bool i40iw_ipv4_is_loopback(u32 loc_addr, u32 rem_addr)
2133 return ipv4_is_loopback(htonl(rem_addr)) || (loc_addr == rem_addr);
2137 * i40iw_ipv6_is_loopback - check if loopback
2138 * @loc_addr: local addr to compare
2139 * @rem_addr: remote address
2141 static bool i40iw_ipv6_is_loopback(u32 *loc_addr, u32 *rem_addr)
2143 struct in6_addr raddr6;
2145 i40iw_copy_ip_htonl(raddr6.in6_u.u6_addr32, rem_addr);
2146 return !memcmp(loc_addr, rem_addr, 16) || ipv6_addr_loopback(&raddr6);
2150 * i40iw_make_cm_node - create a new instance of a cm node
2151 * @cm_core: cm's core
2152 * @iwdev: iwarp device structure
2153 * @cm_info: quad info for connection
2154 * @listener: passive connection's listener
2156 static struct i40iw_cm_node *i40iw_make_cm_node(
2157 struct i40iw_cm_core *cm_core,
2158 struct i40iw_device *iwdev,
2159 struct i40iw_cm_info *cm_info,
2160 struct i40iw_cm_listener *listener)
2162 struct i40iw_cm_node *cm_node;
2163 int oldarpindex;
2164 int arpindex;
2165 struct net_device *netdev = iwdev->netdev;
2167 /* create an hte and cm_node for this instance */
2168 cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
2169 if (!cm_node)
2170 return NULL;
2172 /* set our node specific transport info */
2173 cm_node->ipv4 = cm_info->ipv4;
2174 cm_node->vlan_id = cm_info->vlan_id;
2175 if ((cm_node->vlan_id == I40IW_NO_VLAN) && iwdev->dcb)
2176 cm_node->vlan_id = 0;
2177 cm_node->tos = cm_info->tos;
2178 cm_node->user_pri = cm_info->user_pri;
2179 if (listener) {
2180 if (listener->tos != cm_info->tos)
2181 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB,
2182 "application TOS[%d] and remote client TOS[%d] mismatch\n",
2183 listener->tos, cm_info->tos);
2184 cm_node->tos = max(listener->tos, cm_info->tos);
2185 cm_node->user_pri = rt_tos2priority(cm_node->tos);
2186 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "listener: TOS:[%d] UP:[%d]\n",
2187 cm_node->tos, cm_node->user_pri);
2189 memcpy(cm_node->loc_addr, cm_info->loc_addr, sizeof(cm_node->loc_addr));
2190 memcpy(cm_node->rem_addr, cm_info->rem_addr, sizeof(cm_node->rem_addr));
2191 cm_node->loc_port = cm_info->loc_port;
2192 cm_node->rem_port = cm_info->rem_port;
2194 cm_node->mpa_frame_rev = iwdev->mpa_version;
2195 cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
2196 cm_node->ird_size = I40IW_MAX_IRD_SIZE;
2197 cm_node->ord_size = I40IW_MAX_ORD_SIZE;
2199 cm_node->listener = listener;
2200 cm_node->cm_id = cm_info->cm_id;
2201 ether_addr_copy(cm_node->loc_mac, netdev->dev_addr);
2202 spin_lock_init(&cm_node->retrans_list_lock);
2203 cm_node->ack_rcvd = false;
2205 atomic_set(&cm_node->ref_count, 1);
2206 /* associate our parent CM core */
2207 cm_node->cm_core = cm_core;
2208 cm_node->tcp_cntxt.loc_id = I40IW_CM_DEF_LOCAL_ID;
2209 cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2210 cm_node->tcp_cntxt.rcv_wnd =
2211 I40IW_CM_DEFAULT_RCV_WND_SCALED >> I40IW_CM_DEFAULT_RCV_WND_SCALE;
2212 if (cm_node->ipv4) {
2213 cm_node->tcp_cntxt.loc_seq_num = secure_tcp_seq(htonl(cm_node->loc_addr[0]),
2214 htonl(cm_node->rem_addr[0]),
2215 htons(cm_node->loc_port),
2216 htons(cm_node->rem_port));
2217 cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV4;
2218 } else if (IS_ENABLED(CONFIG_IPV6)) {
2219 __be32 loc[4] = {
2220 htonl(cm_node->loc_addr[0]), htonl(cm_node->loc_addr[1]),
2221 htonl(cm_node->loc_addr[2]), htonl(cm_node->loc_addr[3])
2223 __be32 rem[4] = {
2224 htonl(cm_node->rem_addr[0]), htonl(cm_node->rem_addr[1]),
2225 htonl(cm_node->rem_addr[2]), htonl(cm_node->rem_addr[3])
2227 cm_node->tcp_cntxt.loc_seq_num = secure_tcpv6_seq(loc, rem,
2228 htons(cm_node->loc_port),
2229 htons(cm_node->rem_port));
2230 cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV6;
2233 cm_node->iwdev = iwdev;
2234 cm_node->dev = &iwdev->sc_dev;
2236 if ((cm_node->ipv4 &&
2237 i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
2238 (!cm_node->ipv4 && i40iw_ipv6_is_loopback(cm_node->loc_addr,
2239 cm_node->rem_addr))) {
2240 arpindex = i40iw_arp_table(iwdev,
2241 cm_node->rem_addr,
2242 false,
2243 NULL,
2244 I40IW_ARP_RESOLVE);
2245 } else {
2246 oldarpindex = i40iw_arp_table(iwdev,
2247 cm_node->rem_addr,
2248 false,
2249 NULL,
2250 I40IW_ARP_RESOLVE);
2251 if (cm_node->ipv4)
2252 arpindex = i40iw_addr_resolve_neigh(iwdev,
2253 cm_info->loc_addr[0],
2254 cm_info->rem_addr[0],
2255 oldarpindex);
2256 else if (IS_ENABLED(CONFIG_IPV6))
2257 arpindex = i40iw_addr_resolve_neigh_ipv6(iwdev,
2258 cm_info->loc_addr,
2259 cm_info->rem_addr,
2260 oldarpindex);
2261 else
2262 arpindex = -EINVAL;
2264 if (arpindex < 0) {
2265 i40iw_pr_err("cm_node arpindex\n");
2266 kfree(cm_node);
2267 return NULL;
2269 ether_addr_copy(cm_node->rem_mac, iwdev->arp_table[arpindex].mac_addr);
2270 i40iw_add_hte_node(cm_core, cm_node);
2271 cm_core->stats_nodes_created++;
2272 return cm_node;
2276 * i40iw_rem_ref_cm_node - destroy an instance of a cm node
2277 * @cm_node: connection's node
2279 static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *cm_node)
2281 struct i40iw_cm_core *cm_core = cm_node->cm_core;
2282 struct i40iw_qp *iwqp;
2283 struct i40iw_cm_info nfo;
2284 unsigned long flags;
2286 spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
2287 if (atomic_dec_return(&cm_node->ref_count)) {
2288 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2289 return;
2291 list_del(&cm_node->list);
2292 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2294 /* if the node is destroyed before connection was accelerated */
2295 if (!cm_node->accelerated && cm_node->accept_pend) {
2296 pr_err("node destroyed before established\n");
2297 atomic_dec(&cm_node->listener->pend_accepts_cnt);
2299 if (cm_node->close_entry)
2300 i40iw_handle_close_entry(cm_node, 0);
2301 if (cm_node->listener) {
2302 i40iw_dec_refcnt_listen(cm_core, cm_node->listener, 0, true);
2303 } else {
2304 if (cm_node->apbvt_set) {
2305 i40iw_manage_apbvt(cm_node->iwdev,
2306 cm_node->loc_port,
2307 I40IW_MANAGE_APBVT_DEL);
2308 cm_node->apbvt_set = 0;
2310 i40iw_get_addr_info(cm_node, &nfo);
2311 if (cm_node->qhash_set) {
2312 i40iw_manage_qhash(cm_node->iwdev,
2313 &nfo,
2314 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2315 I40IW_QHASH_MANAGE_TYPE_DELETE,
2316 NULL,
2317 false);
2318 cm_node->qhash_set = 0;
2322 iwqp = cm_node->iwqp;
2323 if (iwqp) {
2324 iwqp->cm_node = NULL;
2325 i40iw_qp_rem_ref(&iwqp->ibqp);
2326 cm_node->iwqp = NULL;
2327 } else if (cm_node->qhash_set) {
2328 i40iw_get_addr_info(cm_node, &nfo);
2329 i40iw_manage_qhash(cm_node->iwdev,
2330 &nfo,
2331 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2332 I40IW_QHASH_MANAGE_TYPE_DELETE,
2333 NULL,
2334 false);
2335 cm_node->qhash_set = 0;
2338 cm_node->cm_core->stats_nodes_destroyed++;
2339 kfree(cm_node);
2343 * i40iw_handle_fin_pkt - FIN packet received
2344 * @cm_node: connection's node
2346 static void i40iw_handle_fin_pkt(struct i40iw_cm_node *cm_node)
2348 u32 ret;
2350 switch (cm_node->state) {
2351 case I40IW_CM_STATE_SYN_RCVD:
2352 case I40IW_CM_STATE_SYN_SENT:
2353 case I40IW_CM_STATE_ESTABLISHED:
2354 case I40IW_CM_STATE_MPAREJ_RCVD:
2355 cm_node->tcp_cntxt.rcv_nxt++;
2356 i40iw_cleanup_retrans_entry(cm_node);
2357 cm_node->state = I40IW_CM_STATE_LAST_ACK;
2358 i40iw_send_fin(cm_node);
2359 break;
2360 case I40IW_CM_STATE_MPAREQ_SENT:
2361 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
2362 cm_node->tcp_cntxt.rcv_nxt++;
2363 i40iw_cleanup_retrans_entry(cm_node);
2364 cm_node->state = I40IW_CM_STATE_CLOSED;
2365 atomic_inc(&cm_node->ref_count);
2366 i40iw_send_reset(cm_node);
2367 break;
2368 case I40IW_CM_STATE_FIN_WAIT1:
2369 cm_node->tcp_cntxt.rcv_nxt++;
2370 i40iw_cleanup_retrans_entry(cm_node);
2371 cm_node->state = I40IW_CM_STATE_CLOSING;
2372 i40iw_send_ack(cm_node);
2374 * Wait for ACK as this is simultaneous close.
2375 * After we receive ACK, do not send anything.
2376 * Just rm the node.
2378 break;
2379 case I40IW_CM_STATE_FIN_WAIT2:
2380 cm_node->tcp_cntxt.rcv_nxt++;
2381 i40iw_cleanup_retrans_entry(cm_node);
2382 cm_node->state = I40IW_CM_STATE_TIME_WAIT;
2383 i40iw_send_ack(cm_node);
2384 ret =
2385 i40iw_schedule_cm_timer(cm_node, NULL, I40IW_TIMER_TYPE_CLOSE, 1, 0);
2386 if (ret)
2387 i40iw_pr_err("node %p state = %d\n", cm_node, cm_node->state);
2388 break;
2389 case I40IW_CM_STATE_TIME_WAIT:
2390 cm_node->tcp_cntxt.rcv_nxt++;
2391 i40iw_cleanup_retrans_entry(cm_node);
2392 cm_node->state = I40IW_CM_STATE_CLOSED;
2393 i40iw_rem_ref_cm_node(cm_node);
2394 break;
2395 case I40IW_CM_STATE_OFFLOADED:
2396 default:
2397 i40iw_pr_err("bad state node %p state = %d\n", cm_node, cm_node->state);
2398 break;
2403 * i40iw_handle_rst_pkt - process received RST packet
2404 * @cm_node: connection's node
2405 * @rbuf: receive buffer
2407 static void i40iw_handle_rst_pkt(struct i40iw_cm_node *cm_node,
2408 struct i40iw_puda_buf *rbuf)
2410 i40iw_cleanup_retrans_entry(cm_node);
2411 switch (cm_node->state) {
2412 case I40IW_CM_STATE_SYN_SENT:
2413 case I40IW_CM_STATE_MPAREQ_SENT:
2414 switch (cm_node->mpa_frame_rev) {
2415 case IETF_MPA_V2:
2416 cm_node->mpa_frame_rev = IETF_MPA_V1;
2417 /* send a syn and goto syn sent state */
2418 cm_node->state = I40IW_CM_STATE_SYN_SENT;
2419 if (i40iw_send_syn(cm_node, 0))
2420 i40iw_active_open_err(cm_node, false);
2421 break;
2422 case IETF_MPA_V1:
2423 default:
2424 i40iw_active_open_err(cm_node, false);
2425 break;
2427 break;
2428 case I40IW_CM_STATE_MPAREQ_RCVD:
2429 atomic_inc(&cm_node->passive_state);
2430 break;
2431 case I40IW_CM_STATE_ESTABLISHED:
2432 case I40IW_CM_STATE_SYN_RCVD:
2433 case I40IW_CM_STATE_LISTENING:
2434 i40iw_pr_err("Bad state state = %d\n", cm_node->state);
2435 i40iw_passive_open_err(cm_node, false);
2436 break;
2437 case I40IW_CM_STATE_OFFLOADED:
2438 i40iw_active_open_err(cm_node, false);
2439 break;
2440 case I40IW_CM_STATE_CLOSED:
2441 break;
2442 case I40IW_CM_STATE_FIN_WAIT2:
2443 case I40IW_CM_STATE_FIN_WAIT1:
2444 case I40IW_CM_STATE_LAST_ACK:
2445 cm_node->cm_id->rem_ref(cm_node->cm_id);
2446 fallthrough;
2447 case I40IW_CM_STATE_TIME_WAIT:
2448 cm_node->state = I40IW_CM_STATE_CLOSED;
2449 i40iw_rem_ref_cm_node(cm_node);
2450 break;
2451 default:
2452 break;
2457 * i40iw_handle_rcv_mpa - Process a recv'd mpa buffer
2458 * @cm_node: connection's node
2459 * @rbuf: receive buffer
2461 static void i40iw_handle_rcv_mpa(struct i40iw_cm_node *cm_node,
2462 struct i40iw_puda_buf *rbuf)
2464 int ret;
2465 int datasize = rbuf->datalen;
2466 u8 *dataloc = rbuf->data;
2468 enum i40iw_cm_event_type type = I40IW_CM_EVENT_UNKNOWN;
2469 u32 res_type;
2471 ret = i40iw_parse_mpa(cm_node, dataloc, &res_type, datasize);
2472 if (ret) {
2473 if (cm_node->state == I40IW_CM_STATE_MPAREQ_SENT)
2474 i40iw_active_open_err(cm_node, true);
2475 else
2476 i40iw_passive_open_err(cm_node, true);
2477 return;
2480 switch (cm_node->state) {
2481 case I40IW_CM_STATE_ESTABLISHED:
2482 if (res_type == I40IW_MPA_REQUEST_REJECT)
2483 i40iw_pr_err("state for reject\n");
2484 cm_node->state = I40IW_CM_STATE_MPAREQ_RCVD;
2485 type = I40IW_CM_EVENT_MPA_REQ;
2486 i40iw_send_ack(cm_node); /* ACK received MPA request */
2487 atomic_set(&cm_node->passive_state,
2488 I40IW_PASSIVE_STATE_INDICATED);
2489 break;
2490 case I40IW_CM_STATE_MPAREQ_SENT:
2491 i40iw_cleanup_retrans_entry(cm_node);
2492 if (res_type == I40IW_MPA_REQUEST_REJECT) {
2493 type = I40IW_CM_EVENT_MPA_REJECT;
2494 cm_node->state = I40IW_CM_STATE_MPAREJ_RCVD;
2495 } else {
2496 type = I40IW_CM_EVENT_CONNECTED;
2497 cm_node->state = I40IW_CM_STATE_OFFLOADED;
2499 i40iw_send_ack(cm_node);
2500 break;
2501 default:
2502 pr_err("%s wrong cm_node state =%d\n", __func__, cm_node->state);
2503 break;
2505 i40iw_create_event(cm_node, type);
2509 * i40iw_indicate_pkt_err - Send up err event to cm
2510 * @cm_node: connection's node
2512 static void i40iw_indicate_pkt_err(struct i40iw_cm_node *cm_node)
2514 switch (cm_node->state) {
2515 case I40IW_CM_STATE_SYN_SENT:
2516 case I40IW_CM_STATE_MPAREQ_SENT:
2517 i40iw_active_open_err(cm_node, true);
2518 break;
2519 case I40IW_CM_STATE_ESTABLISHED:
2520 case I40IW_CM_STATE_SYN_RCVD:
2521 i40iw_passive_open_err(cm_node, true);
2522 break;
2523 case I40IW_CM_STATE_OFFLOADED:
2524 default:
2525 break;
2530 * i40iw_check_syn - Check for error on received syn ack
2531 * @cm_node: connection's node
2532 * @tcph: pointer tcp header
2534 static int i40iw_check_syn(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2536 int err = 0;
2538 if (ntohl(tcph->ack_seq) != cm_node->tcp_cntxt.loc_seq_num) {
2539 err = 1;
2540 i40iw_active_open_err(cm_node, true);
2542 return err;
2546 * i40iw_check_seq - check seq numbers if OK
2547 * @cm_node: connection's node
2548 * @tcph: pointer tcp header
2550 static int i40iw_check_seq(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2552 int err = 0;
2553 u32 seq;
2554 u32 ack_seq;
2555 u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
2556 u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
2557 u32 rcv_wnd;
2559 seq = ntohl(tcph->seq);
2560 ack_seq = ntohl(tcph->ack_seq);
2561 rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
2562 if (ack_seq != loc_seq_num)
2563 err = -1;
2564 else if (!between(seq, rcv_nxt, (rcv_nxt + rcv_wnd)))
2565 err = -1;
2566 if (err) {
2567 i40iw_pr_err("seq number\n");
2568 i40iw_indicate_pkt_err(cm_node);
2570 return err;
2574 * i40iw_handle_syn_pkt - is for Passive node
2575 * @cm_node: connection's node
2576 * @rbuf: receive buffer
2578 static void i40iw_handle_syn_pkt(struct i40iw_cm_node *cm_node,
2579 struct i40iw_puda_buf *rbuf)
2581 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2582 int ret;
2583 u32 inc_sequence;
2584 int optionsize;
2585 struct i40iw_cm_info nfo;
2587 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2588 inc_sequence = ntohl(tcph->seq);
2590 switch (cm_node->state) {
2591 case I40IW_CM_STATE_SYN_SENT:
2592 case I40IW_CM_STATE_MPAREQ_SENT:
2593 /* Rcvd syn on active open connection */
2594 i40iw_active_open_err(cm_node, 1);
2595 break;
2596 case I40IW_CM_STATE_LISTENING:
2597 /* Passive OPEN */
2598 if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
2599 cm_node->listener->backlog) {
2600 cm_node->cm_core->stats_backlog_drops++;
2601 i40iw_passive_open_err(cm_node, false);
2602 break;
2604 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2605 if (ret) {
2606 i40iw_passive_open_err(cm_node, false);
2607 /* drop pkt */
2608 break;
2610 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2611 cm_node->accept_pend = 1;
2612 atomic_inc(&cm_node->listener->pend_accepts_cnt);
2614 cm_node->state = I40IW_CM_STATE_SYN_RCVD;
2615 i40iw_get_addr_info(cm_node, &nfo);
2616 ret = i40iw_manage_qhash(cm_node->iwdev,
2617 &nfo,
2618 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2619 I40IW_QHASH_MANAGE_TYPE_ADD,
2620 (void *)cm_node,
2621 false);
2622 cm_node->qhash_set = true;
2623 break;
2624 case I40IW_CM_STATE_CLOSED:
2625 i40iw_cleanup_retrans_entry(cm_node);
2626 atomic_inc(&cm_node->ref_count);
2627 i40iw_send_reset(cm_node);
2628 break;
2629 case I40IW_CM_STATE_OFFLOADED:
2630 case I40IW_CM_STATE_ESTABLISHED:
2631 case I40IW_CM_STATE_FIN_WAIT1:
2632 case I40IW_CM_STATE_FIN_WAIT2:
2633 case I40IW_CM_STATE_MPAREQ_RCVD:
2634 case I40IW_CM_STATE_LAST_ACK:
2635 case I40IW_CM_STATE_CLOSING:
2636 case I40IW_CM_STATE_UNKNOWN:
2637 default:
2638 break;
2643 * i40iw_handle_synack_pkt - Process SYN+ACK packet (active side)
2644 * @cm_node: connection's node
2645 * @rbuf: receive buffer
2647 static void i40iw_handle_synack_pkt(struct i40iw_cm_node *cm_node,
2648 struct i40iw_puda_buf *rbuf)
2650 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2651 int ret;
2652 u32 inc_sequence;
2653 int optionsize;
2655 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2656 inc_sequence = ntohl(tcph->seq);
2657 switch (cm_node->state) {
2658 case I40IW_CM_STATE_SYN_SENT:
2659 i40iw_cleanup_retrans_entry(cm_node);
2660 /* active open */
2661 if (i40iw_check_syn(cm_node, tcph)) {
2662 i40iw_pr_err("check syn fail\n");
2663 return;
2665 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2666 /* setup options */
2667 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 0);
2668 if (ret) {
2669 i40iw_debug(cm_node->dev,
2670 I40IW_DEBUG_CM,
2671 "cm_node=%p tcp_options failed\n",
2672 cm_node);
2673 break;
2675 i40iw_cleanup_retrans_entry(cm_node);
2676 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2677 i40iw_send_ack(cm_node); /* ACK for the syn_ack */
2678 ret = i40iw_send_mpa_request(cm_node);
2679 if (ret) {
2680 i40iw_debug(cm_node->dev,
2681 I40IW_DEBUG_CM,
2682 "cm_node=%p i40iw_send_mpa_request failed\n",
2683 cm_node);
2684 break;
2686 cm_node->state = I40IW_CM_STATE_MPAREQ_SENT;
2687 break;
2688 case I40IW_CM_STATE_MPAREQ_RCVD:
2689 i40iw_passive_open_err(cm_node, true);
2690 break;
2691 case I40IW_CM_STATE_LISTENING:
2692 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2693 i40iw_cleanup_retrans_entry(cm_node);
2694 cm_node->state = I40IW_CM_STATE_CLOSED;
2695 i40iw_send_reset(cm_node);
2696 break;
2697 case I40IW_CM_STATE_CLOSED:
2698 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2699 i40iw_cleanup_retrans_entry(cm_node);
2700 atomic_inc(&cm_node->ref_count);
2701 i40iw_send_reset(cm_node);
2702 break;
2703 case I40IW_CM_STATE_ESTABLISHED:
2704 case I40IW_CM_STATE_FIN_WAIT1:
2705 case I40IW_CM_STATE_FIN_WAIT2:
2706 case I40IW_CM_STATE_LAST_ACK:
2707 case I40IW_CM_STATE_OFFLOADED:
2708 case I40IW_CM_STATE_CLOSING:
2709 case I40IW_CM_STATE_UNKNOWN:
2710 case I40IW_CM_STATE_MPAREQ_SENT:
2711 default:
2712 break;
2717 * i40iw_handle_ack_pkt - process packet with ACK
2718 * @cm_node: connection's node
2719 * @rbuf: receive buffer
2721 static int i40iw_handle_ack_pkt(struct i40iw_cm_node *cm_node,
2722 struct i40iw_puda_buf *rbuf)
2724 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2725 u32 inc_sequence;
2726 int ret = 0;
2727 int optionsize;
2728 u32 datasize = rbuf->datalen;
2730 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2732 if (i40iw_check_seq(cm_node, tcph))
2733 return -EINVAL;
2735 inc_sequence = ntohl(tcph->seq);
2736 switch (cm_node->state) {
2737 case I40IW_CM_STATE_SYN_RCVD:
2738 i40iw_cleanup_retrans_entry(cm_node);
2739 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2740 if (ret)
2741 break;
2742 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2743 cm_node->state = I40IW_CM_STATE_ESTABLISHED;
2744 if (datasize) {
2745 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2746 i40iw_handle_rcv_mpa(cm_node, rbuf);
2748 break;
2749 case I40IW_CM_STATE_ESTABLISHED:
2750 i40iw_cleanup_retrans_entry(cm_node);
2751 if (datasize) {
2752 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2753 i40iw_handle_rcv_mpa(cm_node, rbuf);
2755 break;
2756 case I40IW_CM_STATE_MPAREQ_SENT:
2757 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2758 if (datasize) {
2759 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2760 cm_node->ack_rcvd = false;
2761 i40iw_handle_rcv_mpa(cm_node, rbuf);
2762 } else {
2763 cm_node->ack_rcvd = true;
2765 break;
2766 case I40IW_CM_STATE_LISTENING:
2767 i40iw_cleanup_retrans_entry(cm_node);
2768 cm_node->state = I40IW_CM_STATE_CLOSED;
2769 i40iw_send_reset(cm_node);
2770 break;
2771 case I40IW_CM_STATE_CLOSED:
2772 i40iw_cleanup_retrans_entry(cm_node);
2773 atomic_inc(&cm_node->ref_count);
2774 i40iw_send_reset(cm_node);
2775 break;
2776 case I40IW_CM_STATE_LAST_ACK:
2777 case I40IW_CM_STATE_CLOSING:
2778 i40iw_cleanup_retrans_entry(cm_node);
2779 cm_node->state = I40IW_CM_STATE_CLOSED;
2780 if (!cm_node->accept_pend)
2781 cm_node->cm_id->rem_ref(cm_node->cm_id);
2782 i40iw_rem_ref_cm_node(cm_node);
2783 break;
2784 case I40IW_CM_STATE_FIN_WAIT1:
2785 i40iw_cleanup_retrans_entry(cm_node);
2786 cm_node->state = I40IW_CM_STATE_FIN_WAIT2;
2787 break;
2788 case I40IW_CM_STATE_SYN_SENT:
2789 case I40IW_CM_STATE_FIN_WAIT2:
2790 case I40IW_CM_STATE_OFFLOADED:
2791 case I40IW_CM_STATE_MPAREQ_RCVD:
2792 case I40IW_CM_STATE_UNKNOWN:
2793 default:
2794 i40iw_cleanup_retrans_entry(cm_node);
2795 break;
2797 return ret;
2801 * i40iw_process_packet - process cm packet
2802 * @cm_node: connection's node
2803 * @rbuf: receive buffer
2805 static void i40iw_process_packet(struct i40iw_cm_node *cm_node,
2806 struct i40iw_puda_buf *rbuf)
2808 enum i40iw_tcpip_pkt_type pkt_type = I40IW_PKT_TYPE_UNKNOWN;
2809 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2810 u32 fin_set = 0;
2811 int ret;
2813 if (tcph->rst) {
2814 pkt_type = I40IW_PKT_TYPE_RST;
2815 } else if (tcph->syn) {
2816 pkt_type = I40IW_PKT_TYPE_SYN;
2817 if (tcph->ack)
2818 pkt_type = I40IW_PKT_TYPE_SYNACK;
2819 } else if (tcph->ack) {
2820 pkt_type = I40IW_PKT_TYPE_ACK;
2822 if (tcph->fin)
2823 fin_set = 1;
2825 switch (pkt_type) {
2826 case I40IW_PKT_TYPE_SYN:
2827 i40iw_handle_syn_pkt(cm_node, rbuf);
2828 break;
2829 case I40IW_PKT_TYPE_SYNACK:
2830 i40iw_handle_synack_pkt(cm_node, rbuf);
2831 break;
2832 case I40IW_PKT_TYPE_ACK:
2833 ret = i40iw_handle_ack_pkt(cm_node, rbuf);
2834 if (fin_set && !ret)
2835 i40iw_handle_fin_pkt(cm_node);
2836 break;
2837 case I40IW_PKT_TYPE_RST:
2838 i40iw_handle_rst_pkt(cm_node, rbuf);
2839 break;
2840 default:
2841 if (fin_set &&
2842 (!i40iw_check_seq(cm_node, (struct tcphdr *)rbuf->tcph)))
2843 i40iw_handle_fin_pkt(cm_node);
2844 break;
2849 * i40iw_make_listen_node - create a listen node with params
2850 * @cm_core: cm's core
2851 * @iwdev: iwarp device structure
2852 * @cm_info: quad info for connection
2854 static struct i40iw_cm_listener *i40iw_make_listen_node(
2855 struct i40iw_cm_core *cm_core,
2856 struct i40iw_device *iwdev,
2857 struct i40iw_cm_info *cm_info)
2859 struct i40iw_cm_listener *listener;
2860 unsigned long flags;
2862 /* cannot have multiple matching listeners */
2863 listener = i40iw_find_listener(cm_core, cm_info->loc_addr,
2864 cm_info->loc_port,
2865 cm_info->vlan_id,
2866 I40IW_CM_LISTENER_EITHER_STATE);
2867 if (listener &&
2868 (listener->listener_state == I40IW_CM_LISTENER_ACTIVE_STATE)) {
2869 atomic_dec(&listener->ref_count);
2870 i40iw_debug(cm_core->dev,
2871 I40IW_DEBUG_CM,
2872 "Not creating listener since it already exists\n");
2873 return NULL;
2876 if (!listener) {
2877 /* create a CM listen node (1/2 node to compare incoming traffic to) */
2878 listener = kzalloc(sizeof(*listener), GFP_KERNEL);
2879 if (!listener)
2880 return NULL;
2881 cm_core->stats_listen_nodes_created++;
2882 memcpy(listener->loc_addr, cm_info->loc_addr, sizeof(listener->loc_addr));
2883 listener->loc_port = cm_info->loc_port;
2885 INIT_LIST_HEAD(&listener->child_listen_list);
2887 atomic_set(&listener->ref_count, 1);
2888 } else {
2889 listener->reused_node = 1;
2892 listener->cm_id = cm_info->cm_id;
2893 listener->ipv4 = cm_info->ipv4;
2894 listener->vlan_id = cm_info->vlan_id;
2895 atomic_set(&listener->pend_accepts_cnt, 0);
2896 listener->cm_core = cm_core;
2897 listener->iwdev = iwdev;
2899 listener->backlog = cm_info->backlog;
2900 listener->listener_state = I40IW_CM_LISTENER_ACTIVE_STATE;
2902 if (!listener->reused_node) {
2903 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
2904 list_add(&listener->list, &cm_core->listen_nodes);
2905 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
2908 return listener;
/**
 * i40iw_create_cm_node - make a connection node with params
 * @cm_core: cm's core
 * @iwdev: iwarp device structure
 * @conn_param: upper layer connection parameters
 * @cm_info: quad info for connection
 *
 * Creates the active (client) side node.  When the local and remote
 * addresses are identical the connection is a loopback: the matching active
 * listener is looked up, a partner node is created on it, the two nodes are
 * cross-linked and their TCP contexts are primed from each other.  Otherwise
 * the private data is stored on the node and it is put in SYN_SENT.
 *
 * Return: the new node, ERR_PTR(-ENOMEM) when a node could not be created,
 * or ERR_PTR(-ECONNREFUSED) when a loopback connect finds no active listener.
 */
static struct i40iw_cm_node *i40iw_create_cm_node(
					struct i40iw_cm_core *cm_core,
					struct i40iw_device *iwdev,
					struct iw_cm_conn_param *conn_param,
					struct i40iw_cm_info *cm_info)
{
	struct i40iw_cm_node *cm_node;
	struct i40iw_cm_listener *loopback_remotelistener;
	struct i40iw_cm_node *loopback_remotenode;
	struct i40iw_cm_info loopback_cm_info;

	u16 private_data_len = conn_param->private_data_len;
	const void *private_data = conn_param->private_data;

	/* create a CM connection node */
	cm_node = i40iw_make_cm_node(cm_core, iwdev, cm_info, NULL);
	if (!cm_node)
		return ERR_PTR(-ENOMEM);
	/* set our node side to client (active) side */
	cm_node->tcp_cntxt.client = 1;
	cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;

	i40iw_record_ird_ord(cm_node, conn_param->ird, conn_param->ord);

	if (!memcmp(cm_info->loc_addr, cm_info->rem_addr, sizeof(cm_info->loc_addr))) {
		loopback_remotelistener = i40iw_find_listener(
						cm_core,
						cm_info->rem_addr,
						cm_node->rem_port,
						cm_node->vlan_id,
						I40IW_CM_LISTENER_ACTIVE_STATE);
		if (!loopback_remotelistener) {
			i40iw_rem_ref_cm_node(cm_node);
			return ERR_PTR(-ECONNREFUSED);
		}

		/* the partner sees the same quad with the ports swapped */
		loopback_cm_info = *cm_info;
		loopback_cm_info.loc_port = cm_info->rem_port;
		loopback_cm_info.rem_port = cm_info->loc_port;
		loopback_cm_info.cm_id = loopback_remotelistener->cm_id;
		loopback_cm_info.ipv4 = cm_info->ipv4;
		loopback_remotenode = i40iw_make_cm_node(cm_core,
							 iwdev,
							 &loopback_cm_info,
							 loopback_remotelistener);
		if (!loopback_remotenode) {
			/*
			 * No node took ownership of the listener reference
			 * returned by the lookup, so drop it here (same as
			 * the failure path in i40iw_receive_ilq()).
			 */
			atomic_dec(&loopback_remotelistener->ref_count);
			i40iw_rem_ref_cm_node(cm_node);
			return ERR_PTR(-ENOMEM);
		}

		cm_core->stats_loopbacks++;
		loopback_remotenode->loopbackpartner = cm_node;
		loopback_remotenode->tcp_cntxt.rcv_wscale =
			I40IW_CM_DEFAULT_RCV_WND_SCALE;
		cm_node->loopbackpartner = loopback_remotenode;
		memcpy(loopback_remotenode->pdata_buf, private_data,
		       private_data_len);
		loopback_remotenode->pdata.size = private_data_len;

		/* the partner may not issue more reads than we accept */
		if (loopback_remotenode->ord_size > cm_node->ird_size)
			loopback_remotenode->ord_size =
				cm_node->ird_size;

		cm_node->state = I40IW_CM_STATE_OFFLOADED;

		/* prime each side's TCP context from the other side */
		cm_node->tcp_cntxt.rcv_nxt =
			loopback_remotenode->tcp_cntxt.loc_seq_num;
		loopback_remotenode->tcp_cntxt.rcv_nxt =
			cm_node->tcp_cntxt.loc_seq_num;
		cm_node->tcp_cntxt.max_snd_wnd =
			loopback_remotenode->tcp_cntxt.rcv_wnd;
		loopback_remotenode->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
		cm_node->tcp_cntxt.snd_wnd = loopback_remotenode->tcp_cntxt.rcv_wnd;
		loopback_remotenode->tcp_cntxt.snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
		cm_node->tcp_cntxt.snd_wscale = loopback_remotenode->tcp_cntxt.rcv_wscale;
		loopback_remotenode->tcp_cntxt.snd_wscale = cm_node->tcp_cntxt.rcv_wscale;

		return cm_node;
	}

	/* regular (non-loopback) connect: keep the private data on the node */
	cm_node->pdata.size = private_data_len;
	cm_node->pdata.addr = cm_node->pdata_buf;

	memcpy(cm_node->pdata_buf, private_data, private_data_len);

	cm_node->state = I40IW_CM_STATE_SYN_SENT;
	return cm_node;
}
3005 * i40iw_cm_reject - reject and teardown a connection
3006 * @cm_node: connection's node
3007 * @pdate: ptr to private data for reject
3008 * @plen: size of private data
3010 static int i40iw_cm_reject(struct i40iw_cm_node *cm_node, const void *pdata, u8 plen)
3012 int ret = 0;
3013 int err;
3014 int passive_state;
3015 struct iw_cm_id *cm_id = cm_node->cm_id;
3016 struct i40iw_cm_node *loopback = cm_node->loopbackpartner;
3018 if (cm_node->tcp_cntxt.client)
3019 return ret;
3020 i40iw_cleanup_retrans_entry(cm_node);
3022 if (!loopback) {
3023 passive_state = atomic_inc_return(&cm_node->passive_state);
3024 if (passive_state == I40IW_SEND_RESET_EVENT) {
3025 cm_node->state = I40IW_CM_STATE_CLOSED;
3026 i40iw_rem_ref_cm_node(cm_node);
3027 } else {
3028 if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3029 i40iw_rem_ref_cm_node(cm_node);
3030 } else {
3031 ret = i40iw_send_mpa_reject(cm_node, pdata, plen);
3032 if (ret) {
3033 cm_node->state = I40IW_CM_STATE_CLOSED;
3034 err = i40iw_send_reset(cm_node);
3035 if (err)
3036 i40iw_pr_err("send reset failed\n");
3037 } else {
3038 cm_id->add_ref(cm_id);
3042 } else {
3043 cm_node->cm_id = NULL;
3044 if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3045 i40iw_rem_ref_cm_node(cm_node);
3046 i40iw_rem_ref_cm_node(loopback);
3047 } else {
3048 ret = i40iw_send_cm_event(loopback,
3049 loopback->cm_id,
3050 IW_CM_EVENT_CONNECT_REPLY,
3051 -ECONNREFUSED);
3052 i40iw_rem_ref_cm_node(cm_node);
3053 loopback->state = I40IW_CM_STATE_CLOSING;
3055 cm_id = loopback->cm_id;
3056 i40iw_rem_ref_cm_node(loopback);
3057 cm_id->rem_ref(cm_id);
3061 return ret;
3065 * i40iw_cm_close - close of cm connection
3066 * @cm_node: connection's node
3068 static int i40iw_cm_close(struct i40iw_cm_node *cm_node)
3070 int ret = 0;
3072 if (!cm_node)
3073 return -EINVAL;
3075 switch (cm_node->state) {
3076 case I40IW_CM_STATE_SYN_RCVD:
3077 case I40IW_CM_STATE_SYN_SENT:
3078 case I40IW_CM_STATE_ONE_SIDE_ESTABLISHED:
3079 case I40IW_CM_STATE_ESTABLISHED:
3080 case I40IW_CM_STATE_ACCEPTING:
3081 case I40IW_CM_STATE_MPAREQ_SENT:
3082 case I40IW_CM_STATE_MPAREQ_RCVD:
3083 i40iw_cleanup_retrans_entry(cm_node);
3084 i40iw_send_reset(cm_node);
3085 break;
3086 case I40IW_CM_STATE_CLOSE_WAIT:
3087 cm_node->state = I40IW_CM_STATE_LAST_ACK;
3088 i40iw_send_fin(cm_node);
3089 break;
3090 case I40IW_CM_STATE_FIN_WAIT1:
3091 case I40IW_CM_STATE_FIN_WAIT2:
3092 case I40IW_CM_STATE_LAST_ACK:
3093 case I40IW_CM_STATE_TIME_WAIT:
3094 case I40IW_CM_STATE_CLOSING:
3095 ret = -1;
3096 break;
3097 case I40IW_CM_STATE_LISTENING:
3098 i40iw_cleanup_retrans_entry(cm_node);
3099 i40iw_send_reset(cm_node);
3100 break;
3101 case I40IW_CM_STATE_MPAREJ_RCVD:
3102 case I40IW_CM_STATE_UNKNOWN:
3103 case I40IW_CM_STATE_INITED:
3104 case I40IW_CM_STATE_CLOSED:
3105 case I40IW_CM_STATE_LISTENER_DESTROYED:
3106 i40iw_rem_ref_cm_node(cm_node);
3107 break;
3108 case I40IW_CM_STATE_OFFLOADED:
3109 if (cm_node->send_entry)
3110 i40iw_pr_err("send_entry\n");
3111 i40iw_rem_ref_cm_node(cm_node);
3112 break;
3114 return ret;
3118 * i40iw_receive_ilq - recv an ETHERNET packet, and process it
3119 * through CM
3120 * @vsi: pointer to the vsi structure
3121 * @rbuf: receive buffer
3123 void i40iw_receive_ilq(struct i40iw_sc_vsi *vsi, struct i40iw_puda_buf *rbuf)
3125 struct i40iw_cm_node *cm_node;
3126 struct i40iw_cm_listener *listener;
3127 struct iphdr *iph;
3128 struct ipv6hdr *ip6h;
3129 struct tcphdr *tcph;
3130 struct i40iw_cm_info cm_info;
3131 struct i40iw_sc_dev *dev = vsi->dev;
3132 struct i40iw_device *iwdev = (struct i40iw_device *)dev->back_dev;
3133 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3134 struct vlan_ethhdr *ethh;
3135 u16 vtag;
3137 /* if vlan, then maclen = 18 else 14 */
3138 iph = (struct iphdr *)rbuf->iph;
3139 memset(&cm_info, 0, sizeof(cm_info));
3141 i40iw_debug_buf(dev,
3142 I40IW_DEBUG_ILQ,
3143 "RECEIVE ILQ BUFFER",
3144 rbuf->mem.va,
3145 rbuf->totallen);
3146 ethh = (struct vlan_ethhdr *)rbuf->mem.va;
3148 if (ethh->h_vlan_proto == htons(ETH_P_8021Q)) {
3149 vtag = ntohs(ethh->h_vlan_TCI);
3150 cm_info.user_pri = (vtag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
3151 cm_info.vlan_id = vtag & VLAN_VID_MASK;
3152 i40iw_debug(cm_core->dev,
3153 I40IW_DEBUG_CM,
3154 "%s vlan_id=%d\n",
3155 __func__,
3156 cm_info.vlan_id);
3157 } else {
3158 cm_info.vlan_id = I40IW_NO_VLAN;
3160 tcph = (struct tcphdr *)rbuf->tcph;
3162 if (rbuf->ipv4) {
3163 cm_info.loc_addr[0] = ntohl(iph->daddr);
3164 cm_info.rem_addr[0] = ntohl(iph->saddr);
3165 cm_info.ipv4 = true;
3166 cm_info.tos = iph->tos;
3167 } else {
3168 ip6h = (struct ipv6hdr *)rbuf->iph;
3169 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3170 ip6h->daddr.in6_u.u6_addr32);
3171 i40iw_copy_ip_ntohl(cm_info.rem_addr,
3172 ip6h->saddr.in6_u.u6_addr32);
3173 cm_info.ipv4 = false;
3174 cm_info.tos = (ip6h->priority << 4) | (ip6h->flow_lbl[0] >> 4);
3176 cm_info.loc_port = ntohs(tcph->dest);
3177 cm_info.rem_port = ntohs(tcph->source);
3178 cm_node = i40iw_find_node(cm_core,
3179 cm_info.rem_port,
3180 cm_info.rem_addr,
3181 cm_info.loc_port,
3182 cm_info.loc_addr,
3183 true,
3184 false);
3186 if (!cm_node) {
3187 /* Only type of packet accepted are for */
3188 /* the PASSIVE open (syn only) */
3189 if (!tcph->syn || tcph->ack)
3190 return;
3191 listener =
3192 i40iw_find_listener(cm_core,
3193 cm_info.loc_addr,
3194 cm_info.loc_port,
3195 cm_info.vlan_id,
3196 I40IW_CM_LISTENER_ACTIVE_STATE);
3197 if (!listener) {
3198 cm_info.cm_id = NULL;
3199 i40iw_debug(cm_core->dev,
3200 I40IW_DEBUG_CM,
3201 "%s no listener found\n",
3202 __func__);
3203 return;
3205 cm_info.cm_id = listener->cm_id;
3206 cm_node = i40iw_make_cm_node(cm_core, iwdev, &cm_info, listener);
3207 if (!cm_node) {
3208 i40iw_debug(cm_core->dev,
3209 I40IW_DEBUG_CM,
3210 "%s allocate node failed\n",
3211 __func__);
3212 atomic_dec(&listener->ref_count);
3213 return;
3215 if (!tcph->rst && !tcph->fin) {
3216 cm_node->state = I40IW_CM_STATE_LISTENING;
3217 } else {
3218 i40iw_rem_ref_cm_node(cm_node);
3219 return;
3221 atomic_inc(&cm_node->ref_count);
3222 } else if (cm_node->state == I40IW_CM_STATE_OFFLOADED) {
3223 i40iw_rem_ref_cm_node(cm_node);
3224 return;
3226 i40iw_process_packet(cm_node, rbuf);
3227 i40iw_rem_ref_cm_node(cm_node);
3231 * i40iw_setup_cm_core - allocate a top level instance of a cm
3232 * core
3233 * @iwdev: iwarp device structure
3235 int i40iw_setup_cm_core(struct i40iw_device *iwdev)
3237 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3239 cm_core->iwdev = iwdev;
3240 cm_core->dev = &iwdev->sc_dev;
3242 INIT_LIST_HEAD(&cm_core->accelerated_list);
3243 INIT_LIST_HEAD(&cm_core->non_accelerated_list);
3244 INIT_LIST_HEAD(&cm_core->listen_nodes);
3246 timer_setup(&cm_core->tcp_timer, i40iw_cm_timer_tick, 0);
3248 spin_lock_init(&cm_core->ht_lock);
3249 spin_lock_init(&cm_core->listen_list_lock);
3250 spin_lock_init(&cm_core->apbvt_lock);
3252 cm_core->event_wq = alloc_ordered_workqueue("iwewq",
3253 WQ_MEM_RECLAIM);
3254 if (!cm_core->event_wq)
3255 goto error;
3257 cm_core->disconn_wq = alloc_ordered_workqueue("iwdwq",
3258 WQ_MEM_RECLAIM);
3259 if (!cm_core->disconn_wq)
3260 goto error;
3262 return 0;
3263 error:
3264 i40iw_cleanup_cm_core(&iwdev->cm_core);
3266 return -ENOMEM;
3270 * i40iw_cleanup_cm_core - deallocate a top level instance of a
3271 * cm core
3272 * @cm_core: cm's core
3274 void i40iw_cleanup_cm_core(struct i40iw_cm_core *cm_core)
3276 unsigned long flags;
3278 if (!cm_core)
3279 return;
3281 spin_lock_irqsave(&cm_core->ht_lock, flags);
3282 if (timer_pending(&cm_core->tcp_timer))
3283 del_timer_sync(&cm_core->tcp_timer);
3284 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3286 if (cm_core->event_wq)
3287 destroy_workqueue(cm_core->event_wq);
3288 if (cm_core->disconn_wq)
3289 destroy_workqueue(cm_core->disconn_wq);
3293 * i40iw_init_tcp_ctx - setup qp context
3294 * @cm_node: connection's node
3295 * @tcp_info: offload info for tcp
3296 * @iwqp: associate qp for the connection
3298 static void i40iw_init_tcp_ctx(struct i40iw_cm_node *cm_node,
3299 struct i40iw_tcp_offload_info *tcp_info,
3300 struct i40iw_qp *iwqp)
3302 tcp_info->ipv4 = cm_node->ipv4;
3303 tcp_info->drop_ooo_seg = true;
3304 tcp_info->wscale = true;
3305 tcp_info->ignore_tcp_opt = true;
3306 tcp_info->ignore_tcp_uns_opt = true;
3307 tcp_info->no_nagle = false;
3309 tcp_info->ttl = I40IW_DEFAULT_TTL;
3310 tcp_info->rtt_var = cpu_to_le32(I40IW_DEFAULT_RTT_VAR);
3311 tcp_info->ss_thresh = cpu_to_le32(I40IW_DEFAULT_SS_THRESH);
3312 tcp_info->rexmit_thresh = I40IW_DEFAULT_REXMIT_THRESH;
3314 tcp_info->tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3315 tcp_info->snd_wscale = cm_node->tcp_cntxt.snd_wscale;
3316 tcp_info->rcv_wscale = cm_node->tcp_cntxt.rcv_wscale;
3318 tcp_info->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3319 tcp_info->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
3320 tcp_info->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3321 tcp_info->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3323 tcp_info->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3324 tcp_info->cwnd = cpu_to_le32(2 * cm_node->tcp_cntxt.mss);
3325 tcp_info->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3326 tcp_info->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3327 tcp_info->max_snd_window = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
3328 tcp_info->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
3329 cm_node->tcp_cntxt.rcv_wscale);
3331 tcp_info->flow_label = 0;
3332 tcp_info->snd_mss = cpu_to_le32(((u32)cm_node->tcp_cntxt.mss));
3333 if (cm_node->vlan_id <= VLAN_VID_MASK) {
3334 tcp_info->insert_vlan_tag = true;
3335 tcp_info->vlan_tag = cpu_to_le16(((u16)cm_node->user_pri << I40IW_VLAN_PRIO_SHIFT) |
3336 cm_node->vlan_id);
3338 if (cm_node->ipv4) {
3339 tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3340 tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3342 tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[0]);
3343 tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[0]);
3344 tcp_info->arp_idx =
3345 cpu_to_le16((u16)i40iw_arp_table(
3346 iwqp->iwdev,
3347 &tcp_info->dest_ip_addr3,
3348 true,
3349 NULL,
3350 I40IW_ARP_RESOLVE));
3351 } else {
3352 tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3353 tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3354 tcp_info->dest_ip_addr0 = cpu_to_le32(cm_node->rem_addr[0]);
3355 tcp_info->dest_ip_addr1 = cpu_to_le32(cm_node->rem_addr[1]);
3356 tcp_info->dest_ip_addr2 = cpu_to_le32(cm_node->rem_addr[2]);
3357 tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[3]);
3358 tcp_info->local_ipaddr0 = cpu_to_le32(cm_node->loc_addr[0]);
3359 tcp_info->local_ipaddr1 = cpu_to_le32(cm_node->loc_addr[1]);
3360 tcp_info->local_ipaddr2 = cpu_to_le32(cm_node->loc_addr[2]);
3361 tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[3]);
3362 tcp_info->arp_idx =
3363 cpu_to_le16((u16)i40iw_arp_table(
3364 iwqp->iwdev,
3365 &tcp_info->dest_ip_addr0,
3366 false,
3367 NULL,
3368 I40IW_ARP_RESOLVE));
3373 * i40iw_cm_init_tsa_conn - setup qp for RTS
3374 * @iwqp: associate qp for the connection
3375 * @cm_node: connection's node
3377 static void i40iw_cm_init_tsa_conn(struct i40iw_qp *iwqp,
3378 struct i40iw_cm_node *cm_node)
3380 struct i40iw_tcp_offload_info tcp_info;
3381 struct i40iwarp_offload_info *iwarp_info;
3382 struct i40iw_qp_host_ctx_info *ctx_info;
3383 struct i40iw_device *iwdev = iwqp->iwdev;
3384 struct i40iw_sc_dev *dev = &iwqp->iwdev->sc_dev;
3386 memset(&tcp_info, 0x00, sizeof(struct i40iw_tcp_offload_info));
3387 iwarp_info = &iwqp->iwarp_info;
3388 ctx_info = &iwqp->ctx_info;
3390 ctx_info->tcp_info = &tcp_info;
3391 ctx_info->send_cq_num = iwqp->iwscq->sc_cq.cq_uk.cq_id;
3392 ctx_info->rcv_cq_num = iwqp->iwrcq->sc_cq.cq_uk.cq_id;
3394 iwarp_info->ord_size = cm_node->ord_size;
3395 iwarp_info->ird_size = i40iw_derive_hw_ird_setting(cm_node->ird_size);
3397 if (iwarp_info->ord_size == 1)
3398 iwarp_info->ord_size = 2;
3400 iwarp_info->rd_enable = true;
3401 iwarp_info->rdmap_ver = 1;
3402 iwarp_info->ddp_ver = 1;
3404 iwarp_info->pd_id = iwqp->iwpd->sc_pd.pd_id;
3406 ctx_info->tcp_info_valid = true;
3407 ctx_info->iwarp_info_valid = true;
3408 ctx_info->add_to_qoslist = true;
3409 ctx_info->user_pri = cm_node->user_pri;
3411 i40iw_init_tcp_ctx(cm_node, &tcp_info, iwqp);
3412 if (cm_node->snd_mark_en) {
3413 iwarp_info->snd_mark_en = true;
3414 iwarp_info->snd_mark_offset = (tcp_info.snd_nxt &
3415 SNDMARKER_SEQNMASK) + cm_node->lsmm_size;
3418 cm_node->state = I40IW_CM_STATE_OFFLOADED;
3419 tcp_info.tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3420 tcp_info.src_mac_addr_idx = iwdev->mac_ip_table_idx;
3421 tcp_info.tos = cm_node->tos;
3423 dev->iw_priv_qp_ops->qp_setctx(&iwqp->sc_qp, (u64 *)(iwqp->host_ctx.va), ctx_info);
3425 /* once tcp_info is set, no need to do it again */
3426 ctx_info->tcp_info_valid = false;
3427 ctx_info->iwarp_info_valid = false;
3428 ctx_info->add_to_qoslist = false;
3432 * i40iw_cm_disconn - when a connection is being closed
3433 * @iwqp: associate qp for the connection
3435 void i40iw_cm_disconn(struct i40iw_qp *iwqp)
3437 struct disconn_work *work;
3438 struct i40iw_device *iwdev = iwqp->iwdev;
3439 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3440 unsigned long flags;
3442 work = kzalloc(sizeof(*work), GFP_ATOMIC);
3443 if (!work)
3444 return; /* Timer will clean up */
3446 spin_lock_irqsave(&iwdev->qptable_lock, flags);
3447 if (!iwdev->qp_table[iwqp->ibqp.qp_num]) {
3448 spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3449 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
3450 "%s qp_id %d is already freed\n",
3451 __func__, iwqp->ibqp.qp_num);
3452 kfree(work);
3453 return;
3455 i40iw_qp_add_ref(&iwqp->ibqp);
3456 spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3458 work->iwqp = iwqp;
3459 INIT_WORK(&work->work, i40iw_disconnect_worker);
3460 queue_work(cm_core->disconn_wq, &work->work);
3461 return;
3465 * i40iw_qp_disconnect - free qp and close cm
3466 * @iwqp: associate qp for the connection
3468 static void i40iw_qp_disconnect(struct i40iw_qp *iwqp)
3470 struct i40iw_device *iwdev;
3471 struct i40iw_ib_device *iwibdev;
3473 iwdev = to_iwdev(iwqp->ibqp.device);
3474 if (!iwdev) {
3475 i40iw_pr_err("iwdev == NULL\n");
3476 return;
3479 iwibdev = iwdev->iwibdev;
3481 if (iwqp->active_conn) {
3482 /* indicate this connection is NOT active */
3483 iwqp->active_conn = 0;
3484 } else {
3485 /* Need to free the Last Streaming Mode Message */
3486 if (iwqp->ietf_mem.va) {
3487 if (iwqp->lsmm_mr)
3488 iwibdev->ibdev.ops.dereg_mr(iwqp->lsmm_mr,
3489 NULL);
3490 i40iw_free_dma_mem(iwdev->sc_dev.hw, &iwqp->ietf_mem);
3494 /* close the CM node down if it is still active */
3495 if (iwqp->cm_node) {
3496 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "%s Call close API\n", __func__);
3497 i40iw_cm_close(iwqp->cm_node);
3502 * i40iw_cm_disconn_true - called by worker thread to disconnect qp
3503 * @iwqp: associate qp for the connection
3505 static void i40iw_cm_disconn_true(struct i40iw_qp *iwqp)
3507 struct iw_cm_id *cm_id;
3508 struct i40iw_device *iwdev;
3509 struct i40iw_sc_qp *qp = &iwqp->sc_qp;
3510 u16 last_ae;
3511 u8 original_hw_tcp_state;
3512 u8 original_ibqp_state;
3513 int disconn_status = 0;
3514 int issue_disconn = 0;
3515 int issue_close = 0;
3516 int issue_flush = 0;
3517 struct ib_event ibevent;
3518 unsigned long flags;
3519 int ret;
3521 if (!iwqp) {
3522 i40iw_pr_err("iwqp == NULL\n");
3523 return;
3526 spin_lock_irqsave(&iwqp->lock, flags);
3527 cm_id = iwqp->cm_id;
3528 /* make sure we havent already closed this connection */
3529 if (!cm_id) {
3530 spin_unlock_irqrestore(&iwqp->lock, flags);
3531 return;
3534 iwdev = to_iwdev(iwqp->ibqp.device);
3536 original_hw_tcp_state = iwqp->hw_tcp_state;
3537 original_ibqp_state = iwqp->ibqp_state;
3538 last_ae = iwqp->last_aeq;
3540 if (qp->term_flags) {
3541 issue_disconn = 1;
3542 issue_close = 1;
3543 iwqp->cm_id = NULL;
3544 /*When term timer expires after cm_timer, don't want
3545 *terminate-handler to issue cm_disconn which can re-free
3546 *a QP even after its refcnt=0.
3548 i40iw_terminate_del_timer(qp);
3549 if (!iwqp->flush_issued) {
3550 iwqp->flush_issued = 1;
3551 issue_flush = 1;
3553 } else if ((original_hw_tcp_state == I40IW_TCP_STATE_CLOSE_WAIT) ||
3554 ((original_ibqp_state == IB_QPS_RTS) &&
3555 (last_ae == I40IW_AE_LLP_CONNECTION_RESET))) {
3556 issue_disconn = 1;
3557 if (last_ae == I40IW_AE_LLP_CONNECTION_RESET)
3558 disconn_status = -ECONNRESET;
3561 if (((original_hw_tcp_state == I40IW_TCP_STATE_CLOSED) ||
3562 (original_hw_tcp_state == I40IW_TCP_STATE_TIME_WAIT) ||
3563 (last_ae == I40IW_AE_RDMAP_ROE_BAD_LLP_CLOSE) ||
3564 (last_ae == I40IW_AE_LLP_CONNECTION_RESET) ||
3565 iwdev->reset)) {
3566 issue_close = 1;
3567 iwqp->cm_id = NULL;
3568 if (!iwqp->flush_issued) {
3569 iwqp->flush_issued = 1;
3570 issue_flush = 1;
3574 spin_unlock_irqrestore(&iwqp->lock, flags);
3575 if (issue_flush && !iwqp->destroyed) {
3576 /* Flush the queues */
3577 i40iw_flush_wqes(iwdev, iwqp);
3579 if (qp->term_flags && iwqp->ibqp.event_handler) {
3580 ibevent.device = iwqp->ibqp.device;
3581 ibevent.event = (qp->eventtype == TERM_EVENT_QP_FATAL) ?
3582 IB_EVENT_QP_FATAL : IB_EVENT_QP_ACCESS_ERR;
3583 ibevent.element.qp = &iwqp->ibqp;
3584 iwqp->ibqp.event_handler(&ibevent, iwqp->ibqp.qp_context);
3588 if (cm_id && cm_id->event_handler) {
3589 if (issue_disconn) {
3590 ret = i40iw_send_cm_event(NULL,
3591 cm_id,
3592 IW_CM_EVENT_DISCONNECT,
3593 disconn_status);
3595 if (ret)
3596 i40iw_debug(&iwdev->sc_dev,
3597 I40IW_DEBUG_CM,
3598 "disconnect event failed %s: - cm_id = %p\n",
3599 __func__, cm_id);
3601 if (issue_close) {
3602 i40iw_qp_disconnect(iwqp);
3603 cm_id->provider_data = iwqp;
3604 ret = i40iw_send_cm_event(NULL, cm_id, IW_CM_EVENT_CLOSE, 0);
3605 if (ret)
3606 i40iw_debug(&iwdev->sc_dev,
3607 I40IW_DEBUG_CM,
3608 "close event failed %s: - cm_id = %p\n",
3609 __func__, cm_id);
3610 cm_id->rem_ref(cm_id);
3616 * i40iw_disconnect_worker - worker for connection close
3617 * @work: points or disconn structure
3619 static void i40iw_disconnect_worker(struct work_struct *work)
3621 struct disconn_work *dwork = container_of(work, struct disconn_work, work);
3622 struct i40iw_qp *iwqp = dwork->iwqp;
3624 kfree(dwork);
3625 i40iw_cm_disconn_true(iwqp);
3626 i40iw_qp_rem_ref(&iwqp->ibqp);
3630 * i40iw_accept - registered call for connection to be accepted
3631 * @cm_id: cm information for passive connection
3632 * @conn_param: accpet parameters
3634 int i40iw_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3636 struct ib_qp *ibqp;
3637 struct i40iw_qp *iwqp;
3638 struct i40iw_device *iwdev;
3639 struct i40iw_sc_dev *dev;
3640 struct i40iw_cm_core *cm_core;
3641 struct i40iw_cm_node *cm_node;
3642 struct ib_qp_attr attr;
3643 int passive_state;
3644 struct ib_mr *ibmr;
3645 struct i40iw_pd *iwpd;
3646 u16 buf_len = 0;
3647 struct i40iw_kmem_info accept;
3648 enum i40iw_status_code status;
3649 u64 tagged_offset;
3650 unsigned long flags;
3652 memset(&attr, 0, sizeof(attr));
3653 ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3654 if (!ibqp)
3655 return -EINVAL;
3657 iwqp = to_iwqp(ibqp);
3658 iwdev = iwqp->iwdev;
3659 dev = &iwdev->sc_dev;
3660 cm_core = &iwdev->cm_core;
3661 cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3663 if (((struct sockaddr_in *)&cm_id->local_addr)->sin_family == AF_INET) {
3664 cm_node->ipv4 = true;
3665 cm_node->vlan_id = i40iw_get_vlan_ipv4(cm_node->loc_addr);
3666 } else {
3667 cm_node->ipv4 = false;
3668 i40iw_netdev_vlan_ipv6(cm_node->loc_addr, &cm_node->vlan_id);
3670 i40iw_debug(cm_node->dev,
3671 I40IW_DEBUG_CM,
3672 "Accept vlan_id=%d\n",
3673 cm_node->vlan_id);
3674 if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3675 if (cm_node->loopbackpartner)
3676 i40iw_rem_ref_cm_node(cm_node->loopbackpartner);
3677 i40iw_rem_ref_cm_node(cm_node);
3678 return -EINVAL;
3681 passive_state = atomic_inc_return(&cm_node->passive_state);
3682 if (passive_state == I40IW_SEND_RESET_EVENT) {
3683 i40iw_rem_ref_cm_node(cm_node);
3684 return -ECONNRESET;
3687 cm_node->cm_core->stats_accepts++;
3688 iwqp->cm_node = (void *)cm_node;
3689 cm_node->iwqp = iwqp;
3691 buf_len = conn_param->private_data_len + I40IW_MAX_IETF_SIZE;
3693 status = i40iw_allocate_dma_mem(dev->hw, &iwqp->ietf_mem, buf_len, 1);
3695 if (status)
3696 return -ENOMEM;
3697 cm_node->pdata.size = conn_param->private_data_len;
3698 accept.addr = iwqp->ietf_mem.va;
3699 accept.size = i40iw_cm_build_mpa_frame(cm_node, &accept, MPA_KEY_REPLY);
3700 memcpy(accept.addr + accept.size, conn_param->private_data,
3701 conn_param->private_data_len);
3703 /* setup our first outgoing iWarp send WQE (the IETF frame response) */
3704 if ((cm_node->ipv4 &&
3705 !i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
3706 (!cm_node->ipv4 &&
3707 !i40iw_ipv6_is_loopback(cm_node->loc_addr, cm_node->rem_addr))) {
3708 iwpd = iwqp->iwpd;
3709 tagged_offset = (uintptr_t)iwqp->ietf_mem.va;
3710 ibmr = i40iw_reg_phys_mr(&iwpd->ibpd,
3711 iwqp->ietf_mem.pa,
3712 buf_len,
3713 IB_ACCESS_LOCAL_WRITE,
3714 &tagged_offset);
3715 if (IS_ERR(ibmr)) {
3716 i40iw_free_dma_mem(dev->hw, &iwqp->ietf_mem);
3717 return -ENOMEM;
3720 ibmr->pd = &iwpd->ibpd;
3721 ibmr->device = iwpd->ibpd.device;
3722 iwqp->lsmm_mr = ibmr;
3723 if (iwqp->page)
3724 iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
3725 dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp,
3726 iwqp->ietf_mem.va,
3727 (accept.size + conn_param->private_data_len),
3728 ibmr->lkey);
3730 } else {
3731 if (iwqp->page)
3732 iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
3733 dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp, NULL, 0, 0);
3736 if (iwqp->page)
3737 kunmap(iwqp->page);
3739 iwqp->cm_id = cm_id;
3740 cm_node->cm_id = cm_id;
3742 cm_id->provider_data = (void *)iwqp;
3743 iwqp->active_conn = 0;
3745 cm_node->lsmm_size = accept.size + conn_param->private_data_len;
3746 i40iw_cm_init_tsa_conn(iwqp, cm_node);
3747 cm_id->add_ref(cm_id);
3748 i40iw_qp_add_ref(&iwqp->ibqp);
3750 attr.qp_state = IB_QPS_RTS;
3751 cm_node->qhash_set = false;
3752 i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
3754 cm_node->accelerated = true;
3755 spin_lock_irqsave(&cm_core->ht_lock, flags);
3756 list_move_tail(&cm_node->list, &cm_core->accelerated_list);
3757 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3759 status =
3760 i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_ESTABLISHED, 0);
3761 if (status)
3762 i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - ESTABLISHED\n");
3764 if (cm_node->loopbackpartner) {
3765 cm_node->loopbackpartner->pdata.size = conn_param->private_data_len;
3767 /* copy entire MPA frame to our cm_node's frame */
3768 memcpy(cm_node->loopbackpartner->pdata_buf,
3769 conn_param->private_data,
3770 conn_param->private_data_len);
3771 i40iw_create_event(cm_node->loopbackpartner, I40IW_CM_EVENT_CONNECTED);
3774 if (cm_node->accept_pend) {
3775 atomic_dec(&cm_node->listener->pend_accepts_cnt);
3776 cm_node->accept_pend = 0;
3778 return 0;
3782 * i40iw_reject - registered call for connection to be rejected
3783 * @cm_id: cm information for passive connection
3784 * @pdata: private data to be sent
3785 * @pdata_len: private data length
3787 int i40iw_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
3789 struct i40iw_device *iwdev;
3790 struct i40iw_cm_node *cm_node;
3791 struct i40iw_cm_node *loopback;
3793 cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3794 loopback = cm_node->loopbackpartner;
3795 cm_node->cm_id = cm_id;
3796 cm_node->pdata.size = pdata_len;
3798 iwdev = to_iwdev(cm_id->device);
3799 if (!iwdev)
3800 return -EINVAL;
3801 cm_node->cm_core->stats_rejects++;
3803 if (pdata_len + sizeof(struct ietf_mpa_v2) > MAX_CM_BUFFER)
3804 return -EINVAL;
3806 if (loopback) {
3807 memcpy(&loopback->pdata_buf, pdata, pdata_len);
3808 loopback->pdata.size = pdata_len;
3811 return i40iw_cm_reject(cm_node, pdata, pdata_len);
3815 * i40iw_connect - registered call for connection to be established
3816 * @cm_id: cm information for passive connection
3817 * @conn_param: Information about the connection
3819 int i40iw_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3821 struct ib_qp *ibqp;
3822 struct i40iw_qp *iwqp;
3823 struct i40iw_device *iwdev;
3824 struct i40iw_cm_node *cm_node;
3825 struct i40iw_cm_info cm_info;
3826 struct sockaddr_in *laddr;
3827 struct sockaddr_in *raddr;
3828 struct sockaddr_in6 *laddr6;
3829 struct sockaddr_in6 *raddr6;
3830 int ret = 0;
3832 ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3833 if (!ibqp)
3834 return -EINVAL;
3835 iwqp = to_iwqp(ibqp);
3836 if (!iwqp)
3837 return -EINVAL;
3838 iwdev = to_iwdev(iwqp->ibqp.device);
3839 if (!iwdev)
3840 return -EINVAL;
3842 laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3843 raddr = (struct sockaddr_in *)&cm_id->m_remote_addr;
3844 laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3845 raddr6 = (struct sockaddr_in6 *)&cm_id->m_remote_addr;
3847 if (!(laddr->sin_port) || !(raddr->sin_port))
3848 return -EINVAL;
3850 iwqp->active_conn = 1;
3851 iwqp->cm_id = NULL;
3852 cm_id->provider_data = iwqp;
3854 /* set up the connection params for the node */
3855 if (cm_id->remote_addr.ss_family == AF_INET) {
3856 cm_info.ipv4 = true;
3857 memset(cm_info.loc_addr, 0, sizeof(cm_info.loc_addr));
3858 memset(cm_info.rem_addr, 0, sizeof(cm_info.rem_addr));
3859 cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3860 cm_info.rem_addr[0] = ntohl(raddr->sin_addr.s_addr);
3861 cm_info.loc_port = ntohs(laddr->sin_port);
3862 cm_info.rem_port = ntohs(raddr->sin_port);
3863 cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3864 } else {
3865 cm_info.ipv4 = false;
3866 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3867 laddr6->sin6_addr.in6_u.u6_addr32);
3868 i40iw_copy_ip_ntohl(cm_info.rem_addr,
3869 raddr6->sin6_addr.in6_u.u6_addr32);
3870 cm_info.loc_port = ntohs(laddr6->sin6_port);
3871 cm_info.rem_port = ntohs(raddr6->sin6_port);
3872 i40iw_netdev_vlan_ipv6(cm_info.loc_addr, &cm_info.vlan_id);
3874 cm_info.cm_id = cm_id;
3875 cm_info.tos = cm_id->tos;
3876 cm_info.user_pri = rt_tos2priority(cm_id->tos);
3877 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "%s TOS:[%d] UP:[%d]\n",
3878 __func__, cm_id->tos, cm_info.user_pri);
3879 cm_id->add_ref(cm_id);
3880 cm_node = i40iw_create_cm_node(&iwdev->cm_core, iwdev,
3881 conn_param, &cm_info);
3883 if (IS_ERR(cm_node)) {
3884 ret = PTR_ERR(cm_node);
3885 cm_id->rem_ref(cm_id);
3886 return ret;
3889 if ((cm_info.ipv4 && (laddr->sin_addr.s_addr != raddr->sin_addr.s_addr)) ||
3890 (!cm_info.ipv4 && memcmp(laddr6->sin6_addr.in6_u.u6_addr32,
3891 raddr6->sin6_addr.in6_u.u6_addr32,
3892 sizeof(laddr6->sin6_addr.in6_u.u6_addr32)))) {
3893 if (i40iw_manage_qhash(iwdev, &cm_info, I40IW_QHASH_TYPE_TCP_ESTABLISHED,
3894 I40IW_QHASH_MANAGE_TYPE_ADD, NULL, true)) {
3895 ret = -EINVAL;
3896 goto err;
3898 cm_node->qhash_set = true;
3901 if (i40iw_manage_apbvt(iwdev, cm_info.loc_port,
3902 I40IW_MANAGE_APBVT_ADD)) {
3903 ret = -EINVAL;
3904 goto err;
3907 cm_node->apbvt_set = true;
3908 iwqp->cm_node = cm_node;
3909 cm_node->iwqp = iwqp;
3910 iwqp->cm_id = cm_id;
3911 i40iw_qp_add_ref(&iwqp->ibqp);
3913 if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
3914 cm_node->state = I40IW_CM_STATE_SYN_SENT;
3915 ret = i40iw_send_syn(cm_node, 0);
3916 if (ret)
3917 goto err;
3920 if (cm_node->loopbackpartner) {
3921 cm_node->loopbackpartner->state = I40IW_CM_STATE_MPAREQ_RCVD;
3922 i40iw_create_event(cm_node->loopbackpartner,
3923 I40IW_CM_EVENT_MPA_REQ);
3926 i40iw_debug(cm_node->dev,
3927 I40IW_DEBUG_CM,
3928 "Api - connect(): port=0x%04x, cm_node=%p, cm_id = %p.\n",
3929 cm_node->rem_port,
3930 cm_node,
3931 cm_node->cm_id);
3933 return 0;
3935 err:
3936 if (cm_info.ipv4)
3937 i40iw_debug(&iwdev->sc_dev,
3938 I40IW_DEBUG_CM,
3939 "Api - connect() FAILED: dest addr=%pI4",
3940 cm_info.rem_addr);
3941 else
3942 i40iw_debug(&iwdev->sc_dev,
3943 I40IW_DEBUG_CM,
3944 "Api - connect() FAILED: dest addr=%pI6",
3945 cm_info.rem_addr);
3947 i40iw_rem_ref_cm_node(cm_node);
3948 cm_id->rem_ref(cm_id);
3949 iwdev->cm_core.stats_connect_errs++;
3950 return ret;
3954 * i40iw_create_listen - registered call creating listener
3955 * @cm_id: cm information for passive connection
3956 * @backlog: to max accept pending count
3958 int i40iw_create_listen(struct iw_cm_id *cm_id, int backlog)
3960 struct i40iw_device *iwdev;
3961 struct i40iw_cm_listener *cm_listen_node;
3962 struct i40iw_cm_info cm_info;
3963 enum i40iw_status_code ret;
3964 struct sockaddr_in *laddr;
3965 struct sockaddr_in6 *laddr6;
3966 bool wildcard = false;
3968 iwdev = to_iwdev(cm_id->device);
3969 if (!iwdev)
3970 return -EINVAL;
3972 laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3973 laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3974 memset(&cm_info, 0, sizeof(cm_info));
3975 if (laddr->sin_family == AF_INET) {
3976 cm_info.ipv4 = true;
3977 cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3978 cm_info.loc_port = ntohs(laddr->sin_port);
3980 if (laddr->sin_addr.s_addr != INADDR_ANY)
3981 cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3982 else
3983 wildcard = true;
3985 } else {
3986 cm_info.ipv4 = false;
3987 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3988 laddr6->sin6_addr.in6_u.u6_addr32);
3989 cm_info.loc_port = ntohs(laddr6->sin6_port);
3990 if (ipv6_addr_type(&laddr6->sin6_addr) != IPV6_ADDR_ANY)
3991 i40iw_netdev_vlan_ipv6(cm_info.loc_addr,
3992 &cm_info.vlan_id);
3993 else
3994 wildcard = true;
3996 cm_info.backlog = backlog;
3997 cm_info.cm_id = cm_id;
3999 cm_listen_node = i40iw_make_listen_node(&iwdev->cm_core, iwdev, &cm_info);
4000 if (!cm_listen_node) {
4001 i40iw_pr_err("cm_listen_node == NULL\n");
4002 return -ENOMEM;
4005 cm_id->provider_data = cm_listen_node;
4007 cm_listen_node->tos = cm_id->tos;
4008 cm_listen_node->user_pri = rt_tos2priority(cm_id->tos);
4009 cm_info.user_pri = cm_listen_node->user_pri;
4011 if (!cm_listen_node->reused_node) {
4012 if (wildcard) {
4013 if (cm_info.ipv4)
4014 ret = i40iw_add_mqh_4(iwdev,
4015 &cm_info,
4016 cm_listen_node);
4017 else
4018 ret = i40iw_add_mqh_6(iwdev,
4019 &cm_info,
4020 cm_listen_node);
4021 if (ret)
4022 goto error;
4024 ret = i40iw_manage_apbvt(iwdev,
4025 cm_info.loc_port,
4026 I40IW_MANAGE_APBVT_ADD);
4028 if (ret)
4029 goto error;
4030 } else {
4031 ret = i40iw_manage_qhash(iwdev,
4032 &cm_info,
4033 I40IW_QHASH_TYPE_TCP_SYN,
4034 I40IW_QHASH_MANAGE_TYPE_ADD,
4035 NULL,
4036 true);
4037 if (ret)
4038 goto error;
4039 cm_listen_node->qhash_set = true;
4040 ret = i40iw_manage_apbvt(iwdev,
4041 cm_info.loc_port,
4042 I40IW_MANAGE_APBVT_ADD);
4043 if (ret)
4044 goto error;
4047 cm_id->add_ref(cm_id);
4048 cm_listen_node->cm_core->stats_listen_created++;
4049 return 0;
4050 error:
4051 i40iw_cm_del_listen(&iwdev->cm_core, (void *)cm_listen_node, false);
4052 return -EINVAL;
4056 * i40iw_destroy_listen - registered call to destroy listener
4057 * @cm_id: cm information for passive connection
4059 int i40iw_destroy_listen(struct iw_cm_id *cm_id)
4061 struct i40iw_device *iwdev;
4063 iwdev = to_iwdev(cm_id->device);
4064 if (cm_id->provider_data)
4065 i40iw_cm_del_listen(&iwdev->cm_core, cm_id->provider_data, true);
4066 else
4067 i40iw_pr_err("cm_id->provider_data was NULL\n");
4069 cm_id->rem_ref(cm_id);
4071 return 0;
4075 * i40iw_cm_event_connected - handle connected active node
4076 * @event: the info for cm_node of connection
4078 static void i40iw_cm_event_connected(struct i40iw_cm_event *event)
4080 struct i40iw_qp *iwqp;
4081 struct i40iw_device *iwdev;
4082 struct i40iw_cm_core *cm_core;
4083 struct i40iw_cm_node *cm_node;
4084 struct i40iw_sc_dev *dev;
4085 struct ib_qp_attr attr;
4086 struct iw_cm_id *cm_id;
4087 unsigned long flags;
4088 int status;
4089 bool read0;
4091 cm_node = event->cm_node;
4092 cm_id = cm_node->cm_id;
4093 iwqp = (struct i40iw_qp *)cm_id->provider_data;
4094 iwdev = to_iwdev(iwqp->ibqp.device);
4095 dev = &iwdev->sc_dev;
4096 cm_core = &iwdev->cm_core;
4098 if (iwqp->destroyed) {
4099 status = -ETIMEDOUT;
4100 goto error;
4102 i40iw_cm_init_tsa_conn(iwqp, cm_node);
4103 read0 = (cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO);
4104 if (iwqp->page)
4105 iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
4106 dev->iw_priv_qp_ops->qp_send_rtt(&iwqp->sc_qp, read0);
4107 if (iwqp->page)
4108 kunmap(iwqp->page);
4110 memset(&attr, 0, sizeof(attr));
4111 attr.qp_state = IB_QPS_RTS;
4112 cm_node->qhash_set = false;
4113 i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4115 cm_node->accelerated = true;
4116 spin_lock_irqsave(&cm_core->ht_lock, flags);
4117 list_move_tail(&cm_node->list, &cm_core->accelerated_list);
4118 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4119 status = i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_CONNECT_REPLY,
4121 if (status)
4122 i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - CONNECT_REPLY\n");
4124 return;
4126 error:
4127 iwqp->cm_id = NULL;
4128 cm_id->provider_data = NULL;
4129 i40iw_send_cm_event(event->cm_node,
4130 cm_id,
4131 IW_CM_EVENT_CONNECT_REPLY,
4132 status);
4133 cm_id->rem_ref(cm_id);
4134 i40iw_rem_ref_cm_node(event->cm_node);
4138 * i40iw_cm_event_reset - handle reset
4139 * @event: the info for cm_node of connection
4141 static void i40iw_cm_event_reset(struct i40iw_cm_event *event)
4143 struct i40iw_cm_node *cm_node = event->cm_node;
4144 struct iw_cm_id *cm_id = cm_node->cm_id;
4145 struct i40iw_qp *iwqp;
4147 if (!cm_id)
4148 return;
4150 iwqp = cm_id->provider_data;
4151 if (!iwqp)
4152 return;
4154 i40iw_debug(cm_node->dev,
4155 I40IW_DEBUG_CM,
4156 "reset event %p - cm_id = %p\n",
4157 event->cm_node, cm_id);
4158 iwqp->cm_id = NULL;
4160 i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_DISCONNECT, -ECONNRESET);
4161 i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_CLOSE, 0);
/**
 * i40iw_cm_event_handler - worker thread callback to send event to cm upper layer
 * @work: pointer of cm event info.
 *
 * Dispatches on the event type, then drops the cm_id and cm_node
 * references and frees the event.
 */
static void i40iw_cm_event_handler(struct work_struct *work)
{
	struct i40iw_cm_event *event = container_of(work,
						    struct i40iw_cm_event,
						    event_work);
	struct i40iw_cm_node *cm_node;

	if (!event || !event->cm_node || !event->cm_node->cm_core)
		return;

	cm_node = event->cm_node;

	switch (event->type) {
	case I40IW_CM_EVENT_MPA_REQ:
		i40iw_send_cm_event(cm_node,
				    cm_node->cm_id,
				    IW_CM_EVENT_CONNECT_REQUEST,
				    0);
		break;
	case I40IW_CM_EVENT_RESET:
		i40iw_cm_event_reset(event);
		break;
	case I40IW_CM_EVENT_CONNECTED:
		/* only meaningful for an offloaded node that still has a cm_id */
		if (cm_node->cm_id &&
		    cm_node->state == I40IW_CM_STATE_OFFLOADED)
			i40iw_cm_event_connected(event);
		break;
	case I40IW_CM_EVENT_MPA_REJECT:
		/* ignored once the node is offloaded or has lost its cm_id */
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_send_cm_event(cm_node,
					    cm_node->cm_id,
					    IW_CM_EVENT_CONNECT_REPLY,
					    -ECONNREFUSED);
		break;
	case I40IW_CM_EVENT_ABORTED:
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_event_connect_error(event);
		break;
	default:
		i40iw_pr_err("event type = %d\n", event->type);
		break;
	}

	event->cm_info.cm_id->rem_ref(event->cm_info.cm_id);
	i40iw_rem_ref_cm_node(event->cm_node);
	kfree(event);
}
4222 * i40iw_cm_post_event - queue event request for worker thread
4223 * @event: cm node's info for up event call
4225 static void i40iw_cm_post_event(struct i40iw_cm_event *event)
4227 atomic_inc(&event->cm_node->ref_count);
4228 event->cm_info.cm_id->add_ref(event->cm_info.cm_id);
4229 INIT_WORK(&event->event_work, i40iw_cm_event_handler);
4231 queue_work(event->cm_node->cm_core->event_wq, &event->event_work);
4235 * i40iw_qhash_ctrl - enable/disable qhash for list
4236 * @iwdev: device pointer
4237 * @parent_listen_node: parent listen node
4238 * @nfo: cm info node
4239 * @ipaddr: Pointer to IPv4 or IPv6 address
4240 * @ipv4: flag indicating IPv4 when true
4241 * @ifup: flag indicating interface up when true
4243 * Enables or disables the qhash for the node in the child
4244 * listen list that matches ipaddr. If no matching IP was found
4245 * it will allocate and add a new child listen node to the
4246 * parent listen node. The listen_list_lock is assumed to be
4247 * held when called.
4249 static void i40iw_qhash_ctrl(struct i40iw_device *iwdev,
4250 struct i40iw_cm_listener *parent_listen_node,
4251 struct i40iw_cm_info *nfo,
4252 u32 *ipaddr, bool ipv4, bool ifup)
4254 struct list_head *child_listen_list = &parent_listen_node->child_listen_list;
4255 struct i40iw_cm_listener *child_listen_node;
4256 struct list_head *pos, *tpos;
4257 enum i40iw_status_code ret;
4258 bool node_allocated = false;
4259 enum i40iw_quad_hash_manage_type op =
4260 ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4262 list_for_each_safe(pos, tpos, child_listen_list) {
4263 child_listen_node =
4264 list_entry(pos,
4265 struct i40iw_cm_listener,
4266 child_listen_list);
4267 if (!memcmp(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16))
4268 goto set_qhash;
4271 /* if not found then add a child listener if interface is going up */
4272 if (!ifup)
4273 return;
4274 child_listen_node = kmemdup(parent_listen_node,
4275 sizeof(*child_listen_node), GFP_ATOMIC);
4276 if (!child_listen_node)
4277 return;
4278 node_allocated = true;
4280 memcpy(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16);
4282 set_qhash:
4283 memcpy(nfo->loc_addr,
4284 child_listen_node->loc_addr,
4285 sizeof(nfo->loc_addr));
4286 nfo->vlan_id = child_listen_node->vlan_id;
4287 ret = i40iw_manage_qhash(iwdev, nfo,
4288 I40IW_QHASH_TYPE_TCP_SYN,
4290 NULL, false);
4291 if (!ret) {
4292 child_listen_node->qhash_set = ifup;
4293 if (node_allocated)
4294 list_add(&child_listen_node->child_listen_list,
4295 &parent_listen_node->child_listen_list);
4296 } else if (node_allocated) {
4297 kfree(child_listen_node);
4302 * i40iw_cm_teardown_connections - teardown QPs
4303 * @iwdev: device pointer
4304 * @ipaddr: Pointer to IPv4 or IPv6 address
4305 * @ipv4: flag indicating IPv4 when true
4306 * @disconnect_all: flag indicating disconnect all QPs
4307 * teardown QPs where source or destination addr matches ip addr
4309 void i40iw_cm_teardown_connections(struct i40iw_device *iwdev, u32 *ipaddr,
4310 struct i40iw_cm_info *nfo,
4311 bool disconnect_all)
4313 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4314 struct list_head *list_core_temp;
4315 struct list_head *list_node;
4316 struct i40iw_cm_node *cm_node;
4317 unsigned long flags;
4318 struct list_head teardown_list;
4319 struct ib_qp_attr attr;
4321 INIT_LIST_HEAD(&teardown_list);
4322 spin_lock_irqsave(&cm_core->ht_lock, flags);
4323 list_for_each_safe(list_node, list_core_temp,
4324 &cm_core->accelerated_list) {
4325 cm_node = container_of(list_node, struct i40iw_cm_node, list);
4326 if (disconnect_all ||
4327 (nfo->vlan_id == cm_node->vlan_id &&
4328 (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4329 !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4330 atomic_inc(&cm_node->ref_count);
4331 list_add(&cm_node->teardown_entry, &teardown_list);
4334 list_for_each_safe(list_node, list_core_temp,
4335 &cm_core->non_accelerated_list) {
4336 cm_node = container_of(list_node, struct i40iw_cm_node, list);
4337 if (disconnect_all ||
4338 (nfo->vlan_id == cm_node->vlan_id &&
4339 (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4340 !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4341 atomic_inc(&cm_node->ref_count);
4342 list_add(&cm_node->teardown_entry, &teardown_list);
4345 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4347 list_for_each_safe(list_node, list_core_temp, &teardown_list) {
4348 cm_node = container_of(list_node, struct i40iw_cm_node,
4349 teardown_entry);
4350 attr.qp_state = IB_QPS_ERR;
4351 i40iw_modify_qp(&cm_node->iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4352 if (iwdev->reset)
4353 i40iw_cm_disconn(cm_node->iwqp);
4354 i40iw_rem_ref_cm_node(cm_node);
4359 * i40iw_ifdown_notify - process an ifdown on an interface
4360 * @iwdev: device pointer
4361 * @ipaddr: Pointer to IPv4 or IPv6 address
4362 * @ipv4: flag indicating IPv4 when true
4363 * @ifup: flag indicating interface up when true
4365 void i40iw_if_notify(struct i40iw_device *iwdev, struct net_device *netdev,
4366 u32 *ipaddr, bool ipv4, bool ifup)
4368 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4369 unsigned long flags;
4370 struct i40iw_cm_listener *listen_node;
4371 static const u32 ip_zero[4] = { 0, 0, 0, 0 };
4372 struct i40iw_cm_info nfo;
4373 u16 vlan_id = rdma_vlan_dev_vlan_id(netdev);
4374 enum i40iw_status_code ret;
4375 enum i40iw_quad_hash_manage_type op =
4376 ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4378 nfo.vlan_id = vlan_id;
4379 nfo.ipv4 = ipv4;
4381 /* Disable or enable qhash for listeners */
4382 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
4383 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
4384 if (vlan_id == listen_node->vlan_id &&
4385 (!memcmp(listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16) ||
4386 !memcmp(listen_node->loc_addr, ip_zero, ipv4 ? 4 : 16))) {
4387 memcpy(nfo.loc_addr, listen_node->loc_addr,
4388 sizeof(nfo.loc_addr));
4389 nfo.loc_port = listen_node->loc_port;
4390 nfo.user_pri = listen_node->user_pri;
4391 if (!list_empty(&listen_node->child_listen_list)) {
4392 i40iw_qhash_ctrl(iwdev,
4393 listen_node,
4394 &nfo,
4395 ipaddr, ipv4, ifup);
4396 } else if (memcmp(listen_node->loc_addr, ip_zero,
4397 ipv4 ? 4 : 16)) {
4398 ret = i40iw_manage_qhash(iwdev,
4399 &nfo,
4400 I40IW_QHASH_TYPE_TCP_SYN,
4402 NULL,
4403 false);
4404 if (!ret)
4405 listen_node->qhash_set = ifup;
4409 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
4411 /* teardown connected qp's on ifdown */
4412 if (!ifup)
4413 i40iw_cm_teardown_connections(iwdev, ipaddr, &nfo, false);