x86, UV: Fix for nodes with memory and no cpus
[linux/fpc-iii.git] / drivers / infiniband / hw / nes / nes_cm.c
blob52425154acd48f9d4a8e3043d9b10295fe59440a
1 /*
2 * Copyright (c) 2006 - 2009 Intel-NE, Inc. All rights reserved.
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
35 #define TCPOPT_TIMESTAMP 8
37 #include <asm/atomic.h>
38 #include <linux/skbuff.h>
39 #include <linux/ip.h>
40 #include <linux/tcp.h>
41 #include <linux/init.h>
42 #include <linux/if_arp.h>
43 #include <linux/if_vlan.h>
44 #include <linux/notifier.h>
45 #include <linux/net.h>
46 #include <linux/types.h>
47 #include <linux/timer.h>
48 #include <linux/time.h>
49 #include <linux/delay.h>
50 #include <linux/etherdevice.h>
51 #include <linux/netdevice.h>
52 #include <linux/random.h>
53 #include <linux/list.h>
54 #include <linux/threads.h>
55 #include <net/arp.h>
56 #include <net/neighbour.h>
57 #include <net/route.h>
58 #include <net/ip_fib.h>
60 #include "nes.h"
62 u32 cm_packets_sent;
63 u32 cm_packets_bounced;
64 u32 cm_packets_dropped;
65 u32 cm_packets_retrans;
66 u32 cm_packets_created;
67 u32 cm_packets_received;
68 u32 cm_listens_created;
69 u32 cm_listens_destroyed;
70 u32 cm_backlog_drops;
71 atomic_t cm_loopbacks;
72 atomic_t cm_nodes_created;
73 atomic_t cm_nodes_destroyed;
74 atomic_t cm_accel_dropped_pkts;
75 atomic_t cm_resets_recvd;
77 static inline int mini_cm_accelerated(struct nes_cm_core *,
78 struct nes_cm_node *);
79 static struct nes_cm_listener *mini_cm_listen(struct nes_cm_core *,
80 struct nes_vnic *, struct nes_cm_info *);
81 static int mini_cm_del_listen(struct nes_cm_core *, struct nes_cm_listener *);
82 static struct nes_cm_node *mini_cm_connect(struct nes_cm_core *,
83 struct nes_vnic *, u16, void *, struct nes_cm_info *);
84 static int mini_cm_close(struct nes_cm_core *, struct nes_cm_node *);
85 static int mini_cm_accept(struct nes_cm_core *, struct ietf_mpa_frame *,
86 struct nes_cm_node *);
87 static int mini_cm_reject(struct nes_cm_core *, struct ietf_mpa_frame *,
88 struct nes_cm_node *);
89 static int mini_cm_recv_pkt(struct nes_cm_core *, struct nes_vnic *,
90 struct sk_buff *);
91 static int mini_cm_dealloc_core(struct nes_cm_core *);
92 static int mini_cm_get(struct nes_cm_core *);
93 static int mini_cm_set(struct nes_cm_core *, u32, u32);
95 static void form_cm_frame(struct sk_buff *, struct nes_cm_node *,
96 void *, u32, void *, u32, u8);
97 static int add_ref_cm_node(struct nes_cm_node *);
98 static int rem_ref_cm_node(struct nes_cm_core *, struct nes_cm_node *);
100 static int nes_cm_disconn_true(struct nes_qp *);
101 static int nes_cm_post_event(struct nes_cm_event *event);
102 static int nes_disconnect(struct nes_qp *nesqp, int abrupt);
103 static void nes_disconnect_worker(struct work_struct *work);
105 static int send_mpa_request(struct nes_cm_node *, struct sk_buff *);
106 static int send_mpa_reject(struct nes_cm_node *);
107 static int send_syn(struct nes_cm_node *, u32, struct sk_buff *);
108 static int send_reset(struct nes_cm_node *, struct sk_buff *);
109 static int send_ack(struct nes_cm_node *cm_node, struct sk_buff *skb);
110 static int send_fin(struct nes_cm_node *cm_node, struct sk_buff *skb);
111 static void process_packet(struct nes_cm_node *, struct sk_buff *,
112 struct nes_cm_core *);
114 static void active_open_err(struct nes_cm_node *, struct sk_buff *, int);
115 static void passive_open_err(struct nes_cm_node *, struct sk_buff *, int);
116 static void cleanup_retrans_entry(struct nes_cm_node *);
117 static void handle_rcv_mpa(struct nes_cm_node *, struct sk_buff *);
118 static void free_retrans_entry(struct nes_cm_node *cm_node);
119 static int handle_tcp_options(struct nes_cm_node *cm_node, struct tcphdr *tcph,
120 struct sk_buff *skb, int optionsize, int passive);
122 /* CM event handler functions */
123 static void cm_event_connected(struct nes_cm_event *);
124 static void cm_event_connect_error(struct nes_cm_event *);
125 static void cm_event_reset(struct nes_cm_event *);
126 static void cm_event_mpa_req(struct nes_cm_event *);
127 static void cm_event_mpa_reject(struct nes_cm_event *);
128 static void handle_recv_entry(struct nes_cm_node *cm_node, u32 rem_node);
130 static void print_core(struct nes_cm_core *core);
132 /* External CM API Interface */
133 /* instance of function pointers for client API */
134 /* set address of this instance to cm_core->cm_ops at cm_core alloc */
135 static struct nes_cm_ops nes_cm_api = {
136 mini_cm_accelerated,
137 mini_cm_listen,
138 mini_cm_del_listen,
139 mini_cm_connect,
140 mini_cm_close,
141 mini_cm_accept,
142 mini_cm_reject,
143 mini_cm_recv_pkt,
144 mini_cm_dealloc_core,
145 mini_cm_get,
146 mini_cm_set
149 static struct nes_cm_core *g_cm_core;
151 atomic_t cm_connects;
152 atomic_t cm_accepts;
153 atomic_t cm_disconnects;
154 atomic_t cm_closes;
155 atomic_t cm_connecteds;
156 atomic_t cm_connect_reqs;
157 atomic_t cm_rejects;
161 * create_event
163 static struct nes_cm_event *create_event(struct nes_cm_node *cm_node,
164 enum nes_cm_event_type type)
166 struct nes_cm_event *event;
168 if (!cm_node->cm_id)
169 return NULL;
171 /* allocate an empty event */
172 event = kzalloc(sizeof(*event), GFP_ATOMIC);
174 if (!event)
175 return NULL;
177 event->type = type;
178 event->cm_node = cm_node;
179 event->cm_info.rem_addr = cm_node->rem_addr;
180 event->cm_info.loc_addr = cm_node->loc_addr;
181 event->cm_info.rem_port = cm_node->rem_port;
182 event->cm_info.loc_port = cm_node->loc_port;
183 event->cm_info.cm_id = cm_node->cm_id;
185 nes_debug(NES_DBG_CM, "cm_node=%p Created event=%p, type=%u, "
186 "dst_addr=%08x[%x], src_addr=%08x[%x]\n",
187 cm_node, event, type, event->cm_info.loc_addr,
188 event->cm_info.loc_port, event->cm_info.rem_addr,
189 event->cm_info.rem_port);
191 nes_cm_post_event(event);
192 return event;
197 * send_mpa_request
199 static int send_mpa_request(struct nes_cm_node *cm_node, struct sk_buff *skb)
201 if (!skb) {
202 nes_debug(NES_DBG_CM, "skb set to NULL\n");
203 return -1;
206 /* send an MPA Request frame */
207 form_cm_frame(skb, cm_node, NULL, 0, &cm_node->mpa_frame,
208 cm_node->mpa_frame_size, SET_ACK);
210 return schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
215 static int send_mpa_reject(struct nes_cm_node *cm_node)
217 struct sk_buff *skb = NULL;
219 skb = dev_alloc_skb(MAX_CM_BUFFER);
220 if (!skb) {
221 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
222 return -ENOMEM;
225 /* send an MPA reject frame */
226 form_cm_frame(skb, cm_node, NULL, 0, &cm_node->mpa_frame,
227 cm_node->mpa_frame_size, SET_ACK | SET_FIN);
229 cm_node->state = NES_CM_STATE_FIN_WAIT1;
230 return schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
235 * recv_mpa - process a received TCP pkt, we are expecting an
236 * IETF MPA frame
238 static int parse_mpa(struct nes_cm_node *cm_node, u8 *buffer, u32 *type,
239 u32 len)
241 struct ietf_mpa_frame *mpa_frame;
243 *type = NES_MPA_REQUEST_ACCEPT;
245 /* assume req frame is in tcp data payload */
246 if (len < sizeof(struct ietf_mpa_frame)) {
247 nes_debug(NES_DBG_CM, "The received ietf buffer was too small (%x)\n", len);
248 return -EINVAL;
251 mpa_frame = (struct ietf_mpa_frame *)buffer;
252 cm_node->mpa_frame_size = ntohs(mpa_frame->priv_data_len);
254 if (cm_node->mpa_frame_size + sizeof(struct ietf_mpa_frame) != len) {
255 nes_debug(NES_DBG_CM, "The received ietf buffer was not right"
256 " complete (%x + %x != %x)\n",
257 cm_node->mpa_frame_size,
258 (u32)sizeof(struct ietf_mpa_frame), len);
259 return -EINVAL;
261 /* make sure it does not exceed the max size */
262 if (len > MAX_CM_BUFFER) {
263 nes_debug(NES_DBG_CM, "The received ietf buffer was too large"
264 " (%x + %x != %x)\n",
265 cm_node->mpa_frame_size,
266 (u32)sizeof(struct ietf_mpa_frame), len);
267 return -EINVAL;
270 /* copy entire MPA frame to our cm_node's frame */
271 memcpy(cm_node->mpa_frame_buf, buffer + sizeof(struct ietf_mpa_frame),
272 cm_node->mpa_frame_size);
274 if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
275 *type = NES_MPA_REQUEST_REJECT;
276 return 0;
281 * form_cm_frame - get a free packet and build empty frame Use
282 * node info to build.
284 static void form_cm_frame(struct sk_buff *skb,
285 struct nes_cm_node *cm_node, void *options, u32 optionsize,
286 void *data, u32 datasize, u8 flags)
288 struct tcphdr *tcph;
289 struct iphdr *iph;
290 struct ethhdr *ethh;
291 u8 *buf;
292 u16 packetsize = sizeof(*iph);
294 packetsize += sizeof(*tcph);
295 packetsize += optionsize + datasize;
297 memset(skb->data, 0x00, ETH_HLEN + sizeof(*iph) + sizeof(*tcph));
299 skb->len = 0;
300 buf = skb_put(skb, packetsize + ETH_HLEN);
302 ethh = (struct ethhdr *) buf;
303 buf += ETH_HLEN;
305 iph = (struct iphdr *)buf;
306 buf += sizeof(*iph);
307 tcph = (struct tcphdr *)buf;
308 skb_reset_mac_header(skb);
309 skb_set_network_header(skb, ETH_HLEN);
310 skb_set_transport_header(skb, ETH_HLEN+sizeof(*iph));
311 buf += sizeof(*tcph);
313 skb->ip_summed = CHECKSUM_PARTIAL;
314 skb->protocol = htons(0x800);
315 skb->data_len = 0;
316 skb->mac_len = ETH_HLEN;
318 memcpy(ethh->h_dest, cm_node->rem_mac, ETH_ALEN);
319 memcpy(ethh->h_source, cm_node->loc_mac, ETH_ALEN);
320 ethh->h_proto = htons(0x0800);
322 iph->version = IPVERSION;
323 iph->ihl = 5; /* 5 * 4Byte words, IP headr len */
324 iph->tos = 0;
325 iph->tot_len = htons(packetsize);
326 iph->id = htons(++cm_node->tcp_cntxt.loc_id);
328 iph->frag_off = htons(0x4000);
329 iph->ttl = 0x40;
330 iph->protocol = 0x06; /* IPPROTO_TCP */
332 iph->saddr = htonl(cm_node->loc_addr);
333 iph->daddr = htonl(cm_node->rem_addr);
335 tcph->source = htons(cm_node->loc_port);
336 tcph->dest = htons(cm_node->rem_port);
337 tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
339 if (flags & SET_ACK) {
340 cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
341 tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
342 tcph->ack = 1;
343 } else
344 tcph->ack_seq = 0;
346 if (flags & SET_SYN) {
347 cm_node->tcp_cntxt.loc_seq_num++;
348 tcph->syn = 1;
349 } else
350 cm_node->tcp_cntxt.loc_seq_num += datasize;
352 if (flags & SET_FIN) {
353 cm_node->tcp_cntxt.loc_seq_num++;
354 tcph->fin = 1;
357 if (flags & SET_RST)
358 tcph->rst = 1;
360 tcph->doff = (u16)((sizeof(*tcph) + optionsize + 3) >> 2);
361 tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
362 tcph->urg_ptr = 0;
363 if (optionsize)
364 memcpy(buf, options, optionsize);
365 buf += optionsize;
366 if (datasize)
367 memcpy(buf, data, datasize);
369 skb_shinfo(skb)->nr_frags = 0;
370 cm_packets_created++;
376 * print_core - dump a cm core
378 static void print_core(struct nes_cm_core *core)
380 nes_debug(NES_DBG_CM, "---------------------------------------------\n");
381 nes_debug(NES_DBG_CM, "CM Core -- (core = %p )\n", core);
382 if (!core)
383 return;
384 nes_debug(NES_DBG_CM, "---------------------------------------------\n");
386 nes_debug(NES_DBG_CM, "State : %u \n", core->state);
388 nes_debug(NES_DBG_CM, "Listen Nodes : %u \n", atomic_read(&core->listen_node_cnt));
389 nes_debug(NES_DBG_CM, "Active Nodes : %u \n", atomic_read(&core->node_cnt));
391 nes_debug(NES_DBG_CM, "core : %p \n", core);
393 nes_debug(NES_DBG_CM, "-------------- end core ---------------\n");
398 * schedule_nes_timer
399 * note - cm_node needs to be protected before calling this. Encase in:
400 * rem_ref_cm_node(cm_core, cm_node);add_ref_cm_node(cm_node);
402 int schedule_nes_timer(struct nes_cm_node *cm_node, struct sk_buff *skb,
403 enum nes_timer_type type, int send_retrans,
404 int close_when_complete)
406 unsigned long flags;
407 struct nes_cm_core *cm_core = cm_node->cm_core;
408 struct nes_timer_entry *new_send;
409 int ret = 0;
410 u32 was_timer_set;
412 new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
413 if (!new_send)
414 return -ENOMEM;
416 /* new_send->timetosend = currenttime */
417 new_send->retrycount = NES_DEFAULT_RETRYS;
418 new_send->retranscount = NES_DEFAULT_RETRANS;
419 new_send->skb = skb;
420 new_send->timetosend = jiffies;
421 new_send->type = type;
422 new_send->netdev = cm_node->netdev;
423 new_send->send_retrans = send_retrans;
424 new_send->close_when_complete = close_when_complete;
426 if (type == NES_TIMER_TYPE_CLOSE) {
427 new_send->timetosend += (HZ/10);
428 if (cm_node->recv_entry) {
429 WARN_ON(1);
430 return -EINVAL;
432 cm_node->recv_entry = new_send;
435 if (type == NES_TIMER_TYPE_SEND) {
436 new_send->seq_num = ntohl(tcp_hdr(skb)->seq);
437 atomic_inc(&new_send->skb->users);
438 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
439 cm_node->send_entry = new_send;
440 add_ref_cm_node(cm_node);
441 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
442 new_send->timetosend = jiffies + NES_RETRY_TIMEOUT;
444 ret = nes_nic_cm_xmit(new_send->skb, cm_node->netdev);
445 if (ret != NETDEV_TX_OK) {
446 nes_debug(NES_DBG_CM, "Error sending packet %p "
447 "(jiffies = %lu)\n", new_send, jiffies);
448 atomic_dec(&new_send->skb->users);
449 new_send->timetosend = jiffies;
450 } else {
451 cm_packets_sent++;
452 if (!send_retrans) {
453 cleanup_retrans_entry(cm_node);
454 if (close_when_complete)
455 rem_ref_cm_node(cm_core, cm_node);
456 return ret;
461 was_timer_set = timer_pending(&cm_core->tcp_timer);
463 if (!was_timer_set) {
464 cm_core->tcp_timer.expires = new_send->timetosend;
465 add_timer(&cm_core->tcp_timer);
468 return ret;
471 static void nes_retrans_expired(struct nes_cm_node *cm_node)
473 switch (cm_node->state) {
474 case NES_CM_STATE_SYN_RCVD:
475 case NES_CM_STATE_CLOSING:
476 rem_ref_cm_node(cm_node->cm_core, cm_node);
477 break;
478 case NES_CM_STATE_LAST_ACK:
479 case NES_CM_STATE_FIN_WAIT1:
480 case NES_CM_STATE_MPAREJ_RCVD:
481 send_reset(cm_node, NULL);
482 break;
483 default:
484 create_event(cm_node, NES_CM_EVENT_ABORTED);
488 static void handle_recv_entry(struct nes_cm_node *cm_node, u32 rem_node)
490 struct nes_timer_entry *recv_entry = cm_node->recv_entry;
491 struct iw_cm_id *cm_id = cm_node->cm_id;
492 struct nes_qp *nesqp;
493 unsigned long qplockflags;
495 if (!recv_entry)
496 return;
497 nesqp = (struct nes_qp *)recv_entry->skb;
498 if (nesqp) {
499 spin_lock_irqsave(&nesqp->lock, qplockflags);
500 if (nesqp->cm_id) {
501 nes_debug(NES_DBG_CM, "QP%u: cm_id = %p, "
502 "refcount = %d: HIT A "
503 "NES_TIMER_TYPE_CLOSE with something "
504 "to do!!!\n", nesqp->hwqp.qp_id, cm_id,
505 atomic_read(&nesqp->refcount));
506 nesqp->hw_tcp_state = NES_AEQE_TCP_STATE_CLOSED;
507 nesqp->last_aeq = NES_AEQE_AEID_RESET_SENT;
508 nesqp->ibqp_state = IB_QPS_ERR;
509 spin_unlock_irqrestore(&nesqp->lock, qplockflags);
510 nes_cm_disconn(nesqp);
511 } else {
512 spin_unlock_irqrestore(&nesqp->lock, qplockflags);
513 nes_debug(NES_DBG_CM, "QP%u: cm_id = %p, "
514 "refcount = %d: HIT A "
515 "NES_TIMER_TYPE_CLOSE with nothing "
516 "to do!!!\n", nesqp->hwqp.qp_id, cm_id,
517 atomic_read(&nesqp->refcount));
519 } else if (rem_node) {
520 /* TIME_WAIT state */
521 rem_ref_cm_node(cm_node->cm_core, cm_node);
523 if (cm_node->cm_id)
524 cm_id->rem_ref(cm_id);
525 kfree(recv_entry);
526 cm_node->recv_entry = NULL;
530 * nes_cm_timer_tick
532 static void nes_cm_timer_tick(unsigned long pass)
534 unsigned long flags;
535 unsigned long nexttimeout = jiffies + NES_LONG_TIME;
536 struct nes_cm_node *cm_node;
537 struct nes_timer_entry *send_entry, *recv_entry;
538 struct list_head *list_core_temp;
539 struct list_head *list_node;
540 struct nes_cm_core *cm_core = g_cm_core;
541 u32 settimer = 0;
542 int ret = NETDEV_TX_OK;
544 struct list_head timer_list;
545 INIT_LIST_HEAD(&timer_list);
546 spin_lock_irqsave(&cm_core->ht_lock, flags);
548 list_for_each_safe(list_node, list_core_temp,
549 &cm_core->connected_nodes) {
550 cm_node = container_of(list_node, struct nes_cm_node, list);
551 if ((cm_node->recv_entry) || (cm_node->send_entry)) {
552 add_ref_cm_node(cm_node);
553 list_add(&cm_node->timer_entry, &timer_list);
556 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
558 list_for_each_safe(list_node, list_core_temp, &timer_list) {
559 cm_node = container_of(list_node, struct nes_cm_node,
560 timer_entry);
561 recv_entry = cm_node->recv_entry;
563 if (recv_entry) {
564 if (time_after(recv_entry->timetosend, jiffies)) {
565 if (nexttimeout > recv_entry->timetosend ||
566 !settimer) {
567 nexttimeout = recv_entry->timetosend;
568 settimer = 1;
570 } else
571 handle_recv_entry(cm_node, 1);
574 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
575 do {
576 send_entry = cm_node->send_entry;
577 if (!send_entry)
578 break;
579 if (time_after(send_entry->timetosend, jiffies)) {
580 if (cm_node->state != NES_CM_STATE_TSA) {
581 if ((nexttimeout >
582 send_entry->timetosend) ||
583 !settimer) {
584 nexttimeout =
585 send_entry->timetosend;
586 settimer = 1;
588 } else {
589 free_retrans_entry(cm_node);
591 break;
594 if ((cm_node->state == NES_CM_STATE_TSA) ||
595 (cm_node->state == NES_CM_STATE_CLOSED)) {
596 free_retrans_entry(cm_node);
597 break;
600 if (!send_entry->retranscount ||
601 !send_entry->retrycount) {
602 cm_packets_dropped++;
603 free_retrans_entry(cm_node);
605 spin_unlock_irqrestore(
606 &cm_node->retrans_list_lock, flags);
607 nes_retrans_expired(cm_node);
608 cm_node->state = NES_CM_STATE_CLOSED;
609 spin_lock_irqsave(&cm_node->retrans_list_lock,
610 flags);
611 break;
613 atomic_inc(&send_entry->skb->users);
614 cm_packets_retrans++;
615 nes_debug(NES_DBG_CM, "Retransmitting send_entry %p "
616 "for node %p, jiffies = %lu, time to send = "
617 "%lu, retranscount = %u, send_entry->seq_num = "
618 "0x%08X, cm_node->tcp_cntxt.rem_ack_num = "
619 "0x%08X\n", send_entry, cm_node, jiffies,
620 send_entry->timetosend,
621 send_entry->retranscount,
622 send_entry->seq_num,
623 cm_node->tcp_cntxt.rem_ack_num);
625 spin_unlock_irqrestore(&cm_node->retrans_list_lock,
626 flags);
627 ret = nes_nic_cm_xmit(send_entry->skb, cm_node->netdev);
628 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
629 if (ret != NETDEV_TX_OK) {
630 nes_debug(NES_DBG_CM, "rexmit failed for "
631 "node=%p\n", cm_node);
632 cm_packets_bounced++;
633 atomic_dec(&send_entry->skb->users);
634 send_entry->retrycount--;
635 nexttimeout = jiffies + NES_SHORT_TIME;
636 settimer = 1;
637 break;
638 } else {
639 cm_packets_sent++;
641 nes_debug(NES_DBG_CM, "Packet Sent: retrans count = "
642 "%u, retry count = %u.\n",
643 send_entry->retranscount,
644 send_entry->retrycount);
645 if (send_entry->send_retrans) {
646 send_entry->retranscount--;
647 send_entry->timetosend = jiffies +
648 NES_RETRY_TIMEOUT;
649 if (nexttimeout > send_entry->timetosend ||
650 !settimer) {
651 nexttimeout = send_entry->timetosend;
652 settimer = 1;
654 } else {
655 int close_when_complete;
656 close_when_complete =
657 send_entry->close_when_complete;
658 nes_debug(NES_DBG_CM, "cm_node=%p state=%d\n",
659 cm_node, cm_node->state);
660 free_retrans_entry(cm_node);
661 if (close_when_complete)
662 rem_ref_cm_node(cm_node->cm_core,
663 cm_node);
665 } while (0);
667 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
668 rem_ref_cm_node(cm_node->cm_core, cm_node);
669 if (ret != NETDEV_TX_OK) {
670 nes_debug(NES_DBG_CM, "rexmit failed for cm_node=%p\n",
671 cm_node);
672 break;
676 if (settimer) {
677 if (!timer_pending(&cm_core->tcp_timer)) {
678 cm_core->tcp_timer.expires = nexttimeout;
679 add_timer(&cm_core->tcp_timer);
686 * send_syn
688 static int send_syn(struct nes_cm_node *cm_node, u32 sendack,
689 struct sk_buff *skb)
691 int ret;
692 int flags = SET_SYN;
693 char optionsbuffer[sizeof(struct option_mss) +
694 sizeof(struct option_windowscale) + sizeof(struct option_base) +
695 TCP_OPTIONS_PADDING];
697 int optionssize = 0;
698 /* Sending MSS option */
699 union all_known_options *options;
701 if (!cm_node)
702 return -EINVAL;
704 options = (union all_known_options *)&optionsbuffer[optionssize];
705 options->as_mss.optionnum = OPTION_NUMBER_MSS;
706 options->as_mss.length = sizeof(struct option_mss);
707 options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
708 optionssize += sizeof(struct option_mss);
710 options = (union all_known_options *)&optionsbuffer[optionssize];
711 options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
712 options->as_windowscale.length = sizeof(struct option_windowscale);
713 options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
714 optionssize += sizeof(struct option_windowscale);
716 if (sendack && !(NES_DRV_OPT_SUPRESS_OPTION_BC & nes_drv_opt)) {
717 options = (union all_known_options *)&optionsbuffer[optionssize];
718 options->as_base.optionnum = OPTION_NUMBER_WRITE0;
719 options->as_base.length = sizeof(struct option_base);
720 optionssize += sizeof(struct option_base);
721 /* we need the size to be a multiple of 4 */
722 options = (union all_known_options *)&optionsbuffer[optionssize];
723 options->as_end = 1;
724 optionssize += 1;
725 options = (union all_known_options *)&optionsbuffer[optionssize];
726 options->as_end = 1;
727 optionssize += 1;
730 options = (union all_known_options *)&optionsbuffer[optionssize];
731 options->as_end = OPTION_NUMBER_END;
732 optionssize += 1;
734 if (!skb)
735 skb = dev_alloc_skb(MAX_CM_BUFFER);
736 if (!skb) {
737 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
738 return -1;
741 if (sendack)
742 flags |= SET_ACK;
744 form_cm_frame(skb, cm_node, optionsbuffer, optionssize, NULL, 0, flags);
745 ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
747 return ret;
752 * send_reset
754 static int send_reset(struct nes_cm_node *cm_node, struct sk_buff *skb)
756 int ret;
757 int flags = SET_RST | SET_ACK;
759 if (!skb)
760 skb = dev_alloc_skb(MAX_CM_BUFFER);
761 if (!skb) {
762 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
763 return -ENOMEM;
766 form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, flags);
767 ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 0, 1);
769 return ret;
774 * send_ack
776 static int send_ack(struct nes_cm_node *cm_node, struct sk_buff *skb)
778 int ret;
780 if (!skb)
781 skb = dev_alloc_skb(MAX_CM_BUFFER);
783 if (!skb) {
784 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
785 return -1;
788 form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, SET_ACK);
789 ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 0, 0);
791 return ret;
796 * send_fin
798 static int send_fin(struct nes_cm_node *cm_node, struct sk_buff *skb)
800 int ret;
802 /* if we didn't get a frame get one */
803 if (!skb)
804 skb = dev_alloc_skb(MAX_CM_BUFFER);
806 if (!skb) {
807 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
808 return -1;
811 form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, SET_ACK | SET_FIN);
812 ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
814 return ret;
819 * find_node - find a cm node that matches the reference cm node
821 static struct nes_cm_node *find_node(struct nes_cm_core *cm_core,
822 u16 rem_port, nes_addr_t rem_addr, u16 loc_port, nes_addr_t loc_addr)
824 unsigned long flags;
825 struct list_head *hte;
826 struct nes_cm_node *cm_node;
828 /* get a handle on the hte */
829 hte = &cm_core->connected_nodes;
831 /* walk list and find cm_node associated with this session ID */
832 spin_lock_irqsave(&cm_core->ht_lock, flags);
833 list_for_each_entry(cm_node, hte, list) {
834 /* compare quad, return node handle if a match */
835 nes_debug(NES_DBG_CM, "finding node %x:%x =? %x:%x ^ %x:%x =? %x:%x\n",
836 cm_node->loc_addr, cm_node->loc_port,
837 loc_addr, loc_port,
838 cm_node->rem_addr, cm_node->rem_port,
839 rem_addr, rem_port);
840 if ((cm_node->loc_addr == loc_addr) && (cm_node->loc_port == loc_port) &&
841 (cm_node->rem_addr == rem_addr) && (cm_node->rem_port == rem_port)) {
842 add_ref_cm_node(cm_node);
843 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
844 return cm_node;
847 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
849 /* no owner node */
850 return NULL;
855 * find_listener - find a cm node listening on this addr-port pair
857 static struct nes_cm_listener *find_listener(struct nes_cm_core *cm_core,
858 nes_addr_t dst_addr, u16 dst_port, enum nes_cm_listener_state listener_state)
860 unsigned long flags;
861 struct nes_cm_listener *listen_node;
862 __be32 tmp_addr = cpu_to_be32(dst_addr);
864 /* walk list and find cm_node associated with this session ID */
865 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
866 list_for_each_entry(listen_node, &cm_core->listen_list.list, list) {
867 /* compare node pair, return node handle if a match */
868 if (((listen_node->loc_addr == dst_addr) ||
869 listen_node->loc_addr == 0x00000000) &&
870 (listen_node->loc_port == dst_port) &&
871 (listener_state & listen_node->listener_state)) {
872 atomic_inc(&listen_node->ref_count);
873 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
874 return listen_node;
877 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
879 nes_debug(NES_DBG_CM, "Unable to find listener for %pI4:%x\n",
880 &tmp_addr, dst_port);
882 /* no listener */
883 return NULL;
888 * add_hte_node - add a cm node to the hash table
890 static int add_hte_node(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
892 unsigned long flags;
893 struct list_head *hte;
895 if (!cm_node || !cm_core)
896 return -EINVAL;
898 nes_debug(NES_DBG_CM, "Adding Node %p to Active Connection HT\n",
899 cm_node);
901 spin_lock_irqsave(&cm_core->ht_lock, flags);
903 /* get a handle on the hash table element (list head for this slot) */
904 hte = &cm_core->connected_nodes;
905 list_add_tail(&cm_node->list, hte);
906 atomic_inc(&cm_core->ht_node_cnt);
908 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
910 return 0;
915 * mini_cm_dec_refcnt_listen
917 static int mini_cm_dec_refcnt_listen(struct nes_cm_core *cm_core,
918 struct nes_cm_listener *listener, int free_hanging_nodes)
920 int ret = -EINVAL;
921 int err = 0;
922 unsigned long flags;
923 struct list_head *list_pos = NULL;
924 struct list_head *list_temp = NULL;
925 struct nes_cm_node *cm_node = NULL;
926 struct list_head reset_list;
928 nes_debug(NES_DBG_CM, "attempting listener= %p free_nodes= %d, "
929 "refcnt=%d\n", listener, free_hanging_nodes,
930 atomic_read(&listener->ref_count));
931 /* free non-accelerated child nodes for this listener */
932 INIT_LIST_HEAD(&reset_list);
933 if (free_hanging_nodes) {
934 spin_lock_irqsave(&cm_core->ht_lock, flags);
935 list_for_each_safe(list_pos, list_temp,
936 &g_cm_core->connected_nodes) {
937 cm_node = container_of(list_pos, struct nes_cm_node,
938 list);
939 if ((cm_node->listener == listener) &&
940 (!cm_node->accelerated)) {
941 add_ref_cm_node(cm_node);
942 list_add(&cm_node->reset_entry, &reset_list);
945 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
948 list_for_each_safe(list_pos, list_temp, &reset_list) {
949 cm_node = container_of(list_pos, struct nes_cm_node,
950 reset_entry);
952 struct nes_cm_node *loopback = cm_node->loopbackpartner;
953 if (NES_CM_STATE_FIN_WAIT1 <= cm_node->state) {
954 rem_ref_cm_node(cm_node->cm_core, cm_node);
955 } else {
956 if (!loopback) {
957 cleanup_retrans_entry(cm_node);
958 err = send_reset(cm_node, NULL);
959 if (err) {
960 cm_node->state =
961 NES_CM_STATE_CLOSED;
962 WARN_ON(1);
963 } else {
964 cm_node->state =
965 NES_CM_STATE_CLOSED;
966 rem_ref_cm_node(
967 cm_node->cm_core,
968 cm_node);
970 } else {
971 struct nes_cm_event event;
973 event.cm_node = loopback;
974 event.cm_info.rem_addr =
975 loopback->rem_addr;
976 event.cm_info.loc_addr =
977 loopback->loc_addr;
978 event.cm_info.rem_port =
979 loopback->rem_port;
980 event.cm_info.loc_port =
981 loopback->loc_port;
982 event.cm_info.cm_id = loopback->cm_id;
983 cm_event_connect_error(&event);
984 loopback->state = NES_CM_STATE_CLOSED;
986 event.cm_node = cm_node;
987 event.cm_info.rem_addr =
988 cm_node->rem_addr;
989 event.cm_info.loc_addr =
990 cm_node->loc_addr;
991 event.cm_info.rem_port =
992 cm_node->rem_port;
993 event.cm_info.loc_port =
994 cm_node->loc_port;
995 event.cm_info.cm_id = cm_node->cm_id;
996 cm_event_reset(&event);
998 rem_ref_cm_node(cm_node->cm_core,
999 cm_node);
1006 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1007 if (!atomic_dec_return(&listener->ref_count)) {
1008 list_del(&listener->list);
1010 /* decrement our listen node count */
1011 atomic_dec(&cm_core->listen_node_cnt);
1013 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1015 if (listener->nesvnic) {
1016 nes_manage_apbvt(listener->nesvnic, listener->loc_port,
1017 PCI_FUNC(listener->nesvnic->nesdev->pcidev->devfn), NES_MANAGE_APBVT_DEL);
1020 nes_debug(NES_DBG_CM, "destroying listener (%p)\n", listener);
1022 kfree(listener);
1023 listener = NULL;
1024 ret = 0;
1025 cm_listens_destroyed++;
1026 } else {
1027 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1029 if (listener) {
1030 if (atomic_read(&listener->pend_accepts_cnt) > 0)
1031 nes_debug(NES_DBG_CM, "destroying listener (%p)"
1032 " with non-zero pending accepts=%u\n",
1033 listener, atomic_read(&listener->pend_accepts_cnt));
1036 return ret;
1041 * mini_cm_del_listen
1043 static int mini_cm_del_listen(struct nes_cm_core *cm_core,
1044 struct nes_cm_listener *listener)
1046 listener->listener_state = NES_CM_LISTENER_PASSIVE_STATE;
1047 listener->cm_id = NULL; /* going to be destroyed pretty soon */
1048 return mini_cm_dec_refcnt_listen(cm_core, listener, 1);
1053 * mini_cm_accelerated
1055 static inline int mini_cm_accelerated(struct nes_cm_core *cm_core,
1056 struct nes_cm_node *cm_node)
1058 u32 was_timer_set;
1059 cm_node->accelerated = 1;
1061 if (cm_node->accept_pend) {
1062 BUG_ON(!cm_node->listener);
1063 atomic_dec(&cm_node->listener->pend_accepts_cnt);
1064 cm_node->accept_pend = 0;
1065 BUG_ON(atomic_read(&cm_node->listener->pend_accepts_cnt) < 0);
1068 was_timer_set = timer_pending(&cm_core->tcp_timer);
1069 if (!was_timer_set) {
1070 cm_core->tcp_timer.expires = jiffies + NES_SHORT_TIME;
1071 add_timer(&cm_core->tcp_timer);
1074 return 0;
1079 * nes_addr_resolve_neigh
1081 static int nes_addr_resolve_neigh(struct nes_vnic *nesvnic, u32 dst_ip)
1083 struct rtable *rt;
1084 struct flowi fl;
1085 struct neighbour *neigh;
1086 int rc = -1;
1088 memset(&fl, 0, sizeof fl);
1089 fl.nl_u.ip4_u.daddr = htonl(dst_ip);
1090 if (ip_route_output_key(&init_net, &rt, &fl)) {
1091 printk(KERN_ERR "%s: ip_route_output_key failed for 0x%08X\n",
1092 __func__, dst_ip);
1093 return rc;
1096 neigh = neigh_lookup(&arp_tbl, &rt->rt_gateway, nesvnic->netdev);
1097 if (neigh) {
1098 if (neigh->nud_state & NUD_VALID) {
1099 nes_debug(NES_DBG_CM, "Neighbor MAC address for 0x%08X"
1100 " is %pM, Gateway is 0x%08X \n", dst_ip,
1101 neigh->ha, ntohl(rt->rt_gateway));
1102 nes_manage_arp_cache(nesvnic->netdev, neigh->ha,
1103 dst_ip, NES_ARP_ADD);
1104 rc = nes_arp_table(nesvnic->nesdev, dst_ip, NULL,
1105 NES_ARP_RESOLVE);
1107 neigh_release(neigh);
1110 if ((neigh == NULL) || (!(neigh->nud_state & NUD_VALID)))
1111 neigh_event_send(rt->u.dst.neighbour, NULL);
1113 ip_rt_put(rt);
1114 return rc;
1119 * make_cm_node - create a new instance of a cm node
1121 static struct nes_cm_node *make_cm_node(struct nes_cm_core *cm_core,
1122 struct nes_vnic *nesvnic, struct nes_cm_info *cm_info,
1123 struct nes_cm_listener *listener)
1125 struct nes_cm_node *cm_node;
1126 struct timespec ts;
1127 int arpindex = 0;
1128 struct nes_device *nesdev;
1129 struct nes_adapter *nesadapter;
1131 /* create an hte and cm_node for this instance */
1132 cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
1133 if (!cm_node)
1134 return NULL;
1136 /* set our node specific transport info */
1137 cm_node->loc_addr = cm_info->loc_addr;
1138 cm_node->rem_addr = cm_info->rem_addr;
1139 cm_node->loc_port = cm_info->loc_port;
1140 cm_node->rem_port = cm_info->rem_port;
1141 cm_node->send_write0 = send_first;
1142 nes_debug(NES_DBG_CM, "Make node addresses : loc = %pI4:%x, rem = %pI4:%x\n",
1143 &cm_node->loc_addr, cm_node->loc_port,
1144 &cm_node->rem_addr, cm_node->rem_port);
1145 cm_node->listener = listener;
1146 cm_node->netdev = nesvnic->netdev;
1147 cm_node->cm_id = cm_info->cm_id;
1148 memcpy(cm_node->loc_mac, nesvnic->netdev->dev_addr, ETH_ALEN);
1150 nes_debug(NES_DBG_CM, "listener=%p, cm_id=%p\n", cm_node->listener,
1151 cm_node->cm_id);
1153 spin_lock_init(&cm_node->retrans_list_lock);
1155 cm_node->loopbackpartner = NULL;
1156 atomic_set(&cm_node->ref_count, 1);
1157 /* associate our parent CM core */
1158 cm_node->cm_core = cm_core;
1159 cm_node->tcp_cntxt.loc_id = NES_CM_DEF_LOCAL_ID;
1160 cm_node->tcp_cntxt.rcv_wscale = NES_CM_DEFAULT_RCV_WND_SCALE;
1161 cm_node->tcp_cntxt.rcv_wnd = NES_CM_DEFAULT_RCV_WND_SCALED >>
1162 NES_CM_DEFAULT_RCV_WND_SCALE;
1163 ts = current_kernel_time();
1164 cm_node->tcp_cntxt.loc_seq_num = htonl(ts.tv_nsec);
1165 cm_node->tcp_cntxt.mss = nesvnic->max_frame_size - sizeof(struct iphdr) -
1166 sizeof(struct tcphdr) - ETH_HLEN - VLAN_HLEN;
1167 cm_node->tcp_cntxt.rcv_nxt = 0;
1168 /* get a unique session ID , add thread_id to an upcounter to handle race */
1169 atomic_inc(&cm_core->node_cnt);
1170 cm_node->conn_type = cm_info->conn_type;
1171 cm_node->apbvt_set = 0;
1172 cm_node->accept_pend = 0;
1174 cm_node->nesvnic = nesvnic;
1175 /* get some device handles, for arp lookup */
1176 nesdev = nesvnic->nesdev;
1177 nesadapter = nesdev->nesadapter;
1179 cm_node->loopbackpartner = NULL;
1180 /* get the mac addr for the remote node */
1181 if (ipv4_is_loopback(htonl(cm_node->rem_addr)))
1182 arpindex = nes_arp_table(nesdev, ntohl(nesvnic->local_ipaddr), NULL, NES_ARP_RESOLVE);
1183 else
1184 arpindex = nes_arp_table(nesdev, cm_node->rem_addr, NULL, NES_ARP_RESOLVE);
1185 if (arpindex < 0) {
1186 arpindex = nes_addr_resolve_neigh(nesvnic, cm_info->rem_addr);
1187 if (arpindex < 0) {
1188 kfree(cm_node);
1189 return NULL;
1193 /* copy the mac addr to node context */
1194 memcpy(cm_node->rem_mac, nesadapter->arp_table[arpindex].mac_addr, ETH_ALEN);
1195 nes_debug(NES_DBG_CM, "Remote mac addr from arp table: %pM\n",
1196 cm_node->rem_mac);
1198 add_hte_node(cm_core, cm_node);
1199 atomic_inc(&cm_nodes_created);
1201 return cm_node;
1206 * add_ref_cm_node - destroy an instance of a cm node
1208 static int add_ref_cm_node(struct nes_cm_node *cm_node)
1210 atomic_inc(&cm_node->ref_count);
1211 return 0;
1216 * rem_ref_cm_node - destroy an instance of a cm node
1218 static int rem_ref_cm_node(struct nes_cm_core *cm_core,
1219 struct nes_cm_node *cm_node)
1221 unsigned long flags;
1222 struct nes_qp *nesqp;
1224 if (!cm_node)
1225 return -EINVAL;
1227 spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
1228 if (atomic_dec_return(&cm_node->ref_count)) {
1229 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
1230 return 0;
1232 list_del(&cm_node->list);
1233 atomic_dec(&cm_core->ht_node_cnt);
1234 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
1236 /* if the node is destroyed before connection was accelerated */
1237 if (!cm_node->accelerated && cm_node->accept_pend) {
1238 BUG_ON(!cm_node->listener);
1239 atomic_dec(&cm_node->listener->pend_accepts_cnt);
1240 BUG_ON(atomic_read(&cm_node->listener->pend_accepts_cnt) < 0);
1242 WARN_ON(cm_node->send_entry);
1243 if (cm_node->recv_entry)
1244 handle_recv_entry(cm_node, 0);
1245 if (cm_node->listener) {
1246 mini_cm_dec_refcnt_listen(cm_core, cm_node->listener, 0);
1247 } else {
1248 if (cm_node->apbvt_set && cm_node->nesvnic) {
1249 nes_manage_apbvt(cm_node->nesvnic, cm_node->loc_port,
1250 PCI_FUNC(
1251 cm_node->nesvnic->nesdev->pcidev->devfn),
1252 NES_MANAGE_APBVT_DEL);
1256 atomic_dec(&cm_core->node_cnt);
1257 atomic_inc(&cm_nodes_destroyed);
1258 nesqp = cm_node->nesqp;
1259 if (nesqp) {
1260 nesqp->cm_node = NULL;
1261 nes_rem_ref(&nesqp->ibqp);
1262 cm_node->nesqp = NULL;
1265 cm_node->freed = 1;
1266 kfree(cm_node);
1267 return 0;
1271 * process_options
1273 static int process_options(struct nes_cm_node *cm_node, u8 *optionsloc,
1274 u32 optionsize, u32 syn_packet)
1276 u32 tmp;
1277 u32 offset = 0;
1278 union all_known_options *all_options;
1279 char got_mss_option = 0;
1281 while (offset < optionsize) {
1282 all_options = (union all_known_options *)(optionsloc + offset);
1283 switch (all_options->as_base.optionnum) {
1284 case OPTION_NUMBER_END:
1285 offset = optionsize;
1286 break;
1287 case OPTION_NUMBER_NONE:
1288 offset += 1;
1289 continue;
1290 case OPTION_NUMBER_MSS:
1291 nes_debug(NES_DBG_CM, "%s: MSS Length: %d Offset: %d "
1292 "Size: %d\n", __func__,
1293 all_options->as_mss.length, offset, optionsize);
1294 got_mss_option = 1;
1295 if (all_options->as_mss.length != 4) {
1296 return 1;
1297 } else {
1298 tmp = ntohs(all_options->as_mss.mss);
1299 if (tmp > 0 && tmp <
1300 cm_node->tcp_cntxt.mss)
1301 cm_node->tcp_cntxt.mss = tmp;
1303 break;
1304 case OPTION_NUMBER_WINDOW_SCALE:
1305 cm_node->tcp_cntxt.snd_wscale =
1306 all_options->as_windowscale.shiftcount;
1307 break;
1308 case OPTION_NUMBER_WRITE0:
1309 cm_node->send_write0 = 1;
1310 break;
1311 default:
1312 nes_debug(NES_DBG_CM, "TCP Option not understood: %x\n",
1313 all_options->as_base.optionnum);
1314 break;
1316 offset += all_options->as_base.length;
1318 if ((!got_mss_option) && (syn_packet))
1319 cm_node->tcp_cntxt.mss = NES_CM_DEFAULT_MSS;
1320 return 0;
1323 static void drop_packet(struct sk_buff *skb)
1325 atomic_inc(&cm_accel_dropped_pkts);
1326 dev_kfree_skb_any(skb);
1329 static void handle_fin_pkt(struct nes_cm_node *cm_node)
1331 nes_debug(NES_DBG_CM, "Received FIN, cm_node = %p, state = %u. "
1332 "refcnt=%d\n", cm_node, cm_node->state,
1333 atomic_read(&cm_node->ref_count));
1334 cm_node->tcp_cntxt.rcv_nxt++;
1335 cleanup_retrans_entry(cm_node);
1336 switch (cm_node->state) {
1337 case NES_CM_STATE_SYN_RCVD:
1338 case NES_CM_STATE_SYN_SENT:
1339 case NES_CM_STATE_ESTABLISHED:
1340 case NES_CM_STATE_MPAREQ_SENT:
1341 case NES_CM_STATE_MPAREJ_RCVD:
1342 cm_node->state = NES_CM_STATE_LAST_ACK;
1343 send_fin(cm_node, NULL);
1344 break;
1345 case NES_CM_STATE_FIN_WAIT1:
1346 cm_node->state = NES_CM_STATE_CLOSING;
1347 send_ack(cm_node, NULL);
1348 /* Wait for ACK as this is simultanous close..
1349 * After we receive ACK, do not send anything..
1350 * Just rm the node.. Done.. */
1351 break;
1352 case NES_CM_STATE_FIN_WAIT2:
1353 cm_node->state = NES_CM_STATE_TIME_WAIT;
1354 send_ack(cm_node, NULL);
1355 schedule_nes_timer(cm_node, NULL, NES_TIMER_TYPE_CLOSE, 1, 0);
1356 break;
1357 case NES_CM_STATE_TIME_WAIT:
1358 cm_node->state = NES_CM_STATE_CLOSED;
1359 rem_ref_cm_node(cm_node->cm_core, cm_node);
1360 break;
1361 case NES_CM_STATE_TSA:
1362 default:
1363 nes_debug(NES_DBG_CM, "Error Rcvd FIN for node-%p state = %d\n",
1364 cm_node, cm_node->state);
1365 break;
1370 static void handle_rst_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1371 struct tcphdr *tcph)
1374 int reset = 0; /* whether to send reset in case of err.. */
1375 int passive_state;
1376 atomic_inc(&cm_resets_recvd);
1377 nes_debug(NES_DBG_CM, "Received Reset, cm_node = %p, state = %u."
1378 " refcnt=%d\n", cm_node, cm_node->state,
1379 atomic_read(&cm_node->ref_count));
1380 cleanup_retrans_entry(cm_node);
1381 switch (cm_node->state) {
1382 case NES_CM_STATE_SYN_SENT:
1383 case NES_CM_STATE_MPAREQ_SENT:
1384 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1385 "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1386 cm_node->listener, cm_node->state);
1387 active_open_err(cm_node, skb, reset);
1388 break;
1389 case NES_CM_STATE_MPAREQ_RCVD:
1390 passive_state = atomic_add_return(1, &cm_node->passive_state);
1391 if (passive_state == NES_SEND_RESET_EVENT)
1392 create_event(cm_node, NES_CM_EVENT_RESET);
1393 cleanup_retrans_entry(cm_node);
1394 cm_node->state = NES_CM_STATE_CLOSED;
1395 dev_kfree_skb_any(skb);
1396 break;
1397 case NES_CM_STATE_ESTABLISHED:
1398 case NES_CM_STATE_SYN_RCVD:
1399 case NES_CM_STATE_LISTENING:
1400 nes_debug(NES_DBG_CM, "Bad state %s[%u]\n", __func__, __LINE__);
1401 passive_open_err(cm_node, skb, reset);
1402 break;
1403 case NES_CM_STATE_TSA:
1404 active_open_err(cm_node, skb, reset);
1405 break;
1406 case NES_CM_STATE_CLOSED:
1407 cleanup_retrans_entry(cm_node);
1408 drop_packet(skb);
1409 break;
1410 case NES_CM_STATE_TIME_WAIT:
1411 cleanup_retrans_entry(cm_node);
1412 cm_node->state = NES_CM_STATE_CLOSED;
1413 rem_ref_cm_node(cm_node->cm_core, cm_node);
1414 drop_packet(skb);
1415 break;
1416 case NES_CM_STATE_FIN_WAIT1:
1417 cleanup_retrans_entry(cm_node);
1418 nes_debug(NES_DBG_CM, "Bad state %s[%u]\n", __func__, __LINE__);
1419 default:
1420 drop_packet(skb);
1421 break;
1426 static void handle_rcv_mpa(struct nes_cm_node *cm_node, struct sk_buff *skb)
1429 int ret = 0;
1430 int datasize = skb->len;
1431 u8 *dataloc = skb->data;
1433 enum nes_cm_event_type type = NES_CM_EVENT_UNKNOWN;
1434 u32 res_type;
1435 ret = parse_mpa(cm_node, dataloc, &res_type, datasize);
1436 if (ret) {
1437 nes_debug(NES_DBG_CM, "didn't like MPA Request\n");
1438 if (cm_node->state == NES_CM_STATE_MPAREQ_SENT) {
1439 nes_debug(NES_DBG_CM, "%s[%u] create abort for "
1440 "cm_node=%p listener=%p state=%d\n", __func__,
1441 __LINE__, cm_node, cm_node->listener,
1442 cm_node->state);
1443 active_open_err(cm_node, skb, 1);
1444 } else {
1445 passive_open_err(cm_node, skb, 1);
1447 return;
1450 switch (cm_node->state) {
1451 case NES_CM_STATE_ESTABLISHED:
1452 if (res_type == NES_MPA_REQUEST_REJECT) {
1453 /*BIG problem as we are receiving the MPA.. So should
1454 * not be REJECT.. This is Passive Open.. We can
1455 * only receive it Reject for Active Open...*/
1456 WARN_ON(1);
1458 cm_node->state = NES_CM_STATE_MPAREQ_RCVD;
1459 type = NES_CM_EVENT_MPA_REQ;
1460 atomic_set(&cm_node->passive_state,
1461 NES_PASSIVE_STATE_INDICATED);
1462 break;
1463 case NES_CM_STATE_MPAREQ_SENT:
1464 if (res_type == NES_MPA_REQUEST_REJECT) {
1465 type = NES_CM_EVENT_MPA_REJECT;
1466 cm_node->state = NES_CM_STATE_MPAREJ_RCVD;
1467 } else {
1468 type = NES_CM_EVENT_CONNECTED;
1469 cm_node->state = NES_CM_STATE_TSA;
1472 break;
1473 default:
1474 WARN_ON(1);
1475 break;
1477 dev_kfree_skb_any(skb);
1478 create_event(cm_node, type);
1481 static void indicate_pkt_err(struct nes_cm_node *cm_node, struct sk_buff *skb)
1483 switch (cm_node->state) {
1484 case NES_CM_STATE_SYN_SENT:
1485 case NES_CM_STATE_MPAREQ_SENT:
1486 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1487 "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1488 cm_node->listener, cm_node->state);
1489 active_open_err(cm_node, skb, 1);
1490 break;
1491 case NES_CM_STATE_ESTABLISHED:
1492 case NES_CM_STATE_SYN_RCVD:
1493 passive_open_err(cm_node, skb, 1);
1494 break;
1495 case NES_CM_STATE_TSA:
1496 default:
1497 drop_packet(skb);
1501 static int check_syn(struct nes_cm_node *cm_node, struct tcphdr *tcph,
1502 struct sk_buff *skb)
1504 int err;
1506 err = ((ntohl(tcph->ack_seq) == cm_node->tcp_cntxt.loc_seq_num))? 0 : 1;
1507 if (err)
1508 active_open_err(cm_node, skb, 1);
1510 return err;
1513 static int check_seq(struct nes_cm_node *cm_node, struct tcphdr *tcph,
1514 struct sk_buff *skb)
1516 int err = 0;
1517 u32 seq;
1518 u32 ack_seq;
1519 u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
1520 u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
1521 u32 rcv_wnd;
1522 seq = ntohl(tcph->seq);
1523 ack_seq = ntohl(tcph->ack_seq);
1524 rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
1525 if (ack_seq != loc_seq_num)
1526 err = 1;
1527 else if ((seq + rcv_wnd) < rcv_nxt)
1528 err = 1;
1529 if (err) {
1530 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1531 "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1532 cm_node->listener, cm_node->state);
1533 indicate_pkt_err(cm_node, skb);
1534 nes_debug(NES_DBG_CM, "seq ERROR cm_node =%p seq=0x%08X "
1535 "rcv_nxt=0x%08X rcv_wnd=0x%x\n", cm_node, seq, rcv_nxt,
1536 rcv_wnd);
1538 return err;
1542 * handle_syn_pkt() is for Passive node. The syn packet is received when a node
1543 * is created with a listener or it may comein as rexmitted packet which in
1544 * that case will be just dropped.
1547 static void handle_syn_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1548 struct tcphdr *tcph)
1550 int ret;
1551 u32 inc_sequence;
1552 int optionsize;
1554 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1555 skb_trim(skb, 0);
1556 inc_sequence = ntohl(tcph->seq);
1558 switch (cm_node->state) {
1559 case NES_CM_STATE_SYN_SENT:
1560 case NES_CM_STATE_MPAREQ_SENT:
1561 /* Rcvd syn on active open connection*/
1562 active_open_err(cm_node, skb, 1);
1563 break;
1564 case NES_CM_STATE_LISTENING:
1565 /* Passive OPEN */
1566 if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
1567 cm_node->listener->backlog) {
1568 nes_debug(NES_DBG_CM, "drop syn due to backlog "
1569 "pressure \n");
1570 cm_backlog_drops++;
1571 passive_open_err(cm_node, skb, 0);
1572 break;
1574 ret = handle_tcp_options(cm_node, tcph, skb, optionsize,
1576 if (ret) {
1577 passive_open_err(cm_node, skb, 0);
1578 /* drop pkt */
1579 break;
1581 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
1582 BUG_ON(cm_node->send_entry);
1583 cm_node->accept_pend = 1;
1584 atomic_inc(&cm_node->listener->pend_accepts_cnt);
1586 cm_node->state = NES_CM_STATE_SYN_RCVD;
1587 send_syn(cm_node, 1, skb);
1588 break;
1589 case NES_CM_STATE_CLOSED:
1590 cleanup_retrans_entry(cm_node);
1591 send_reset(cm_node, skb);
1592 break;
1593 case NES_CM_STATE_TSA:
1594 case NES_CM_STATE_ESTABLISHED:
1595 case NES_CM_STATE_FIN_WAIT1:
1596 case NES_CM_STATE_FIN_WAIT2:
1597 case NES_CM_STATE_MPAREQ_RCVD:
1598 case NES_CM_STATE_LAST_ACK:
1599 case NES_CM_STATE_CLOSING:
1600 case NES_CM_STATE_UNKNOWN:
1601 default:
1602 drop_packet(skb);
1603 break;
1607 static void handle_synack_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1608 struct tcphdr *tcph)
1611 int ret;
1612 u32 inc_sequence;
1613 int optionsize;
1615 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1616 skb_trim(skb, 0);
1617 inc_sequence = ntohl(tcph->seq);
1618 switch (cm_node->state) {
1619 case NES_CM_STATE_SYN_SENT:
1620 cleanup_retrans_entry(cm_node);
1621 /* active open */
1622 if (check_syn(cm_node, tcph, skb))
1623 return;
1624 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
1625 /* setup options */
1626 ret = handle_tcp_options(cm_node, tcph, skb, optionsize, 0);
1627 if (ret) {
1628 nes_debug(NES_DBG_CM, "cm_node=%p tcp_options failed\n",
1629 cm_node);
1630 break;
1632 cleanup_retrans_entry(cm_node);
1633 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
1634 send_mpa_request(cm_node, skb);
1635 cm_node->state = NES_CM_STATE_MPAREQ_SENT;
1636 break;
1637 case NES_CM_STATE_MPAREQ_RCVD:
1638 /* passive open, so should not be here */
1639 passive_open_err(cm_node, skb, 1);
1640 break;
1641 case NES_CM_STATE_LISTENING:
1642 case NES_CM_STATE_CLOSED:
1643 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
1644 cleanup_retrans_entry(cm_node);
1645 send_reset(cm_node, skb);
1646 break;
1647 case NES_CM_STATE_ESTABLISHED:
1648 case NES_CM_STATE_FIN_WAIT1:
1649 case NES_CM_STATE_FIN_WAIT2:
1650 case NES_CM_STATE_LAST_ACK:
1651 case NES_CM_STATE_TSA:
1652 case NES_CM_STATE_CLOSING:
1653 case NES_CM_STATE_UNKNOWN:
1654 case NES_CM_STATE_MPAREQ_SENT:
1655 default:
1656 drop_packet(skb);
1657 break;
1661 static void handle_ack_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1662 struct tcphdr *tcph)
1664 int datasize = 0;
1665 u32 inc_sequence;
1666 u32 rem_seq_ack;
1667 u32 rem_seq;
1668 int ret;
1669 int optionsize;
1670 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1672 if (check_seq(cm_node, tcph, skb))
1673 return;
1675 skb_pull(skb, tcph->doff << 2);
1676 inc_sequence = ntohl(tcph->seq);
1677 rem_seq = ntohl(tcph->seq);
1678 rem_seq_ack = ntohl(tcph->ack_seq);
1679 datasize = skb->len;
1680 cleanup_retrans_entry(cm_node);
1681 switch (cm_node->state) {
1682 case NES_CM_STATE_SYN_RCVD:
1683 /* Passive OPEN */
1684 ret = handle_tcp_options(cm_node, tcph, skb, optionsize, 1);
1685 if (ret)
1686 break;
1687 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
1688 if (cm_node->tcp_cntxt.rem_ack_num !=
1689 cm_node->tcp_cntxt.loc_seq_num) {
1690 nes_debug(NES_DBG_CM, "rem_ack_num != loc_seq_num\n");
1691 cleanup_retrans_entry(cm_node);
1692 send_reset(cm_node, skb);
1693 return;
1695 cm_node->state = NES_CM_STATE_ESTABLISHED;
1696 cleanup_retrans_entry(cm_node);
1697 if (datasize) {
1698 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
1699 handle_rcv_mpa(cm_node, skb);
1700 } else { /* rcvd ACK only */
1701 dev_kfree_skb_any(skb);
1702 cleanup_retrans_entry(cm_node);
1704 break;
1705 case NES_CM_STATE_ESTABLISHED:
1706 /* Passive OPEN */
1707 cleanup_retrans_entry(cm_node);
1708 if (datasize) {
1709 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
1710 handle_rcv_mpa(cm_node, skb);
1711 } else
1712 drop_packet(skb);
1713 break;
1714 case NES_CM_STATE_MPAREQ_SENT:
1715 cleanup_retrans_entry(cm_node);
1716 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
1717 if (datasize) {
1718 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
1719 handle_rcv_mpa(cm_node, skb);
1720 } else { /* Could be just an ack pkt.. */
1721 cleanup_retrans_entry(cm_node);
1722 dev_kfree_skb_any(skb);
1724 break;
1725 case NES_CM_STATE_LISTENING:
1726 case NES_CM_STATE_CLOSED:
1727 cleanup_retrans_entry(cm_node);
1728 send_reset(cm_node, skb);
1729 break;
1730 case NES_CM_STATE_LAST_ACK:
1731 cleanup_retrans_entry(cm_node);
1732 cm_node->state = NES_CM_STATE_CLOSED;
1733 cm_node->cm_id->rem_ref(cm_node->cm_id);
1734 case NES_CM_STATE_CLOSING:
1735 cleanup_retrans_entry(cm_node);
1736 rem_ref_cm_node(cm_node->cm_core, cm_node);
1737 drop_packet(skb);
1738 break;
1739 case NES_CM_STATE_FIN_WAIT1:
1740 cleanup_retrans_entry(cm_node);
1741 drop_packet(skb);
1742 cm_node->state = NES_CM_STATE_FIN_WAIT2;
1743 break;
1744 case NES_CM_STATE_SYN_SENT:
1745 case NES_CM_STATE_FIN_WAIT2:
1746 case NES_CM_STATE_TSA:
1747 case NES_CM_STATE_MPAREQ_RCVD:
1748 case NES_CM_STATE_UNKNOWN:
1749 default:
1750 drop_packet(skb);
1751 break;
1757 static int handle_tcp_options(struct nes_cm_node *cm_node, struct tcphdr *tcph,
1758 struct sk_buff *skb, int optionsize, int passive)
1760 u8 *optionsloc = (u8 *)&tcph[1];
1761 if (optionsize) {
1762 if (process_options(cm_node, optionsloc, optionsize,
1763 (u32)tcph->syn)) {
1764 nes_debug(NES_DBG_CM, "%s: Node %p, Sending RESET\n",
1765 __func__, cm_node);
1766 if (passive)
1767 passive_open_err(cm_node, skb, 1);
1768 else
1769 active_open_err(cm_node, skb, 1);
1770 return 1;
1774 cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
1775 cm_node->tcp_cntxt.snd_wscale;
1777 if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
1778 cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
1779 return 0;
1783 * active_open_err() will send reset() if flag set..
1784 * It will also send ABORT event.
1787 static void active_open_err(struct nes_cm_node *cm_node, struct sk_buff *skb,
1788 int reset)
1790 cleanup_retrans_entry(cm_node);
1791 if (reset) {
1792 nes_debug(NES_DBG_CM, "ERROR active err called for cm_node=%p, "
1793 "state=%d\n", cm_node, cm_node->state);
1794 add_ref_cm_node(cm_node);
1795 send_reset(cm_node, skb);
1796 } else
1797 dev_kfree_skb_any(skb);
1799 cm_node->state = NES_CM_STATE_CLOSED;
1800 create_event(cm_node, NES_CM_EVENT_ABORTED);
1804 * passive_open_err() will either do a reset() or will free up the skb and
1805 * remove the cm_node.
1808 static void passive_open_err(struct nes_cm_node *cm_node, struct sk_buff *skb,
1809 int reset)
1811 cleanup_retrans_entry(cm_node);
1812 cm_node->state = NES_CM_STATE_CLOSED;
1813 if (reset) {
1814 nes_debug(NES_DBG_CM, "passive_open_err sending RST for "
1815 "cm_node=%p state =%d\n", cm_node, cm_node->state);
1816 send_reset(cm_node, skb);
1817 } else {
1818 dev_kfree_skb_any(skb);
1819 rem_ref_cm_node(cm_node->cm_core, cm_node);
1824 * free_retrans_entry() routines assumes that the retrans_list_lock has
1825 * been acquired before calling.
1827 static void free_retrans_entry(struct nes_cm_node *cm_node)
1829 struct nes_timer_entry *send_entry;
1830 send_entry = cm_node->send_entry;
1831 if (send_entry) {
1832 cm_node->send_entry = NULL;
1833 dev_kfree_skb_any(send_entry->skb);
1834 kfree(send_entry);
1835 rem_ref_cm_node(cm_node->cm_core, cm_node);
1839 static void cleanup_retrans_entry(struct nes_cm_node *cm_node)
1841 unsigned long flags;
1843 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1844 free_retrans_entry(cm_node);
1845 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1849 * process_packet
1850 * Returns skb if to be freed, else it will return NULL if already used..
1852 static void process_packet(struct nes_cm_node *cm_node, struct sk_buff *skb,
1853 struct nes_cm_core *cm_core)
1855 enum nes_tcpip_pkt_type pkt_type = NES_PKT_TYPE_UNKNOWN;
1856 struct tcphdr *tcph = tcp_hdr(skb);
1857 u32 fin_set = 0;
1858 skb_pull(skb, ip_hdr(skb)->ihl << 2);
1860 nes_debug(NES_DBG_CM, "process_packet: cm_node=%p state =%d syn=%d "
1861 "ack=%d rst=%d fin=%d\n", cm_node, cm_node->state, tcph->syn,
1862 tcph->ack, tcph->rst, tcph->fin);
1864 if (tcph->rst)
1865 pkt_type = NES_PKT_TYPE_RST;
1866 else if (tcph->syn) {
1867 pkt_type = NES_PKT_TYPE_SYN;
1868 if (tcph->ack)
1869 pkt_type = NES_PKT_TYPE_SYNACK;
1870 } else if (tcph->ack)
1871 pkt_type = NES_PKT_TYPE_ACK;
1872 if (tcph->fin)
1873 fin_set = 1;
1875 switch (pkt_type) {
1876 case NES_PKT_TYPE_SYN:
1877 handle_syn_pkt(cm_node, skb, tcph);
1878 break;
1879 case NES_PKT_TYPE_SYNACK:
1880 handle_synack_pkt(cm_node, skb, tcph);
1881 break;
1882 case NES_PKT_TYPE_ACK:
1883 handle_ack_pkt(cm_node, skb, tcph);
1884 if (fin_set)
1885 handle_fin_pkt(cm_node);
1886 break;
1887 case NES_PKT_TYPE_RST:
1888 handle_rst_pkt(cm_node, skb, tcph);
1889 break;
1890 default:
1891 drop_packet(skb);
1892 if (fin_set)
1893 handle_fin_pkt(cm_node);
1894 break;
1899 * mini_cm_listen - create a listen node with params
1901 static struct nes_cm_listener *mini_cm_listen(struct nes_cm_core *cm_core,
1902 struct nes_vnic *nesvnic, struct nes_cm_info *cm_info)
1904 struct nes_cm_listener *listener;
1905 unsigned long flags;
1907 nes_debug(NES_DBG_CM, "Search for 0x%08x : 0x%04x\n",
1908 cm_info->loc_addr, cm_info->loc_port);
1910 /* cannot have multiple matching listeners */
1911 listener = find_listener(cm_core, htonl(cm_info->loc_addr),
1912 htons(cm_info->loc_port), NES_CM_LISTENER_EITHER_STATE);
1913 if (listener && listener->listener_state == NES_CM_LISTENER_ACTIVE_STATE) {
1914 /* find automatically incs ref count ??? */
1915 atomic_dec(&listener->ref_count);
1916 nes_debug(NES_DBG_CM, "Not creating listener since it already exists\n");
1917 return NULL;
1920 if (!listener) {
1921 /* create a CM listen node (1/2 node to compare incoming traffic to) */
1922 listener = kzalloc(sizeof(*listener), GFP_ATOMIC);
1923 if (!listener) {
1924 nes_debug(NES_DBG_CM, "Not creating listener memory allocation failed\n");
1925 return NULL;
1928 listener->loc_addr = htonl(cm_info->loc_addr);
1929 listener->loc_port = htons(cm_info->loc_port);
1930 listener->reused_node = 0;
1932 atomic_set(&listener->ref_count, 1);
1934 /* pasive case */
1935 /* find already inc'ed the ref count */
1936 else {
1937 listener->reused_node = 1;
1940 listener->cm_id = cm_info->cm_id;
1941 atomic_set(&listener->pend_accepts_cnt, 0);
1942 listener->cm_core = cm_core;
1943 listener->nesvnic = nesvnic;
1944 atomic_inc(&cm_core->node_cnt);
1946 listener->conn_type = cm_info->conn_type;
1947 listener->backlog = cm_info->backlog;
1948 listener->listener_state = NES_CM_LISTENER_ACTIVE_STATE;
1950 if (!listener->reused_node) {
1951 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1952 list_add(&listener->list, &cm_core->listen_list.list);
1953 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1954 atomic_inc(&cm_core->listen_node_cnt);
1957 nes_debug(NES_DBG_CM, "Api - listen(): addr=0x%08X, port=0x%04x,"
1958 " listener = %p, backlog = %d, cm_id = %p.\n",
1959 cm_info->loc_addr, cm_info->loc_port,
1960 listener, listener->backlog, listener->cm_id);
1962 return listener;
1967 * mini_cm_connect - make a connection node with params
1969 static struct nes_cm_node *mini_cm_connect(struct nes_cm_core *cm_core,
1970 struct nes_vnic *nesvnic, u16 private_data_len,
1971 void *private_data, struct nes_cm_info *cm_info)
1973 int ret = 0;
1974 struct nes_cm_node *cm_node;
1975 struct nes_cm_listener *loopbackremotelistener;
1976 struct nes_cm_node *loopbackremotenode;
1977 struct nes_cm_info loopback_cm_info;
1978 u16 mpa_frame_size = sizeof(struct ietf_mpa_frame) + private_data_len;
1979 struct ietf_mpa_frame *mpa_frame = NULL;
1981 /* create a CM connection node */
1982 cm_node = make_cm_node(cm_core, nesvnic, cm_info, NULL);
1983 if (!cm_node)
1984 return NULL;
1985 mpa_frame = &cm_node->mpa_frame;
1986 strcpy(mpa_frame->key, IEFT_MPA_KEY_REQ);
1987 mpa_frame->flags = IETF_MPA_FLAGS_CRC;
1988 mpa_frame->rev = IETF_MPA_VERSION;
1989 mpa_frame->priv_data_len = htons(private_data_len);
1991 /* set our node side to client (active) side */
1992 cm_node->tcp_cntxt.client = 1;
1993 cm_node->tcp_cntxt.rcv_wscale = NES_CM_DEFAULT_RCV_WND_SCALE;
1995 if (cm_info->loc_addr == cm_info->rem_addr) {
1996 loopbackremotelistener = find_listener(cm_core,
1997 ntohl(nesvnic->local_ipaddr), cm_node->rem_port,
1998 NES_CM_LISTENER_ACTIVE_STATE);
1999 if (loopbackremotelistener == NULL) {
2000 create_event(cm_node, NES_CM_EVENT_ABORTED);
2001 } else {
2002 atomic_inc(&cm_loopbacks);
2003 loopback_cm_info = *cm_info;
2004 loopback_cm_info.loc_port = cm_info->rem_port;
2005 loopback_cm_info.rem_port = cm_info->loc_port;
2006 loopback_cm_info.cm_id = loopbackremotelistener->cm_id;
2007 loopbackremotenode = make_cm_node(cm_core, nesvnic,
2008 &loopback_cm_info, loopbackremotelistener);
2009 loopbackremotenode->loopbackpartner = cm_node;
2010 loopbackremotenode->tcp_cntxt.rcv_wscale =
2011 NES_CM_DEFAULT_RCV_WND_SCALE;
2012 cm_node->loopbackpartner = loopbackremotenode;
2013 memcpy(loopbackremotenode->mpa_frame_buf, private_data,
2014 private_data_len);
2015 loopbackremotenode->mpa_frame_size = private_data_len;
2017 /* we are done handling this state. */
2018 /* set node to a TSA state */
2019 cm_node->state = NES_CM_STATE_TSA;
2020 cm_node->tcp_cntxt.rcv_nxt =
2021 loopbackremotenode->tcp_cntxt.loc_seq_num;
2022 loopbackremotenode->tcp_cntxt.rcv_nxt =
2023 cm_node->tcp_cntxt.loc_seq_num;
2024 cm_node->tcp_cntxt.max_snd_wnd =
2025 loopbackremotenode->tcp_cntxt.rcv_wnd;
2026 loopbackremotenode->tcp_cntxt.max_snd_wnd =
2027 cm_node->tcp_cntxt.rcv_wnd;
2028 cm_node->tcp_cntxt.snd_wnd =
2029 loopbackremotenode->tcp_cntxt.rcv_wnd;
2030 loopbackremotenode->tcp_cntxt.snd_wnd =
2031 cm_node->tcp_cntxt.rcv_wnd;
2032 cm_node->tcp_cntxt.snd_wscale =
2033 loopbackremotenode->tcp_cntxt.rcv_wscale;
2034 loopbackremotenode->tcp_cntxt.snd_wscale =
2035 cm_node->tcp_cntxt.rcv_wscale;
2036 loopbackremotenode->state = NES_CM_STATE_MPAREQ_RCVD;
2037 create_event(loopbackremotenode, NES_CM_EVENT_MPA_REQ);
2039 return cm_node;
2042 /* set our node side to client (active) side */
2043 cm_node->tcp_cntxt.client = 1;
2044 /* init our MPA frame ptr */
2045 memcpy(mpa_frame->priv_data, private_data, private_data_len);
2047 cm_node->mpa_frame_size = mpa_frame_size;
2049 /* send a syn and goto syn sent state */
2050 cm_node->state = NES_CM_STATE_SYN_SENT;
2051 ret = send_syn(cm_node, 0, NULL);
2053 if (ret) {
2054 /* error in sending the syn free up the cm_node struct */
2055 nes_debug(NES_DBG_CM, "Api - connect() FAILED: dest "
2056 "addr=0x%08X, port=0x%04x, cm_node=%p, cm_id = %p.\n",
2057 cm_node->rem_addr, cm_node->rem_port, cm_node,
2058 cm_node->cm_id);
2059 rem_ref_cm_node(cm_node->cm_core, cm_node);
2060 cm_node = NULL;
2063 if (cm_node)
2064 nes_debug(NES_DBG_CM, "Api - connect(): dest addr=0x%08X,"
2065 "port=0x%04x, cm_node=%p, cm_id = %p.\n",
2066 cm_node->rem_addr, cm_node->rem_port, cm_node,
2067 cm_node->cm_id);
2069 return cm_node;
/**
 * mini_cm_accept - accept a connection
 *
 * This function is never called; it does nothing and returns 0.
 */
static int mini_cm_accept(struct nes_cm_core *cm_core,
	struct ietf_mpa_frame *mpa_frame, struct nes_cm_node *cm_node)
{
	return 0;
}
2085 * mini_cm_reject - reject and teardown a connection
2087 static int mini_cm_reject(struct nes_cm_core *cm_core,
2088 struct ietf_mpa_frame *mpa_frame, struct nes_cm_node *cm_node)
2090 int ret = 0;
2091 int err = 0;
2092 int passive_state;
2093 struct nes_cm_event event;
2094 struct iw_cm_id *cm_id = cm_node->cm_id;
2095 struct nes_cm_node *loopback = cm_node->loopbackpartner;
2097 nes_debug(NES_DBG_CM, "%s cm_node=%p type=%d state=%d\n",
2098 __func__, cm_node, cm_node->tcp_cntxt.client, cm_node->state);
2100 if (cm_node->tcp_cntxt.client)
2101 return ret;
2102 cleanup_retrans_entry(cm_node);
2104 if (!loopback) {
2105 passive_state = atomic_add_return(1, &cm_node->passive_state);
2106 if (passive_state == NES_SEND_RESET_EVENT) {
2107 cm_node->state = NES_CM_STATE_CLOSED;
2108 rem_ref_cm_node(cm_core, cm_node);
2109 } else {
2110 ret = send_mpa_reject(cm_node);
2111 if (ret) {
2112 cm_node->state = NES_CM_STATE_CLOSED;
2113 err = send_reset(cm_node, NULL);
2114 if (err)
2115 WARN_ON(1);
2116 } else
2117 cm_id->add_ref(cm_id);
2119 } else {
2120 cm_node->cm_id = NULL;
2121 event.cm_node = loopback;
2122 event.cm_info.rem_addr = loopback->rem_addr;
2123 event.cm_info.loc_addr = loopback->loc_addr;
2124 event.cm_info.rem_port = loopback->rem_port;
2125 event.cm_info.loc_port = loopback->loc_port;
2126 event.cm_info.cm_id = loopback->cm_id;
2127 cm_event_mpa_reject(&event);
2128 rem_ref_cm_node(cm_core, cm_node);
2129 loopback->state = NES_CM_STATE_CLOSING;
2131 cm_id = loopback->cm_id;
2132 rem_ref_cm_node(cm_core, loopback);
2133 cm_id->rem_ref(cm_id);
2136 return ret;
2141 * mini_cm_close
2143 static int mini_cm_close(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
2145 int ret = 0;
2147 if (!cm_core || !cm_node)
2148 return -EINVAL;
2150 switch (cm_node->state) {
2151 case NES_CM_STATE_SYN_RCVD:
2152 case NES_CM_STATE_SYN_SENT:
2153 case NES_CM_STATE_ONE_SIDE_ESTABLISHED:
2154 case NES_CM_STATE_ESTABLISHED:
2155 case NES_CM_STATE_ACCEPTING:
2156 case NES_CM_STATE_MPAREQ_SENT:
2157 case NES_CM_STATE_MPAREQ_RCVD:
2158 cleanup_retrans_entry(cm_node);
2159 send_reset(cm_node, NULL);
2160 break;
2161 case NES_CM_STATE_CLOSE_WAIT:
2162 cm_node->state = NES_CM_STATE_LAST_ACK;
2163 send_fin(cm_node, NULL);
2164 break;
2165 case NES_CM_STATE_FIN_WAIT1:
2166 case NES_CM_STATE_FIN_WAIT2:
2167 case NES_CM_STATE_LAST_ACK:
2168 case NES_CM_STATE_TIME_WAIT:
2169 case NES_CM_STATE_CLOSING:
2170 ret = -1;
2171 break;
2172 case NES_CM_STATE_MPAREJ_RCVD:
2173 case NES_CM_STATE_LISTENING:
2174 case NES_CM_STATE_UNKNOWN:
2175 case NES_CM_STATE_INITED:
2176 case NES_CM_STATE_CLOSED:
2177 ret = rem_ref_cm_node(cm_core, cm_node);
2178 break;
2179 case NES_CM_STATE_TSA:
2180 if (cm_node->send_entry)
2181 printk(KERN_ERR "ERROR Close got called from STATE_TSA "
2182 "send_entry=%p\n", cm_node->send_entry);
2183 ret = rem_ref_cm_node(cm_core, cm_node);
2184 break;
2186 return ret;
2191 * recv_pkt - recv an ETHERNET packet, and process it through CM
2192 * node state machine
2194 static int mini_cm_recv_pkt(struct nes_cm_core *cm_core,
2195 struct nes_vnic *nesvnic, struct sk_buff *skb)
2197 struct nes_cm_node *cm_node = NULL;
2198 struct nes_cm_listener *listener = NULL;
2199 struct iphdr *iph;
2200 struct tcphdr *tcph;
2201 struct nes_cm_info nfo;
2202 int skb_handled = 1;
2203 __be32 tmp_daddr, tmp_saddr;
2205 if (!skb)
2206 return 0;
2207 if (skb->len < sizeof(struct iphdr) + sizeof(struct tcphdr)) {
2208 return 0;
2211 iph = (struct iphdr *)skb->data;
2212 tcph = (struct tcphdr *)(skb->data + sizeof(struct iphdr));
2214 nfo.loc_addr = ntohl(iph->daddr);
2215 nfo.loc_port = ntohs(tcph->dest);
2216 nfo.rem_addr = ntohl(iph->saddr);
2217 nfo.rem_port = ntohs(tcph->source);
2219 tmp_daddr = cpu_to_be32(iph->daddr);
2220 tmp_saddr = cpu_to_be32(iph->saddr);
2222 nes_debug(NES_DBG_CM, "Received packet: dest=%pI4:0x%04X src=%pI4:0x%04X\n",
2223 &tmp_daddr, tcph->dest, &tmp_saddr, tcph->source);
2225 do {
2226 cm_node = find_node(cm_core,
2227 nfo.rem_port, nfo.rem_addr,
2228 nfo.loc_port, nfo.loc_addr);
2230 if (!cm_node) {
2231 /* Only type of packet accepted are for */
2232 /* the PASSIVE open (syn only) */
2233 if ((!tcph->syn) || (tcph->ack)) {
2234 skb_handled = 0;
2235 break;
2237 listener = find_listener(cm_core, nfo.loc_addr,
2238 nfo.loc_port,
2239 NES_CM_LISTENER_ACTIVE_STATE);
2240 if (!listener) {
2241 nfo.cm_id = NULL;
2242 nfo.conn_type = 0;
2243 nes_debug(NES_DBG_CM, "Unable to find listener for the pkt\n");
2244 skb_handled = 0;
2245 break;
2247 nfo.cm_id = listener->cm_id;
2248 nfo.conn_type = listener->conn_type;
2249 cm_node = make_cm_node(cm_core, nesvnic, &nfo,
2250 listener);
2251 if (!cm_node) {
2252 nes_debug(NES_DBG_CM, "Unable to allocate "
2253 "node\n");
2254 cm_packets_dropped++;
2255 atomic_dec(&listener->ref_count);
2256 dev_kfree_skb_any(skb);
2257 break;
2259 if (!tcph->rst && !tcph->fin) {
2260 cm_node->state = NES_CM_STATE_LISTENING;
2261 } else {
2262 cm_packets_dropped++;
2263 rem_ref_cm_node(cm_core, cm_node);
2264 dev_kfree_skb_any(skb);
2265 break;
2267 add_ref_cm_node(cm_node);
2268 } else if (cm_node->state == NES_CM_STATE_TSA) {
2269 rem_ref_cm_node(cm_core, cm_node);
2270 atomic_inc(&cm_accel_dropped_pkts);
2271 dev_kfree_skb_any(skb);
2272 break;
2274 skb_reset_network_header(skb);
2275 skb_set_transport_header(skb, sizeof(*tcph));
2276 skb->len = ntohs(iph->tot_len);
2277 process_packet(cm_node, skb, cm_core);
2278 rem_ref_cm_node(cm_core, cm_node);
2279 } while (0);
2280 return skb_handled;
2285 * nes_cm_alloc_core - allocate a top level instance of a cm core
2287 static struct nes_cm_core *nes_cm_alloc_core(void)
2289 struct nes_cm_core *cm_core;
2291 /* setup the CM core */
2292 /* alloc top level core control structure */
2293 cm_core = kzalloc(sizeof(*cm_core), GFP_KERNEL);
2294 if (!cm_core)
2295 return NULL;
2297 INIT_LIST_HEAD(&cm_core->connected_nodes);
2298 init_timer(&cm_core->tcp_timer);
2299 cm_core->tcp_timer.function = nes_cm_timer_tick;
2301 cm_core->mtu = NES_CM_DEFAULT_MTU;
2302 cm_core->state = NES_CM_STATE_INITED;
2303 cm_core->free_tx_pkt_max = NES_CM_DEFAULT_FREE_PKTS;
2305 atomic_set(&cm_core->events_posted, 0);
2307 cm_core->api = &nes_cm_api;
2309 spin_lock_init(&cm_core->ht_lock);
2310 spin_lock_init(&cm_core->listen_list_lock);
2312 INIT_LIST_HEAD(&cm_core->listen_list.list);
2314 nes_debug(NES_DBG_CM, "Init CM Core completed -- cm_core=%p\n", cm_core);
2316 nes_debug(NES_DBG_CM, "Enable QUEUE EVENTS\n");
2317 cm_core->event_wq = create_singlethread_workqueue("nesewq");
2318 cm_core->post_event = nes_cm_post_event;
2319 nes_debug(NES_DBG_CM, "Enable QUEUE DISCONNECTS\n");
2320 cm_core->disconn_wq = create_singlethread_workqueue("nesdwq");
2322 print_core(cm_core);
2323 return cm_core;
2328 * mini_cm_dealloc_core - deallocate a top level instance of a cm core
2330 static int mini_cm_dealloc_core(struct nes_cm_core *cm_core)
2332 nes_debug(NES_DBG_CM, "De-Alloc CM Core (%p)\n", cm_core);
2334 if (!cm_core)
2335 return -EINVAL;
2337 barrier();
2339 if (timer_pending(&cm_core->tcp_timer)) {
2340 del_timer(&cm_core->tcp_timer);
2343 destroy_workqueue(cm_core->event_wq);
2344 destroy_workqueue(cm_core->disconn_wq);
2345 nes_debug(NES_DBG_CM, "\n");
2346 kfree(cm_core);
2348 return 0;
2353 * mini_cm_get
2355 static int mini_cm_get(struct nes_cm_core *cm_core)
2357 return cm_core->state;
2362 * mini_cm_set
2364 static int mini_cm_set(struct nes_cm_core *cm_core, u32 type, u32 value)
2366 int ret = 0;
2368 switch (type) {
2369 case NES_CM_SET_PKT_SIZE:
2370 cm_core->mtu = value;
2371 break;
2372 case NES_CM_SET_FREE_PKT_Q_SIZE:
2373 cm_core->free_tx_pkt_max = value;
2374 break;
2375 default:
2376 /* unknown set option */
2377 ret = -EINVAL;
2380 return ret;
2385 * nes_cm_init_tsa_conn setup HW; MPA frames must be
2386 * successfully exchanged when this is called
2388 static int nes_cm_init_tsa_conn(struct nes_qp *nesqp, struct nes_cm_node *cm_node)
2390 int ret = 0;
2392 if (!nesqp)
2393 return -EINVAL;
2395 nesqp->nesqp_context->misc |= cpu_to_le32(NES_QPCONTEXT_MISC_IPV4 |
2396 NES_QPCONTEXT_MISC_NO_NAGLE | NES_QPCONTEXT_MISC_DO_NOT_FRAG |
2397 NES_QPCONTEXT_MISC_DROS);
2399 if (cm_node->tcp_cntxt.snd_wscale || cm_node->tcp_cntxt.rcv_wscale)
2400 nesqp->nesqp_context->misc |= cpu_to_le32(NES_QPCONTEXT_MISC_WSCALE);
2402 nesqp->nesqp_context->misc2 |= cpu_to_le32(64 << NES_QPCONTEXT_MISC2_TTL_SHIFT);
2404 nesqp->nesqp_context->mss |= cpu_to_le32(((u32)cm_node->tcp_cntxt.mss) << 16);
2406 nesqp->nesqp_context->tcp_state_flow_label |= cpu_to_le32(
2407 (u32)NES_QPCONTEXT_TCPSTATE_EST << NES_QPCONTEXT_TCPFLOW_TCP_STATE_SHIFT);
2409 nesqp->nesqp_context->pd_index_wscale |= cpu_to_le32(
2410 (cm_node->tcp_cntxt.snd_wscale << NES_QPCONTEXT_PDWSCALE_SND_WSCALE_SHIFT) &
2411 NES_QPCONTEXT_PDWSCALE_SND_WSCALE_MASK);
2413 nesqp->nesqp_context->pd_index_wscale |= cpu_to_le32(
2414 (cm_node->tcp_cntxt.rcv_wscale << NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_SHIFT) &
2415 NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_MASK);
2417 nesqp->nesqp_context->keepalive = cpu_to_le32(0x80);
2418 nesqp->nesqp_context->ts_recent = 0;
2419 nesqp->nesqp_context->ts_age = 0;
2420 nesqp->nesqp_context->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2421 nesqp->nesqp_context->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
2422 nesqp->nesqp_context->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
2423 nesqp->nesqp_context->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
2424 cm_node->tcp_cntxt.rcv_wscale);
2425 nesqp->nesqp_context->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2426 nesqp->nesqp_context->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2427 nesqp->nesqp_context->srtt = 0;
2428 nesqp->nesqp_context->rttvar = cpu_to_le32(0x6);
2429 nesqp->nesqp_context->ssthresh = cpu_to_le32(0x3FFFC000);
2430 nesqp->nesqp_context->cwnd = cpu_to_le32(2*cm_node->tcp_cntxt.mss);
2431 nesqp->nesqp_context->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
2432 nesqp->nesqp_context->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2433 nesqp->nesqp_context->max_snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
2435 nes_debug(NES_DBG_CM, "QP%u: rcv_nxt = 0x%08X, snd_nxt = 0x%08X,"
2436 " Setting MSS to %u, PDWscale = 0x%08X, rcv_wnd = %u, context misc = 0x%08X.\n",
2437 nesqp->hwqp.qp_id, le32_to_cpu(nesqp->nesqp_context->rcv_nxt),
2438 le32_to_cpu(nesqp->nesqp_context->snd_nxt),
2439 cm_node->tcp_cntxt.mss, le32_to_cpu(nesqp->nesqp_context->pd_index_wscale),
2440 le32_to_cpu(nesqp->nesqp_context->rcv_wnd),
2441 le32_to_cpu(nesqp->nesqp_context->misc));
2442 nes_debug(NES_DBG_CM, " snd_wnd = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->snd_wnd));
2443 nes_debug(NES_DBG_CM, " snd_cwnd = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->cwnd));
2444 nes_debug(NES_DBG_CM, " max_swnd = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->max_snd_wnd));
2446 nes_debug(NES_DBG_CM, "Change cm_node state to TSA\n");
2447 cm_node->state = NES_CM_STATE_TSA;
2449 return ret;
2454 * nes_cm_disconn
2456 int nes_cm_disconn(struct nes_qp *nesqp)
2458 unsigned long flags;
2460 spin_lock_irqsave(&nesqp->lock, flags);
2461 if (nesqp->disconn_pending == 0) {
2462 nesqp->disconn_pending++;
2463 spin_unlock_irqrestore(&nesqp->lock, flags);
2464 /* init our disconnect work element, to */
2465 INIT_WORK(&nesqp->disconn_work, nes_disconnect_worker);
2467 queue_work(g_cm_core->disconn_wq, &nesqp->disconn_work);
2468 } else
2469 spin_unlock_irqrestore(&nesqp->lock, flags);
2471 return 0;
2476 * nes_disconnect_worker
2478 static void nes_disconnect_worker(struct work_struct *work)
2480 struct nes_qp *nesqp = container_of(work, struct nes_qp, disconn_work);
2482 nes_debug(NES_DBG_CM, "processing AEQE id 0x%04X for QP%u.\n",
2483 nesqp->last_aeq, nesqp->hwqp.qp_id);
2484 nes_cm_disconn_true(nesqp);
2489 * nes_cm_disconn_true
/*
 * nes_cm_disconn_true - deliver disconnect/close events for a QP.
 *
 * Under nesqp->lock it snapshots the hardware TCP state, the IB QP state
 * and the last asynchronous event, then:
 *   - sends IW_CM_EVENT_DISCONNECT when the hardware is in CLOSE_WAIT or an
 *     RTS QP saw a connection reset;
 *   - re-reads the state and, for CLOSED/TIME_WAIT or a bad-close/reset
 *     event, detaches the cm_id from the QP, calls nes_disconnect(),
 *     sends IW_CM_EVENT_CLOSE, drops the cm_id reference and flushes the
 *     receive queue once.
 * The lock is released around every event_handler() call and re-taken
 * afterwards, so the statement order below is significant.
 *
 * Returns -1 when nesqp is NULL or has no cm_id, 0 otherwise (results of
 * the event handlers are only logged).
 */
2491 static int nes_cm_disconn_true(struct nes_qp *nesqp)
2493 unsigned long flags;
2494 int ret = 0;
2495 struct iw_cm_id *cm_id;
2496 struct iw_cm_event cm_event;
2497 struct nes_vnic *nesvnic;
2498 u16 last_ae;
2499 u8 original_hw_tcp_state;
2500 u8 original_ibqp_state;
/* never modified in this function, so the "== 0" test further down always holds */
2501 u8 issued_disconnect_reset = 0;
2503 if (!nesqp) {
2504 nes_debug(NES_DBG_CM, "disconnect_worker nesqp is NULL\n");
2505 return -1;
2508 spin_lock_irqsave(&nesqp->lock, flags);
2509 cm_id = nesqp->cm_id;
2510 /* make sure we havent already closed this connection */
2511 if (!cm_id) {
2512 nes_debug(NES_DBG_CM, "QP%u disconnect_worker cmid is NULL\n",
2513 nesqp->hwqp.qp_id);
2514 spin_unlock_irqrestore(&nesqp->lock, flags);
2515 return -1;
2518 nesvnic = to_nesvnic(nesqp->ibqp.device);
2519 nes_debug(NES_DBG_CM, "Disconnecting QP%u\n", nesqp->hwqp.qp_id);
/* snapshot the state while the lock is held */
2521 original_hw_tcp_state = nesqp->hw_tcp_state;
2522 original_ibqp_state = nesqp->ibqp_state;
2523 last_ae = nesqp->last_aeq;
2526 nes_debug(NES_DBG_CM, "set ibqp_state=%u\n", nesqp->ibqp_state);
2528 if ((nesqp->cm_id) && (cm_id->event_handler)) {
/* step 1: report a disconnect for CLOSE_WAIT or a reset seen while in RTS */
2529 if ((original_hw_tcp_state == NES_AEQE_TCP_STATE_CLOSE_WAIT) ||
2530 ((original_ibqp_state == IB_QPS_RTS) &&
2531 (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET))) {
2532 atomic_inc(&cm_disconnects);
2533 cm_event.event = IW_CM_EVENT_DISCONNECT;
2534 if (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET) {
2535 cm_event.status = IW_CM_EVENT_STATUS_RESET;
2536 nes_debug(NES_DBG_CM, "Generating a CM "
2537 "Disconnect Event (status reset) for "
2538 "QP%u, cm_id = %p. \n",
2539 nesqp->hwqp.qp_id, cm_id);
2540 } else
2541 cm_event.status = IW_CM_EVENT_STATUS_OK;
/* NOTE(review): cm_event.provider_data is not set for this event */
2543 cm_event.local_addr = cm_id->local_addr;
2544 cm_event.remote_addr = cm_id->remote_addr;
2545 cm_event.private_data = NULL;
2546 cm_event.private_data_len = 0;
2548 nes_debug(NES_DBG_CM, "Generating a CM Disconnect Event"
2549 " for QP%u, SQ Head = %u, SQ Tail = %u. "
2550 "cm_id = %p, refcount = %u.\n",
2551 nesqp->hwqp.qp_id, nesqp->hwqp.sq_head,
2552 nesqp->hwqp.sq_tail, cm_id,
2553 atomic_read(&nesqp->refcount));
/* the handler is called without the QP lock; the lock is re-taken right after */
2555 spin_unlock_irqrestore(&nesqp->lock, flags);
2556 ret = cm_id->event_handler(cm_id, &cm_event);
2557 if (ret)
2558 nes_debug(NES_DBG_CM, "OFA CM event_handler "
2559 "returned, ret=%d\n", ret);
2560 spin_lock_irqsave(&nesqp->lock, flags);
/* from here on nes_cm_disconn() may queue this work again */
2563 nesqp->disconn_pending = 0;
2564 /* There might have been another AE while the lock was released */
2565 original_hw_tcp_state = nesqp->hw_tcp_state;
2566 original_ibqp_state = nesqp->ibqp_state;
2567 last_ae = nesqp->last_aeq;
/* step 2: close the connection when the refreshed state calls for it */
2569 if ((issued_disconnect_reset == 0) && (nesqp->cm_id) &&
2570 ((original_hw_tcp_state == NES_AEQE_TCP_STATE_CLOSED) ||
2571 (original_hw_tcp_state == NES_AEQE_TCP_STATE_TIME_WAIT) ||
2572 (last_ae == NES_AEQE_AEID_RDMAP_ROE_BAD_LLP_CLOSE) ||
2573 (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET))) {
2574 atomic_inc(&cm_closes);
/* detach the cm_id from the QP; the local cm_id copy is still used below */
2575 nesqp->cm_id = NULL;
2576 nesqp->in_disconnect = 0;
2577 spin_unlock_irqrestore(&nesqp->lock, flags);
2578 nes_disconnect(nesqp, 1);
2580 cm_id->provider_data = nesqp;
2581 /* Send up the close complete event */
2582 cm_event.event = IW_CM_EVENT_CLOSE;
2583 cm_event.status = IW_CM_EVENT_STATUS_OK;
2584 cm_event.provider_data = cm_id->provider_data;
2585 cm_event.local_addr = cm_id->local_addr;
2586 cm_event.remote_addr = cm_id->remote_addr;
2587 cm_event.private_data = NULL;
2588 cm_event.private_data_len = 0;
2590 ret = cm_id->event_handler(cm_id, &cm_event);
2591 if (ret) {
2592 nes_debug(NES_DBG_CM, "OFA CM event_handler returned, ret=%d\n", ret);
2595 cm_id->rem_ref(cm_id);
/* flush the receive queue once per QP; flush_issued is tested and set under the lock */
2597 spin_lock_irqsave(&nesqp->lock, flags);
2598 if (nesqp->flush_issued == 0) {
2599 nesqp->flush_issued = 1;
2600 spin_unlock_irqrestore(&nesqp->lock, flags);
2601 flush_wqes(nesvnic->nesdev, nesqp,
2602 NES_CQP_FLUSH_RQ, 1);
2603 } else
2604 spin_unlock_irqrestore(&nesqp->lock, flags);
2605 } else {
2606 cm_id = nesqp->cm_id;
2607 spin_unlock_irqrestore(&nesqp->lock, flags);
2608 /* check to see if the inbound reset beat the outbound reset */
/* only a debug message is emitted in this case */
2609 if ((!cm_id) && (last_ae==NES_AEQE_AEID_RESET_SENT)) {
2610 nes_debug(NES_DBG_CM, "QP%u: Decing refcount "
2611 "due to inbound reset beating the "
2612 "outbound reset.\n", nesqp->hwqp.qp_id);
2615 } else {
/* no event handler to notify: just clear the pending flag */
2616 nesqp->disconn_pending = 0;
2617 spin_unlock_irqrestore(&nesqp->lock, flags);
2620 return 0;
2625 * nes_disconnect
2627 static int nes_disconnect(struct nes_qp *nesqp, int abrupt)
2629 int ret = 0;
2630 struct nes_vnic *nesvnic;
2631 struct nes_device *nesdev;
2632 struct nes_ib_device *nesibdev;
2634 nesvnic = to_nesvnic(nesqp->ibqp.device);
2635 if (!nesvnic)
2636 return -EINVAL;
2638 nesdev = nesvnic->nesdev;
2639 nesibdev = nesvnic->nesibdev;
2641 nes_debug(NES_DBG_CM, "netdev refcnt = %u.\n",
2642 atomic_read(&nesvnic->netdev->refcnt));
2644 if (nesqp->active_conn) {
2646 /* indicate this connection is NOT active */
2647 nesqp->active_conn = 0;
2648 } else {
2649 /* Need to free the Last Streaming Mode Message */
2650 if (nesqp->ietf_frame) {
2651 if (nesqp->lsmm_mr)
2652 nesibdev->ibdev.dereg_mr(nesqp->lsmm_mr);
2653 pci_free_consistent(nesdev->pcidev,
2654 nesqp->private_data_len+sizeof(struct ietf_mpa_frame),
2655 nesqp->ietf_frame, nesqp->ietf_frame_pbase);
2659 /* close the CM node down if it is still active */
2660 if (nesqp->cm_node) {
2661 nes_debug(NES_DBG_CM, "Call close API\n");
2663 g_cm_core->api->close(g_cm_core, nesqp->cm_node);
2666 return ret;
2671 * nes_accept
2673 int nes_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
2675 u64 u64temp;
2676 struct ib_qp *ibqp;
2677 struct nes_qp *nesqp;
2678 struct nes_vnic *nesvnic;
2679 struct nes_device *nesdev;
2680 struct nes_cm_node *cm_node;
2681 struct nes_adapter *adapter;
2682 struct ib_qp_attr attr;
2683 struct iw_cm_event cm_event;
2684 struct nes_hw_qp_wqe *wqe;
2685 struct nes_v4_quad nes_quad;
2686 u32 crc_value;
2687 int ret;
2688 int passive_state;
2689 struct nes_ib_device *nesibdev;
2690 struct ib_mr *ibmr = NULL;
2691 struct ib_phys_buf ibphysbuf;
2692 struct nes_pd *nespd;
2696 ibqp = nes_get_qp(cm_id->device, conn_param->qpn);
2697 if (!ibqp)
2698 return -EINVAL;
2700 /* get all our handles */
2701 nesqp = to_nesqp(ibqp);
2702 nesvnic = to_nesvnic(nesqp->ibqp.device);
2703 nesdev = nesvnic->nesdev;
2704 adapter = nesdev->nesadapter;
2706 cm_node = (struct nes_cm_node *)cm_id->provider_data;
2707 nes_debug(NES_DBG_CM, "nes_accept: cm_node= %p nesvnic=%p, netdev=%p,"
2708 "%s\n", cm_node, nesvnic, nesvnic->netdev,
2709 nesvnic->netdev->name);
2711 /* associate the node with the QP */
2712 nesqp->cm_node = (void *)cm_node;
2713 cm_node->nesqp = nesqp;
2714 nes_add_ref(&nesqp->ibqp);
2716 nes_debug(NES_DBG_CM, "QP%u, cm_node=%p, jiffies = %lu listener = %p\n",
2717 nesqp->hwqp.qp_id, cm_node, jiffies, cm_node->listener);
2718 atomic_inc(&cm_accepts);
2720 nes_debug(NES_DBG_CM, "netdev refcnt = %u.\n",
2721 atomic_read(&nesvnic->netdev->refcnt));
2723 /* allocate the ietf frame and space for private data */
2724 nesqp->ietf_frame = pci_alloc_consistent(nesdev->pcidev,
2725 sizeof(struct ietf_mpa_frame) + conn_param->private_data_len,
2726 &nesqp->ietf_frame_pbase);
2728 if (!nesqp->ietf_frame) {
2729 nes_debug(NES_DBG_CM, "Unable to allocate memory for private "
2730 "data\n");
2731 return -ENOMEM;
2735 /* setup the MPA frame */
2736 nesqp->private_data_len = conn_param->private_data_len;
2737 memcpy(nesqp->ietf_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
2739 memcpy(nesqp->ietf_frame->priv_data, conn_param->private_data,
2740 conn_param->private_data_len);
2742 nesqp->ietf_frame->priv_data_len =
2743 cpu_to_be16(conn_param->private_data_len);
2744 nesqp->ietf_frame->rev = mpa_version;
2745 nesqp->ietf_frame->flags = IETF_MPA_FLAGS_CRC;
2747 /* setup our first outgoing iWarp send WQE (the IETF frame response) */
2748 wqe = &nesqp->hwqp.sq_vbase[0];
2750 if (cm_id->remote_addr.sin_addr.s_addr !=
2751 cm_id->local_addr.sin_addr.s_addr) {
2752 u64temp = (unsigned long)nesqp;
2753 nesibdev = nesvnic->nesibdev;
2754 nespd = nesqp->nespd;
2755 ibphysbuf.addr = nesqp->ietf_frame_pbase;
2756 ibphysbuf.size = conn_param->private_data_len +
2757 sizeof(struct ietf_mpa_frame);
2758 ibmr = nesibdev->ibdev.reg_phys_mr((struct ib_pd *)nespd,
2759 &ibphysbuf, 1,
2760 IB_ACCESS_LOCAL_WRITE,
2761 (u64 *)&nesqp->ietf_frame);
2762 if (!ibmr) {
2763 nes_debug(NES_DBG_CM, "Unable to register memory region"
2764 "for lSMM for cm_node = %p \n",
2765 cm_node);
2766 return -ENOMEM;
2769 ibmr->pd = &nespd->ibpd;
2770 ibmr->device = nespd->ibpd.device;
2771 nesqp->lsmm_mr = ibmr;
2773 u64temp |= NES_SW_CONTEXT_ALIGN>>1;
2774 set_wqe_64bit_value(wqe->wqe_words,
2775 NES_IWARP_SQ_WQE_COMP_CTX_LOW_IDX,
2776 u64temp);
2777 wqe->wqe_words[NES_IWARP_SQ_WQE_MISC_IDX] =
2778 cpu_to_le32(NES_IWARP_SQ_WQE_STREAMING |
2779 NES_IWARP_SQ_WQE_WRPDU);
2780 wqe->wqe_words[NES_IWARP_SQ_WQE_TOTAL_PAYLOAD_IDX] =
2781 cpu_to_le32(conn_param->private_data_len +
2782 sizeof(struct ietf_mpa_frame));
2783 set_wqe_64bit_value(wqe->wqe_words,
2784 NES_IWARP_SQ_WQE_FRAG0_LOW_IDX,
2785 (u64)nesqp->ietf_frame);
2786 wqe->wqe_words[NES_IWARP_SQ_WQE_LENGTH0_IDX] =
2787 cpu_to_le32(conn_param->private_data_len +
2788 sizeof(struct ietf_mpa_frame));
2789 wqe->wqe_words[NES_IWARP_SQ_WQE_STAG0_IDX] = ibmr->lkey;
2791 nesqp->nesqp_context->ird_ord_sizes |=
2792 cpu_to_le32(NES_QPCONTEXT_ORDIRD_LSMM_PRESENT |
2793 NES_QPCONTEXT_ORDIRD_WRPDU);
2794 } else {
2795 nesqp->nesqp_context->ird_ord_sizes |=
2796 cpu_to_le32(NES_QPCONTEXT_ORDIRD_WRPDU);
2798 nesqp->skip_lsmm = 1;
2801 /* Cache the cm_id in the qp */
2802 nesqp->cm_id = cm_id;
2803 cm_node->cm_id = cm_id;
2805 /* nesqp->cm_node = (void *)cm_id->provider_data; */
2806 cm_id->provider_data = nesqp;
2807 nesqp->active_conn = 0;
2809 if (cm_node->state == NES_CM_STATE_TSA)
2810 nes_debug(NES_DBG_CM, "Already state = TSA for cm_node=%p\n",
2811 cm_node);
2813 nes_cm_init_tsa_conn(nesqp, cm_node);
2815 nesqp->nesqp_context->tcpPorts[0] =
2816 cpu_to_le16(ntohs(cm_id->local_addr.sin_port));
2817 nesqp->nesqp_context->tcpPorts[1] =
2818 cpu_to_le16(ntohs(cm_id->remote_addr.sin_port));
2820 if (ipv4_is_loopback(cm_id->remote_addr.sin_addr.s_addr))
2821 nesqp->nesqp_context->ip0 =
2822 cpu_to_le32(ntohl(nesvnic->local_ipaddr));
2823 else
2824 nesqp->nesqp_context->ip0 =
2825 cpu_to_le32(ntohl(cm_id->remote_addr.sin_addr.s_addr));
2827 nesqp->nesqp_context->misc2 |= cpu_to_le32(
2828 (u32)PCI_FUNC(nesdev->pcidev->devfn) <<
2829 NES_QPCONTEXT_MISC2_SRC_IP_SHIFT);
2831 nesqp->nesqp_context->arp_index_vlan |=
2832 cpu_to_le32(nes_arp_table(nesdev,
2833 le32_to_cpu(nesqp->nesqp_context->ip0), NULL,
2834 NES_ARP_RESOLVE) << 16);
2836 nesqp->nesqp_context->ts_val_delta = cpu_to_le32(
2837 jiffies - nes_read_indexed(nesdev, NES_IDX_TCP_NOW));
2839 nesqp->nesqp_context->ird_index = cpu_to_le32(nesqp->hwqp.qp_id);
2841 nesqp->nesqp_context->ird_ord_sizes |= cpu_to_le32(
2842 ((u32)1 << NES_QPCONTEXT_ORDIRD_IWARP_MODE_SHIFT));
2843 nesqp->nesqp_context->ird_ord_sizes |=
2844 cpu_to_le32((u32)conn_param->ord);
2846 memset(&nes_quad, 0, sizeof(nes_quad));
2847 nes_quad.DstIpAdrIndex =
2848 cpu_to_le32((u32)PCI_FUNC(nesdev->pcidev->devfn) << 24);
2849 if (ipv4_is_loopback(cm_id->remote_addr.sin_addr.s_addr))
2850 nes_quad.SrcIpadr = nesvnic->local_ipaddr;
2851 else
2852 nes_quad.SrcIpadr = cm_id->remote_addr.sin_addr.s_addr;
2853 nes_quad.TcpPorts[0] = cm_id->remote_addr.sin_port;
2854 nes_quad.TcpPorts[1] = cm_id->local_addr.sin_port;
2856 /* Produce hash key */
2857 crc_value = get_crc_value(&nes_quad);
2858 nesqp->hte_index = cpu_to_be32(crc_value ^ 0xffffffff);
2859 nes_debug(NES_DBG_CM, "HTE Index = 0x%08X, CRC = 0x%08X\n",
2860 nesqp->hte_index, nesqp->hte_index & adapter->hte_index_mask);
2862 nesqp->hte_index &= adapter->hte_index_mask;
2863 nesqp->nesqp_context->hte_index = cpu_to_le32(nesqp->hte_index);
2865 cm_node->cm_core->api->accelerated(cm_node->cm_core, cm_node);
2867 nes_debug(NES_DBG_CM, "QP%u, Destination IP = 0x%08X:0x%04X, local = "
2868 "0x%08X:0x%04X, rcv_nxt=0x%08X, snd_nxt=0x%08X, mpa + "
2869 "private data length=%zu.\n", nesqp->hwqp.qp_id,
2870 ntohl(cm_id->remote_addr.sin_addr.s_addr),
2871 ntohs(cm_id->remote_addr.sin_port),
2872 ntohl(cm_id->local_addr.sin_addr.s_addr),
2873 ntohs(cm_id->local_addr.sin_port),
2874 le32_to_cpu(nesqp->nesqp_context->rcv_nxt),
2875 le32_to_cpu(nesqp->nesqp_context->snd_nxt),
2876 conn_param->private_data_len +
2877 sizeof(struct ietf_mpa_frame));
2880 /* notify OF layer that accept event was successful */
2881 cm_id->add_ref(cm_id);
2883 cm_event.event = IW_CM_EVENT_ESTABLISHED;
2884 cm_event.status = IW_CM_EVENT_STATUS_ACCEPTED;
2885 cm_event.provider_data = (void *)nesqp;
2886 cm_event.local_addr = cm_id->local_addr;
2887 cm_event.remote_addr = cm_id->remote_addr;
2888 cm_event.private_data = NULL;
2889 cm_event.private_data_len = 0;
2890 ret = cm_id->event_handler(cm_id, &cm_event);
2891 attr.qp_state = IB_QPS_RTS;
2892 nes_modify_qp(&nesqp->ibqp, &attr, IB_QP_STATE, NULL);
2893 if (cm_node->loopbackpartner) {
2894 cm_node->loopbackpartner->mpa_frame_size =
2895 nesqp->private_data_len;
2896 /* copy entire MPA frame to our cm_node's frame */
2897 memcpy(cm_node->loopbackpartner->mpa_frame_buf,
2898 nesqp->ietf_frame->priv_data, nesqp->private_data_len);
2899 create_event(cm_node->loopbackpartner, NES_CM_EVENT_CONNECTED);
2901 if (ret)
2902 printk(KERN_ERR "%s[%u] OFA CM event_handler returned, "
2903 "ret=%d\n", __func__, __LINE__, ret);
2905 passive_state = atomic_add_return(1, &cm_node->passive_state);
2906 if (passive_state == NES_SEND_RESET_EVENT)
2907 create_event(cm_node, NES_CM_EVENT_RESET);
2908 return 0;
2913 * nes_reject
2915 int nes_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
2917 struct nes_cm_node *cm_node;
2918 struct nes_cm_node *loopback;
2920 struct nes_cm_core *cm_core;
2922 atomic_inc(&cm_rejects);
2923 cm_node = (struct nes_cm_node *) cm_id->provider_data;
2924 loopback = cm_node->loopbackpartner;
2925 cm_core = cm_node->cm_core;
2926 cm_node->cm_id = cm_id;
2927 cm_node->mpa_frame_size = sizeof(struct ietf_mpa_frame) + pdata_len;
2929 if (cm_node->mpa_frame_size > MAX_CM_BUFFER)
2930 return -EINVAL;
2932 strcpy(&cm_node->mpa_frame.key[0], IEFT_MPA_KEY_REP);
2933 if (loopback) {
2934 memcpy(&loopback->mpa_frame.priv_data, pdata, pdata_len);
2935 loopback->mpa_frame.priv_data_len = pdata_len;
2936 loopback->mpa_frame_size = sizeof(struct ietf_mpa_frame) +
2937 pdata_len;
2938 } else {
2939 memcpy(&cm_node->mpa_frame.priv_data, pdata, pdata_len);
2940 cm_node->mpa_frame.priv_data_len = cpu_to_be16(pdata_len);
2943 cm_node->mpa_frame.rev = mpa_version;
2944 cm_node->mpa_frame.flags = IETF_MPA_FLAGS_CRC | IETF_MPA_FLAGS_REJECT;
2946 return cm_core->api->reject(cm_core, &cm_node->mpa_frame, cm_node);
2951 * nes_connect
2952 * setup and launch cm connect node
2954 int nes_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
2956 struct ib_qp *ibqp;
2957 struct nes_qp *nesqp;
2958 struct nes_vnic *nesvnic;
2959 struct nes_device *nesdev;
2960 struct nes_cm_node *cm_node;
2961 struct nes_cm_info cm_info;
2963 ibqp = nes_get_qp(cm_id->device, conn_param->qpn);
2964 if (!ibqp)
2965 return -EINVAL;
2966 nesqp = to_nesqp(ibqp);
2967 if (!nesqp)
2968 return -EINVAL;
2969 nesvnic = to_nesvnic(nesqp->ibqp.device);
2970 if (!nesvnic)
2971 return -EINVAL;
2972 nesdev = nesvnic->nesdev;
2973 if (!nesdev)
2974 return -EINVAL;
2976 nes_debug(NES_DBG_CM, "QP%u, current IP = 0x%08X, Destination IP = "
2977 "0x%08X:0x%04X, local = 0x%08X:0x%04X.\n", nesqp->hwqp.qp_id,
2978 ntohl(nesvnic->local_ipaddr),
2979 ntohl(cm_id->remote_addr.sin_addr.s_addr),
2980 ntohs(cm_id->remote_addr.sin_port),
2981 ntohl(cm_id->local_addr.sin_addr.s_addr),
2982 ntohs(cm_id->local_addr.sin_port));
2984 atomic_inc(&cm_connects);
2985 nesqp->active_conn = 1;
2987 /* cache the cm_id in the qp */
2988 nesqp->cm_id = cm_id;
2990 cm_id->provider_data = nesqp;
2992 nesqp->private_data_len = conn_param->private_data_len;
2993 nesqp->nesqp_context->ird_ord_sizes |= cpu_to_le32((u32)conn_param->ord);
2994 nes_debug(NES_DBG_CM, "requested ord = 0x%08X.\n", (u32)conn_param->ord);
2995 nes_debug(NES_DBG_CM, "mpa private data len =%u\n",
2996 conn_param->private_data_len);
2998 if (cm_id->local_addr.sin_addr.s_addr !=
2999 cm_id->remote_addr.sin_addr.s_addr)
3000 nes_manage_apbvt(nesvnic, ntohs(cm_id->local_addr.sin_port),
3001 PCI_FUNC(nesdev->pcidev->devfn), NES_MANAGE_APBVT_ADD);
3003 /* set up the connection params for the node */
3004 cm_info.loc_addr = htonl(cm_id->local_addr.sin_addr.s_addr);
3005 cm_info.loc_port = htons(cm_id->local_addr.sin_port);
3006 cm_info.rem_addr = htonl(cm_id->remote_addr.sin_addr.s_addr);
3007 cm_info.rem_port = htons(cm_id->remote_addr.sin_port);
3008 cm_info.cm_id = cm_id;
3009 cm_info.conn_type = NES_CM_IWARP_CONN_TYPE;
3011 cm_id->add_ref(cm_id);
3013 /* create a connect CM node connection */
3014 cm_node = g_cm_core->api->connect(g_cm_core, nesvnic,
3015 conn_param->private_data_len, (void *)conn_param->private_data,
3016 &cm_info);
3017 if (!cm_node) {
3018 if (cm_id->local_addr.sin_addr.s_addr !=
3019 cm_id->remote_addr.sin_addr.s_addr)
3020 nes_manage_apbvt(nesvnic, ntohs(cm_id->local_addr.sin_port),
3021 PCI_FUNC(nesdev->pcidev->devfn),
3022 NES_MANAGE_APBVT_DEL);
3024 cm_id->rem_ref(cm_id);
3025 return -ENOMEM;
3028 cm_node->apbvt_set = 1;
3029 nesqp->cm_node = cm_node;
3030 cm_node->nesqp = nesqp;
3031 nes_add_ref(&nesqp->ibqp);
3033 return 0;
3038 * nes_create_listen
3040 int nes_create_listen(struct iw_cm_id *cm_id, int backlog)
3042 struct nes_vnic *nesvnic;
3043 struct nes_cm_listener *cm_node;
3044 struct nes_cm_info cm_info;
3045 struct nes_adapter *adapter;
3046 int err;
3049 nes_debug(NES_DBG_CM, "cm_id = %p, local port = 0x%04X.\n",
3050 cm_id, ntohs(cm_id->local_addr.sin_port));
3052 nesvnic = to_nesvnic(cm_id->device);
3053 if (!nesvnic)
3054 return -EINVAL;
3055 adapter = nesvnic->nesdev->nesadapter;
3056 nes_debug(NES_DBG_CM, "nesvnic=%p, netdev=%p, %s\n",
3057 nesvnic, nesvnic->netdev, nesvnic->netdev->name);
3059 nes_debug(NES_DBG_CM, "nesvnic->local_ipaddr=0x%08x, sin_addr.s_addr=0x%08x\n",
3060 nesvnic->local_ipaddr, cm_id->local_addr.sin_addr.s_addr);
3062 /* setup listen params in our api call struct */
3063 cm_info.loc_addr = nesvnic->local_ipaddr;
3064 cm_info.loc_port = cm_id->local_addr.sin_port;
3065 cm_info.backlog = backlog;
3066 cm_info.cm_id = cm_id;
3068 cm_info.conn_type = NES_CM_IWARP_CONN_TYPE;
3071 cm_node = g_cm_core->api->listen(g_cm_core, nesvnic, &cm_info);
3072 if (!cm_node) {
3073 printk(KERN_ERR "%s[%u] Error returned from listen API call\n",
3074 __func__, __LINE__);
3075 return -ENOMEM;
3078 cm_id->provider_data = cm_node;
3080 if (!cm_node->reused_node) {
3081 err = nes_manage_apbvt(nesvnic,
3082 ntohs(cm_id->local_addr.sin_port),
3083 PCI_FUNC(nesvnic->nesdev->pcidev->devfn),
3084 NES_MANAGE_APBVT_ADD);
3085 if (err) {
3086 printk(KERN_ERR "nes_manage_apbvt call returned %d.\n",
3087 err);
3088 g_cm_core->api->stop_listener(g_cm_core, (void *)cm_node);
3089 return err;
3091 cm_listens_created++;
3094 cm_id->add_ref(cm_id);
3095 cm_id->provider_data = (void *)cm_node;
3098 return 0;
3103 * nes_destroy_listen
3105 int nes_destroy_listen(struct iw_cm_id *cm_id)
3107 if (cm_id->provider_data)
3108 g_cm_core->api->stop_listener(g_cm_core, cm_id->provider_data);
3109 else
3110 nes_debug(NES_DBG_CM, "cm_id->provider_data was NULL\n");
3112 cm_id->rem_ref(cm_id);
3114 return 0;
3119 * nes_cm_recv
3121 int nes_cm_recv(struct sk_buff *skb, struct net_device *netdevice)
3123 int rc = 0;
3124 cm_packets_received++;
3125 if ((g_cm_core) && (g_cm_core->api)) {
3126 rc = g_cm_core->api->recv_pkt(g_cm_core, netdev_priv(netdevice), skb);
3127 } else {
3128 nes_debug(NES_DBG_CM, "Unable to process packet for CM,"
3129 " cm is not setup properly.\n");
3132 return rc;
3137 * nes_cm_start
3138 * Start and init a cm core module
3140 int nes_cm_start(void)
3142 nes_debug(NES_DBG_CM, "\n");
3143 /* create the primary CM core, pass this handle to subsequent core inits */
3144 g_cm_core = nes_cm_alloc_core();
3145 if (g_cm_core) {
3146 return 0;
3147 } else {
3148 return -ENOMEM;
3154 * nes_cm_stop
3155 * stop and dealloc all cm core instances
3157 int nes_cm_stop(void)
3159 g_cm_core->api->destroy_cm_core(g_cm_core);
3160 return 0;
3165 * cm_event_connected
3166 * handle a connected event, setup QPs and HW
3168 static void cm_event_connected(struct nes_cm_event *event)
3170 u64 u64temp;
3171 struct nes_qp *nesqp;
3172 struct nes_vnic *nesvnic;
3173 struct nes_device *nesdev;
3174 struct nes_cm_node *cm_node;
3175 struct nes_adapter *nesadapter;
3176 struct ib_qp_attr attr;
3177 struct iw_cm_id *cm_id;
3178 struct iw_cm_event cm_event;
3179 struct nes_hw_qp_wqe *wqe;
3180 struct nes_v4_quad nes_quad;
3181 u32 crc_value;
3182 int ret;
3184 /* get all our handles */
3185 cm_node = event->cm_node;
3186 cm_id = cm_node->cm_id;
3187 nes_debug(NES_DBG_CM, "cm_event_connected - %p - cm_id = %p\n", cm_node, cm_id);
3188 nesqp = (struct nes_qp *)cm_id->provider_data;
3189 nesvnic = to_nesvnic(nesqp->ibqp.device);
3190 nesdev = nesvnic->nesdev;
3191 nesadapter = nesdev->nesadapter;
3193 if (nesqp->destroyed) {
3194 return;
3196 atomic_inc(&cm_connecteds);
3197 nes_debug(NES_DBG_CM, "QP%u attempting to connect to 0x%08X:0x%04X on"
3198 " local port 0x%04X. jiffies = %lu.\n",
3199 nesqp->hwqp.qp_id,
3200 ntohl(cm_id->remote_addr.sin_addr.s_addr),
3201 ntohs(cm_id->remote_addr.sin_port),
3202 ntohs(cm_id->local_addr.sin_port),
3203 jiffies);
3205 nes_cm_init_tsa_conn(nesqp, cm_node);
3207 /* set the QP tsa context */
3208 nesqp->nesqp_context->tcpPorts[0] =
3209 cpu_to_le16(ntohs(cm_id->local_addr.sin_port));
3210 nesqp->nesqp_context->tcpPorts[1] =
3211 cpu_to_le16(ntohs(cm_id->remote_addr.sin_port));
3212 if (ipv4_is_loopback(cm_id->remote_addr.sin_addr.s_addr))
3213 nesqp->nesqp_context->ip0 =
3214 cpu_to_le32(ntohl(nesvnic->local_ipaddr));
3215 else
3216 nesqp->nesqp_context->ip0 =
3217 cpu_to_le32(ntohl(cm_id->remote_addr.sin_addr.s_addr));
3219 nesqp->nesqp_context->misc2 |= cpu_to_le32(
3220 (u32)PCI_FUNC(nesdev->pcidev->devfn) <<
3221 NES_QPCONTEXT_MISC2_SRC_IP_SHIFT);
3222 nesqp->nesqp_context->arp_index_vlan |= cpu_to_le32(
3223 nes_arp_table(nesdev,
3224 le32_to_cpu(nesqp->nesqp_context->ip0),
3225 NULL, NES_ARP_RESOLVE) << 16);
3226 nesqp->nesqp_context->ts_val_delta = cpu_to_le32(
3227 jiffies - nes_read_indexed(nesdev, NES_IDX_TCP_NOW));
3228 nesqp->nesqp_context->ird_index = cpu_to_le32(nesqp->hwqp.qp_id);
3229 nesqp->nesqp_context->ird_ord_sizes |=
3230 cpu_to_le32((u32)1 <<
3231 NES_QPCONTEXT_ORDIRD_IWARP_MODE_SHIFT);
3233 /* Adjust tail for not having a LSMM */
3234 nesqp->hwqp.sq_tail = 1;
3236 #if defined(NES_SEND_FIRST_WRITE)
3237 if (cm_node->send_write0) {
3238 nes_debug(NES_DBG_CM, "Sending first write.\n");
3239 wqe = &nesqp->hwqp.sq_vbase[0];
3240 u64temp = (unsigned long)nesqp;
3241 u64temp |= NES_SW_CONTEXT_ALIGN>>1;
3242 set_wqe_64bit_value(wqe->wqe_words,
3243 NES_IWARP_SQ_WQE_COMP_CTX_LOW_IDX, u64temp);
3244 wqe->wqe_words[NES_IWARP_SQ_WQE_MISC_IDX] =
3245 cpu_to_le32(NES_IWARP_SQ_OP_RDMAW);
3246 wqe->wqe_words[NES_IWARP_SQ_WQE_TOTAL_PAYLOAD_IDX] = 0;
3247 wqe->wqe_words[NES_IWARP_SQ_WQE_FRAG0_LOW_IDX] = 0;
3248 wqe->wqe_words[NES_IWARP_SQ_WQE_FRAG0_HIGH_IDX] = 0;
3249 wqe->wqe_words[NES_IWARP_SQ_WQE_LENGTH0_IDX] = 0;
3250 wqe->wqe_words[NES_IWARP_SQ_WQE_STAG0_IDX] = 0;
3252 /* use the reserved spot on the WQ for the extra first WQE */
3253 nesqp->nesqp_context->ird_ord_sizes &=
3254 cpu_to_le32(~(NES_QPCONTEXT_ORDIRD_LSMM_PRESENT |
3255 NES_QPCONTEXT_ORDIRD_WRPDU |
3256 NES_QPCONTEXT_ORDIRD_ALSMM));
3257 nesqp->skip_lsmm = 1;
3258 nesqp->hwqp.sq_tail = 0;
3259 nes_write32(nesdev->regs + NES_WQE_ALLOC,
3260 (1 << 24) | 0x00800000 | nesqp->hwqp.qp_id);
3262 #endif
3264 memset(&nes_quad, 0, sizeof(nes_quad));
3266 nes_quad.DstIpAdrIndex =
3267 cpu_to_le32((u32)PCI_FUNC(nesdev->pcidev->devfn) << 24);
3268 if (ipv4_is_loopback(cm_id->remote_addr.sin_addr.s_addr))
3269 nes_quad.SrcIpadr = nesvnic->local_ipaddr;
3270 else
3271 nes_quad.SrcIpadr = cm_id->remote_addr.sin_addr.s_addr;
3272 nes_quad.TcpPorts[0] = cm_id->remote_addr.sin_port;
3273 nes_quad.TcpPorts[1] = cm_id->local_addr.sin_port;
3275 /* Produce hash key */
3276 crc_value = get_crc_value(&nes_quad);
3277 nesqp->hte_index = cpu_to_be32(crc_value ^ 0xffffffff);
3278 nes_debug(NES_DBG_CM, "HTE Index = 0x%08X, After CRC = 0x%08X\n",
3279 nesqp->hte_index, nesqp->hte_index & nesadapter->hte_index_mask);
3281 nesqp->hte_index &= nesadapter->hte_index_mask;
3282 nesqp->nesqp_context->hte_index = cpu_to_le32(nesqp->hte_index);
3284 nesqp->ietf_frame = &cm_node->mpa_frame;
3285 nesqp->private_data_len = (u8) cm_node->mpa_frame_size;
3286 cm_node->cm_core->api->accelerated(cm_node->cm_core, cm_node);
3288 /* notify OF layer we successfully created the requested connection */
3289 cm_event.event = IW_CM_EVENT_CONNECT_REPLY;
3290 cm_event.status = IW_CM_EVENT_STATUS_ACCEPTED;
3291 cm_event.provider_data = cm_id->provider_data;
3292 cm_event.local_addr.sin_family = AF_INET;
3293 cm_event.local_addr.sin_port = cm_id->local_addr.sin_port;
3294 cm_event.remote_addr = cm_id->remote_addr;
3296 cm_event.private_data = (void *)event->cm_node->mpa_frame_buf;
3297 cm_event.private_data_len = (u8) event->cm_node->mpa_frame_size;
3299 cm_event.local_addr.sin_addr.s_addr = event->cm_info.rem_addr;
3300 ret = cm_id->event_handler(cm_id, &cm_event);
3301 nes_debug(NES_DBG_CM, "OFA CM event_handler returned, ret=%d\n", ret);
3303 if (ret)
3304 printk(KERN_ERR "%s[%u] OFA CM event_handler returned, "
3305 "ret=%d\n", __func__, __LINE__, ret);
3306 attr.qp_state = IB_QPS_RTS;
3307 nes_modify_qp(&nesqp->ibqp, &attr, IB_QP_STATE, NULL);
3309 nes_debug(NES_DBG_CM, "Exiting connect thread for QP%u. jiffies = "
3310 "%lu\n", nesqp->hwqp.qp_id, jiffies);
3312 return;
3317 * cm_event_connect_error
3319 static void cm_event_connect_error(struct nes_cm_event *event)
3321 struct nes_qp *nesqp;
3322 struct iw_cm_id *cm_id;
3323 struct iw_cm_event cm_event;
3324 /* struct nes_cm_info cm_info; */
3325 int ret;
3327 if (!event->cm_node)
3328 return;
3330 cm_id = event->cm_node->cm_id;
3331 if (!cm_id) {
3332 return;
3335 nes_debug(NES_DBG_CM, "cm_node=%p, cm_id=%p\n", event->cm_node, cm_id);
3336 nesqp = cm_id->provider_data;
3338 if (!nesqp) {
3339 return;
3342 /* notify OF layer about this connection error event */
3343 /* cm_id->rem_ref(cm_id); */
3344 nesqp->cm_id = NULL;
3345 cm_id->provider_data = NULL;
3346 cm_event.event = IW_CM_EVENT_CONNECT_REPLY;
3347 cm_event.status = IW_CM_EVENT_STATUS_REJECTED;
3348 cm_event.provider_data = cm_id->provider_data;
3349 cm_event.local_addr = cm_id->local_addr;
3350 cm_event.remote_addr = cm_id->remote_addr;
3351 cm_event.private_data = NULL;
3352 cm_event.private_data_len = 0;
3354 nes_debug(NES_DBG_CM, "call CM_EVENT REJECTED, local_addr=%08x, "
3355 "remove_addr=%08x\n", cm_event.local_addr.sin_addr.s_addr,
3356 cm_event.remote_addr.sin_addr.s_addr);
3358 ret = cm_id->event_handler(cm_id, &cm_event);
3359 nes_debug(NES_DBG_CM, "OFA CM event_handler returned, ret=%d\n", ret);
3360 if (ret)
3361 printk(KERN_ERR "%s[%u] OFA CM event_handler returned, "
3362 "ret=%d\n", __func__, __LINE__, ret);
3363 cm_id->rem_ref(cm_id);
3365 rem_ref_cm_node(event->cm_node->cm_core, event->cm_node);
3366 return;
3371 * cm_event_reset
3373 static void cm_event_reset(struct nes_cm_event *event)
3375 struct nes_qp *nesqp;
3376 struct iw_cm_id *cm_id;
3377 struct iw_cm_event cm_event;
3378 /* struct nes_cm_info cm_info; */
3379 int ret;
3381 if (!event->cm_node)
3382 return;
3384 if (!event->cm_node->cm_id)
3385 return;
3387 cm_id = event->cm_node->cm_id;
3389 nes_debug(NES_DBG_CM, "%p - cm_id = %p\n", event->cm_node, cm_id);
3390 nesqp = cm_id->provider_data;
3392 nesqp->cm_id = NULL;
3393 /* cm_id->provider_data = NULL; */
3394 cm_event.event = IW_CM_EVENT_DISCONNECT;
3395 cm_event.status = IW_CM_EVENT_STATUS_RESET;
3396 cm_event.provider_data = cm_id->provider_data;
3397 cm_event.local_addr = cm_id->local_addr;
3398 cm_event.remote_addr = cm_id->remote_addr;
3399 cm_event.private_data = NULL;
3400 cm_event.private_data_len = 0;
3402 ret = cm_id->event_handler(cm_id, &cm_event);
3403 cm_id->add_ref(cm_id);
3404 atomic_inc(&cm_closes);
3405 cm_event.event = IW_CM_EVENT_CLOSE;
3406 cm_event.status = IW_CM_EVENT_STATUS_OK;
3407 cm_event.provider_data = cm_id->provider_data;
3408 cm_event.local_addr = cm_id->local_addr;
3409 cm_event.remote_addr = cm_id->remote_addr;
3410 cm_event.private_data = NULL;
3411 cm_event.private_data_len = 0;
3412 nes_debug(NES_DBG_CM, "NODE %p Generating CLOSE\n", event->cm_node);
3413 ret = cm_id->event_handler(cm_id, &cm_event);
3415 nes_debug(NES_DBG_CM, "OFA CM event_handler returned, ret=%d\n", ret);
3418 /* notify OF layer about this connection error event */
3419 cm_id->rem_ref(cm_id);
3421 return;
3426 * cm_event_mpa_req
3428 static void cm_event_mpa_req(struct nes_cm_event *event)
3430 struct iw_cm_id *cm_id;
3431 struct iw_cm_event cm_event;
3432 int ret;
3433 struct nes_cm_node *cm_node;
3435 cm_node = event->cm_node;
3436 if (!cm_node)
3437 return;
3438 cm_id = cm_node->cm_id;
3440 atomic_inc(&cm_connect_reqs);
3441 nes_debug(NES_DBG_CM, "cm_node = %p - cm_id = %p, jiffies = %lu\n",
3442 cm_node, cm_id, jiffies);
3444 cm_event.event = IW_CM_EVENT_CONNECT_REQUEST;
3445 cm_event.status = IW_CM_EVENT_STATUS_OK;
3446 cm_event.provider_data = (void *)cm_node;
3448 cm_event.local_addr.sin_family = AF_INET;
3449 cm_event.local_addr.sin_port = htons(event->cm_info.loc_port);
3450 cm_event.local_addr.sin_addr.s_addr = htonl(event->cm_info.loc_addr);
3452 cm_event.remote_addr.sin_family = AF_INET;
3453 cm_event.remote_addr.sin_port = htons(event->cm_info.rem_port);
3454 cm_event.remote_addr.sin_addr.s_addr = htonl(event->cm_info.rem_addr);
3455 cm_event.private_data = cm_node->mpa_frame_buf;
3456 cm_event.private_data_len = (u8) cm_node->mpa_frame_size;
3458 ret = cm_id->event_handler(cm_id, &cm_event);
3459 if (ret)
3460 printk(KERN_ERR "%s[%u] OFA CM event_handler returned, ret=%d\n",
3461 __func__, __LINE__, ret);
3462 return;
/**
 * cm_event_mpa_reject - report an MPA reject to the iWARP CM
 * @event: queued CM event; event->cm_info holds the connection 4-tuple
 *
 * Builds an IW_CM_EVENT_CONNECT_REPLY with status -ECONNREFUSED, carrying
 * the cm_id's provider_data and the node's mpa_frame_buf as private data,
 * and passes it to the event handler of the node's cm_id.  A non-zero
 * handler result is only logged.  Returns immediately when the event
 * carries no cm_node.
 */
static void cm_event_mpa_reject(struct nes_cm_event *event)
{
	struct nes_cm_node *node = event->cm_node;
	struct iw_cm_event reply;
	struct iw_cm_id *cm_id;
	int rc;

	if (!node)
		return;

	cm_id = node->cm_id;

	/*
	 * NOTE(review): this bumps the connect-request counter on a reject;
	 * possibly copied from cm_event_mpa_req() - confirm it is intended.
	 */
	atomic_inc(&cm_connect_reqs);
	nes_debug(NES_DBG_CM, "cm_node = %p - cm_id = %p, jiffies = %lu\n",
		  node, cm_id, jiffies);

	reply.event = IW_CM_EVENT_CONNECT_REPLY;
	reply.status = -ECONNREFUSED;
	reply.provider_data = cm_id->provider_data;

	/* addresses and ports in cm_info are converted with htonl()/htons() */
	reply.local_addr.sin_family = AF_INET;
	reply.local_addr.sin_port = htons(event->cm_info.loc_port);
	reply.local_addr.sin_addr.s_addr = htonl(event->cm_info.loc_addr);

	reply.remote_addr.sin_family = AF_INET;
	reply.remote_addr.sin_port = htons(event->cm_info.rem_port);
	reply.remote_addr.sin_addr.s_addr = htonl(event->cm_info.rem_addr);

	/* the length is explicitly narrowed to u8 */
	reply.private_data = node->mpa_frame_buf;
	reply.private_data_len = (u8) node->mpa_frame_size;

	nes_debug(NES_DBG_CM,
		  "call CM_EVENT_MPA_REJECTED, local_addr=%08x, remove_addr=%08x\n",
		  reply.local_addr.sin_addr.s_addr,
		  reply.remote_addr.sin_addr.s_addr);

	rc = cm_id->event_handler(cm_id, &reply);
	if (rc)
		printk(KERN_ERR "%s[%u] OFA CM event_handler returned, ret=%d\n",
		       __func__, __LINE__, rc);
}
3511 static void nes_cm_event_handler(struct work_struct *);
3514 * nes_cm_post_event
3515 * post an event to the cm event handler
3517 static int nes_cm_post_event(struct nes_cm_event *event)
3519 atomic_inc(&event->cm_node->cm_core->events_posted);
3520 add_ref_cm_node(event->cm_node);
3521 event->cm_info.cm_id->add_ref(event->cm_info.cm_id);
3522 INIT_WORK(&event->event_work, nes_cm_event_handler);
3523 nes_debug(NES_DBG_CM, "cm_node=%p queue_work, event=%p\n",
3524 event->cm_node, event);
3526 queue_work(event->cm_node->cm_core->event_wq, &event->event_work);
3528 nes_debug(NES_DBG_CM, "Exit\n");
3529 return 0;
3534 * nes_cm_event_handler
3535 * worker function to handle cm events
3536 * will free instance of nes_cm_event
3538 static void nes_cm_event_handler(struct work_struct *work)
3540 struct nes_cm_event *event = container_of(work, struct nes_cm_event,
3541 event_work);
3542 struct nes_cm_core *cm_core;
3544 if ((!event) || (!event->cm_node) || (!event->cm_node->cm_core))
3545 return;
3547 cm_core = event->cm_node->cm_core;
3548 nes_debug(NES_DBG_CM, "event=%p, event->type=%u, events posted=%u\n",
3549 event, event->type, atomic_read(&cm_core->events_posted));
3551 switch (event->type) {
3552 case NES_CM_EVENT_MPA_REQ:
3553 cm_event_mpa_req(event);
3554 nes_debug(NES_DBG_CM, "cm_node=%p CM Event: MPA REQUEST\n",
3555 event->cm_node);
3556 break;
3557 case NES_CM_EVENT_RESET:
3558 nes_debug(NES_DBG_CM, "cm_node = %p CM Event: RESET\n",
3559 event->cm_node);
3560 cm_event_reset(event);
3561 break;
3562 case NES_CM_EVENT_CONNECTED:
3563 if ((!event->cm_node->cm_id) ||
3564 (event->cm_node->state != NES_CM_STATE_TSA))
3565 break;
3566 cm_event_connected(event);
3567 nes_debug(NES_DBG_CM, "CM Event: CONNECTED\n");
3568 break;
3569 case NES_CM_EVENT_MPA_REJECT:
3570 if ((!event->cm_node->cm_id) ||
3571 (event->cm_node->state == NES_CM_STATE_TSA))
3572 break;
3573 cm_event_mpa_reject(event);
3574 nes_debug(NES_DBG_CM, "CM Event: REJECT\n");
3575 break;
3577 case NES_CM_EVENT_ABORTED:
3578 if ((!event->cm_node->cm_id) ||
3579 (event->cm_node->state == NES_CM_STATE_TSA))
3580 break;
3581 cm_event_connect_error(event);
3582 nes_debug(NES_DBG_CM, "CM Event: ABORTED\n");
3583 break;
3584 case NES_CM_EVENT_DROPPED_PKT:
3585 nes_debug(NES_DBG_CM, "CM Event: DROPPED PKT\n");
3586 break;
3587 default:
3588 nes_debug(NES_DBG_CM, "CM Event: UNKNOWN EVENT TYPE\n");
3589 break;
3592 atomic_dec(&cm_core->events_posted);
3593 event->cm_info.cm_id->rem_ref(event->cm_info.cm_id);
3594 rem_ref_cm_node(cm_core, event->cm_node);
3595 kfree(event);
3597 return;