Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/roland...
[pandora-kernel.git] / drivers / infiniband / hw / nes / nes_cm.c
1 /*
2  * Copyright (c) 2006 - 2009 Intel Corporation.  All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  *
32  */
33
34
35 #define TCPOPT_TIMESTAMP 8
36
37 #include <linux/atomic.h>
38 #include <linux/skbuff.h>
39 #include <linux/ip.h>
40 #include <linux/tcp.h>
41 #include <linux/init.h>
42 #include <linux/if_arp.h>
43 #include <linux/if_vlan.h>
44 #include <linux/notifier.h>
45 #include <linux/net.h>
46 #include <linux/types.h>
47 #include <linux/timer.h>
48 #include <linux/time.h>
49 #include <linux/delay.h>
50 #include <linux/etherdevice.h>
51 #include <linux/netdevice.h>
52 #include <linux/random.h>
53 #include <linux/list.h>
54 #include <linux/threads.h>
55 #include <linux/highmem.h>
56 #include <linux/slab.h>
57 #include <net/arp.h>
58 #include <net/neighbour.h>
59 #include <net/route.h>
60 #include <net/ip_fib.h>
61 #include <net/tcp.h>
62
63 #include "nes.h"
64
/*
 * Connection-manager statistics counters.
 *
 * These are non-static and therefore visible to other translation units.
 * Within the part of the file reviewed here, cm_packets_created is bumped
 * in form_cm_frame() and cm_packets_sent in schedule_nes_timer(); the
 * remaining counters are updated elsewhere.
 *
 * NOTE(review): the plain u32 counters are incremented without any
 * visible locking - presumably they are best-effort statistics; confirm.
 */
u32 cm_packets_sent;
u32 cm_packets_bounced;
u32 cm_packets_dropped;
u32 cm_packets_retrans;
u32 cm_packets_created;
u32 cm_packets_received;
atomic_t cm_listens_created;
atomic_t cm_listens_destroyed;
u32 cm_backlog_drops;
atomic_t cm_loopbacks;
atomic_t cm_nodes_created;
atomic_t cm_nodes_destroyed;
atomic_t cm_accel_dropped_pkts;
atomic_t cm_resets_recvd;
79
/*
 * Forward declarations for the file-local functions.
 *
 * The first group (mini_cm_*) is the set of entry points placed into the
 * nes_cm_api operations table further down in this file.
 */
static inline int mini_cm_accelerated(struct nes_cm_core *, struct nes_cm_node *);
static struct nes_cm_listener *mini_cm_listen(struct nes_cm_core *, struct nes_vnic *, struct nes_cm_info *);
static int mini_cm_del_listen(struct nes_cm_core *, struct nes_cm_listener *);
static struct nes_cm_node *mini_cm_connect(struct nes_cm_core *, struct nes_vnic *, u16, void *, struct nes_cm_info *);
static int mini_cm_close(struct nes_cm_core *, struct nes_cm_node *);
static int mini_cm_accept(struct nes_cm_core *, struct nes_cm_node *);
static int mini_cm_reject(struct nes_cm_core *, struct nes_cm_node *);
static int mini_cm_recv_pkt(struct nes_cm_core *, struct nes_vnic *, struct sk_buff *);
static int mini_cm_dealloc_core(struct nes_cm_core *);
static int mini_cm_get(struct nes_cm_core *);
static int mini_cm_set(struct nes_cm_core *, u32, u32);

/* frame construction and cm_node reference counting */
static void form_cm_frame(struct sk_buff *, struct nes_cm_node *, void *, u32, void *, u32, u8);
static int add_ref_cm_node(struct nes_cm_node *);
static int rem_ref_cm_node(struct nes_cm_core *, struct nes_cm_node *);

/* event posting and QP disconnect handling */
static int nes_cm_disconn_true(struct nes_qp *);
static int nes_cm_post_event(struct nes_cm_event *event);
static int nes_disconnect(struct nes_qp *nesqp, int abrupt);
static void nes_disconnect_worker(struct work_struct *work);

/* packet transmit helpers and receive-side packet processing */
static int send_mpa_request(struct nes_cm_node *, struct sk_buff *);
static int send_mpa_reject(struct nes_cm_node *);
static int send_syn(struct nes_cm_node *, u32, struct sk_buff *);
static int send_reset(struct nes_cm_node *, struct sk_buff *);
static int send_ack(struct nes_cm_node *cm_node, struct sk_buff *skb);
static int send_fin(struct nes_cm_node *cm_node, struct sk_buff *skb);
static void process_packet(struct nes_cm_node *, struct sk_buff *, struct nes_cm_core *);

/* error paths, retransmit-entry housekeeping and TCP option parsing */
static void active_open_err(struct nes_cm_node *, struct sk_buff *, int);
static void passive_open_err(struct nes_cm_node *, struct sk_buff *, int);
static void cleanup_retrans_entry(struct nes_cm_node *);
static void handle_rcv_mpa(struct nes_cm_node *, struct sk_buff *);
static void free_retrans_entry(struct nes_cm_node *cm_node);
static int handle_tcp_options(struct nes_cm_node *cm_node, struct tcphdr *tcph, struct sk_buff *skb, int optionsize, int passive);

/* CM event handler functions */
static void cm_event_connected(struct nes_cm_event *);
static void cm_event_connect_error(struct nes_cm_event *);
static void cm_event_reset(struct nes_cm_event *);
static void cm_event_mpa_req(struct nes_cm_event *);
static void cm_event_mpa_reject(struct nes_cm_event *);
static void handle_recv_entry(struct nes_cm_node *cm_node, u32 rem_node);

/* MPA build functions */
static int cm_build_mpa_frame(struct nes_cm_node *, u8 **, u16 *, u8 *, u8);
static void build_mpa_v2(struct nes_cm_node *, void *, u8);
static void build_mpa_v1(struct nes_cm_node *, void *, u8);
static void build_rdma0_msg(struct nes_cm_node *, struct nes_qp **);

/* debug dump of a CM core */
static void print_core(struct nes_cm_core *core);
131
/* External CM API Interface */
/* instance of function pointers for client API */
/* set address of this instance to cm_core->cm_ops at cm_core alloc */
/*
 * The initializers below are positional, so their order must match the
 * member order of struct nes_cm_ops (declared outside this file).
 */
static struct nes_cm_ops nes_cm_api = {
	mini_cm_accelerated,
	mini_cm_listen,
	mini_cm_del_listen,
	mini_cm_connect,
	mini_cm_close,
	mini_cm_accept,
	mini_cm_reject,
	mini_cm_recv_pkt,
	mini_cm_dealloc_core,
	mini_cm_get,
	mini_cm_set
};
148
/*
 * File-wide pointer to the CM core; nes_cm_timer_tick() reads it to find
 * the core whose connected nodes it has to scan.
 */
static struct nes_cm_core *g_cm_core;

/*
 * Connection-level statistics counters (non-static, so visible to other
 * translation units). They are updated outside the part of the file
 * reviewed here.
 */
atomic_t cm_connects;
atomic_t cm_accepts;
atomic_t cm_disconnects;
atomic_t cm_closes;
atomic_t cm_connecteds;
atomic_t cm_connect_reqs;
atomic_t cm_rejects;
158
/**
 * nes_add_ref_cm_node - non-static wrapper around add_ref_cm_node()
 * @cm_node: node to take a reference on
 *
 * Returns whatever add_ref_cm_node() returns.
 */
int nes_add_ref_cm_node(struct nes_cm_node *cm_node)
{
	int ret = add_ref_cm_node(cm_node);

	return ret;
}
163
164 int nes_rem_ref_cm_node(struct nes_cm_node *cm_node)
165 {
166         return rem_ref_cm_node(cm_node->cm_core, cm_node);
167 }
168
169 /**
170  * create_event
171  */
172 static struct nes_cm_event *create_event(struct nes_cm_node *   cm_node,
173                                          enum nes_cm_event_type type)
174 {
175         struct nes_cm_event *event;
176
177         if (!cm_node->cm_id)
178                 return NULL;
179
180         /* allocate an empty event */
181         event = kzalloc(sizeof(*event), GFP_ATOMIC);
182
183         if (!event)
184                 return NULL;
185
186         event->type = type;
187         event->cm_node = cm_node;
188         event->cm_info.rem_addr = cm_node->rem_addr;
189         event->cm_info.loc_addr = cm_node->loc_addr;
190         event->cm_info.rem_port = cm_node->rem_port;
191         event->cm_info.loc_port = cm_node->loc_port;
192         event->cm_info.cm_id = cm_node->cm_id;
193
194         nes_debug(NES_DBG_CM, "cm_node=%p Created event=%p, type=%u, "
195                   "dst_addr=%08x[%x], src_addr=%08x[%x]\n",
196                   cm_node, event, type, event->cm_info.loc_addr,
197                   event->cm_info.loc_port, event->cm_info.rem_addr,
198                   event->cm_info.rem_port);
199
200         nes_cm_post_event(event);
201         return event;
202 }
203
204
205 /**
206  * send_mpa_request
207  */
208 static int send_mpa_request(struct nes_cm_node *cm_node, struct sk_buff *skb)
209 {
210         u8 start_addr = 0;
211         u8 *start_ptr = &start_addr;
212         u8 **start_buff = &start_ptr;
213         u16 buff_len = 0;
214
215         if (!skb) {
216                 nes_debug(NES_DBG_CM, "skb set to NULL\n");
217                 return -1;
218         }
219
220         /* send an MPA Request frame */
221         cm_build_mpa_frame(cm_node, start_buff, &buff_len, NULL, MPA_KEY_REQUEST);
222         form_cm_frame(skb, cm_node, NULL, 0, *start_buff, buff_len, SET_ACK);
223
224         return schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
225 }
226
227
228
229 static int send_mpa_reject(struct nes_cm_node *cm_node)
230 {
231         struct sk_buff *skb = NULL;
232         u8 start_addr = 0;
233         u8 *start_ptr = &start_addr;
234         u8 **start_buff = &start_ptr;
235         u16 buff_len = 0;
236
237         skb = dev_alloc_skb(MAX_CM_BUFFER);
238         if (!skb) {
239                 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
240                 return -ENOMEM;
241         }
242
243         /* send an MPA reject frame */
244         cm_build_mpa_frame(cm_node, start_buff, &buff_len, NULL, MPA_KEY_REPLY);
245         form_cm_frame(skb, cm_node, NULL, 0, *start_buff, buff_len, SET_ACK | SET_FIN);
246
247         cm_node->state = NES_CM_STATE_FIN_WAIT1;
248         return schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
249 }
250
251
252 /**
253  * recv_mpa - process a received TCP pkt, we are expecting an
254  * IETF MPA frame
255  */
256 static int parse_mpa(struct nes_cm_node *cm_node, u8 *buffer, u32 *type,
257                      u32 len)
258 {
259         struct ietf_mpa_v1 *mpa_frame;
260         struct ietf_mpa_v2 *mpa_v2_frame;
261         struct ietf_rtr_msg *rtr_msg;
262         int mpa_hdr_len;
263         int priv_data_len;
264
265         *type = NES_MPA_REQUEST_ACCEPT;
266
267         /* assume req frame is in tcp data payload */
268         if (len < sizeof(struct ietf_mpa_v1)) {
269                 nes_debug(NES_DBG_CM, "The received ietf buffer was too small (%x)\n", len);
270                 return -EINVAL;
271         }
272
273         /* points to the beginning of the frame, which could be MPA V1 or V2 */
274         mpa_frame = (struct ietf_mpa_v1 *)buffer;
275         mpa_hdr_len = sizeof(struct ietf_mpa_v1);
276         priv_data_len = ntohs(mpa_frame->priv_data_len);
277
278         /* make sure mpa private data len is less than 512 bytes */
279         if (priv_data_len > IETF_MAX_PRIV_DATA_LEN) {
280                 nes_debug(NES_DBG_CM, "The received Length of Private"
281                           " Data field exceeds 512 octets\n");
282                 return -EINVAL;
283         }
284         /*
285          * make sure MPA receiver interoperate with the
286          * received MPA version and MPA key information
287          *
288          */
289         if (mpa_frame->rev != IETF_MPA_V1 && mpa_frame->rev != IETF_MPA_V2) {
290                 nes_debug(NES_DBG_CM, "The received mpa version"
291                           " is not supported\n");
292                 return -EINVAL;
293         }
294         /*
295         * backwards compatibility only
296         */
297         if (mpa_frame->rev > cm_node->mpa_frame_rev) {
298                 nes_debug(NES_DBG_CM, "The received mpa version"
299                         " can not be interoperated\n");
300                 return -EINVAL;
301         } else {
302                 cm_node->mpa_frame_rev = mpa_frame->rev;
303         }
304
305         if (cm_node->state != NES_CM_STATE_MPAREQ_SENT) {
306                 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE)) {
307                         nes_debug(NES_DBG_CM, "Unexpected MPA Key received \n");
308                         return -EINVAL;
309                 }
310         } else {
311                 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE)) {
312                         nes_debug(NES_DBG_CM, "Unexpected MPA Key received \n");
313                         return -EINVAL;
314                 }
315         }
316
317
318         if (priv_data_len + mpa_hdr_len != len) {
319                 nes_debug(NES_DBG_CM, "The received ietf buffer was not right"
320                         " complete (%x + %x != %x)\n",
321                         priv_data_len, mpa_hdr_len, len);
322                 return -EINVAL;
323         }
324         /* make sure it does not exceed the max size */
325         if (len > MAX_CM_BUFFER) {
326                 nes_debug(NES_DBG_CM, "The received ietf buffer was too large"
327                         " (%x + %x != %x)\n",
328                         priv_data_len, mpa_hdr_len, len);
329                 return -EINVAL;
330         }
331
332         cm_node->mpa_frame_size = priv_data_len;
333
334         switch (mpa_frame->rev) {
335         case IETF_MPA_V2: {
336                 u16 ird_size;
337                 u16 ord_size;
338                 mpa_v2_frame = (struct ietf_mpa_v2 *)buffer;
339                 mpa_hdr_len += IETF_RTR_MSG_SIZE;
340                 cm_node->mpa_frame_size -= IETF_RTR_MSG_SIZE;
341                 rtr_msg = &mpa_v2_frame->rtr_msg;
342
343                 /* parse rtr message */
344                 rtr_msg->ctrl_ird = ntohs(rtr_msg->ctrl_ird);
345                 rtr_msg->ctrl_ord = ntohs(rtr_msg->ctrl_ord);
346                 ird_size = rtr_msg->ctrl_ird & IETF_NO_IRD_ORD;
347                 ord_size = rtr_msg->ctrl_ord & IETF_NO_IRD_ORD;
348
349                 if (!(rtr_msg->ctrl_ird & IETF_PEER_TO_PEER)) {
350                         /* send reset */
351                         return -EINVAL;
352                 }
353
354                 if (cm_node->state != NES_CM_STATE_MPAREQ_SENT) {
355                         /* responder */
356                         if (cm_node->ord_size > ird_size)
357                                 cm_node->ord_size = ird_size;
358                 } else {
359                         /* initiator */
360                         if (cm_node->ord_size > ird_size)
361                                 cm_node->ord_size = ird_size;
362
363                         if (cm_node->ird_size < ord_size) {
364                                 /* no resources available */
365                                 /* send terminate message */
366                                 return -EINVAL;
367                         }
368                 }
369
370                 if (rtr_msg->ctrl_ord & IETF_RDMA0_READ) {
371                         cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
372                 } else if (rtr_msg->ctrl_ord & IETF_RDMA0_WRITE) {
373                         cm_node->send_rdma0_op = SEND_RDMA_WRITE_ZERO;
374                 } else {        /* Not supported RDMA0 operation */
375                         return -EINVAL;
376                 }
377                 break;
378         }
379         case IETF_MPA_V1:
380         default:
381                 break;
382         }
383
384         /* copy entire MPA frame to our cm_node's frame */
385         memcpy(cm_node->mpa_frame_buf, buffer + mpa_hdr_len, cm_node->mpa_frame_size);
386
387         if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
388                 *type = NES_MPA_REQUEST_REJECT;
389         return 0;
390 }
391
392
393 /**
394  * form_cm_frame - get a free packet and build empty frame Use
395  * node info to build.
396  */
397 static void form_cm_frame(struct sk_buff *skb,
398                           struct nes_cm_node *cm_node, void *options, u32 optionsize,
399                           void *data, u32 datasize, u8 flags)
400 {
401         struct tcphdr *tcph;
402         struct iphdr *iph;
403         struct ethhdr *ethh;
404         u8 *buf;
405         u16 packetsize = sizeof(*iph);
406
407         packetsize += sizeof(*tcph);
408         packetsize += optionsize + datasize;
409
410         skb_trim(skb, 0);
411         memset(skb->data, 0x00, ETH_HLEN + sizeof(*iph) + sizeof(*tcph));
412
413         buf = skb_put(skb, packetsize + ETH_HLEN);
414
415         ethh = (struct ethhdr *)buf;
416         buf += ETH_HLEN;
417
418         iph = (struct iphdr *)buf;
419         buf += sizeof(*iph);
420         tcph = (struct tcphdr *)buf;
421         skb_reset_mac_header(skb);
422         skb_set_network_header(skb, ETH_HLEN);
423         skb_set_transport_header(skb, ETH_HLEN + sizeof(*iph));
424         buf += sizeof(*tcph);
425
426         skb->ip_summed = CHECKSUM_PARTIAL;
427         skb->protocol = htons(0x800);
428         skb->data_len = 0;
429         skb->mac_len = ETH_HLEN;
430
431         memcpy(ethh->h_dest, cm_node->rem_mac, ETH_ALEN);
432         memcpy(ethh->h_source, cm_node->loc_mac, ETH_ALEN);
433         ethh->h_proto = htons(0x0800);
434
435         iph->version = IPVERSION;
436         iph->ihl = 5;           /* 5 * 4Byte words, IP headr len */
437         iph->tos = 0;
438         iph->tot_len = htons(packetsize);
439         iph->id = htons(++cm_node->tcp_cntxt.loc_id);
440
441         iph->frag_off = htons(0x4000);
442         iph->ttl = 0x40;
443         iph->protocol = 0x06;   /* IPPROTO_TCP */
444
445         iph->saddr = htonl(cm_node->loc_addr);
446         iph->daddr = htonl(cm_node->rem_addr);
447
448         tcph->source = htons(cm_node->loc_port);
449         tcph->dest = htons(cm_node->rem_port);
450         tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
451
452         if (flags & SET_ACK) {
453                 cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
454                 tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
455                 tcph->ack = 1;
456         } else {
457                 tcph->ack_seq = 0;
458         }
459
460         if (flags & SET_SYN) {
461                 cm_node->tcp_cntxt.loc_seq_num++;
462                 tcph->syn = 1;
463         } else {
464                 cm_node->tcp_cntxt.loc_seq_num += datasize;
465         }
466
467         if (flags & SET_FIN) {
468                 cm_node->tcp_cntxt.loc_seq_num++;
469                 tcph->fin = 1;
470         }
471
472         if (flags & SET_RST)
473                 tcph->rst = 1;
474
475         tcph->doff = (u16)((sizeof(*tcph) + optionsize + 3) >> 2);
476         tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
477         tcph->urg_ptr = 0;
478         if (optionsize)
479                 memcpy(buf, options, optionsize);
480         buf += optionsize;
481         if (datasize)
482                 memcpy(buf, data, datasize);
483
484         skb_shinfo(skb)->nr_frags = 0;
485         cm_packets_created++;
486 }
487
488 /**
489  * print_core - dump a cm core
490  */
491 static void print_core(struct nes_cm_core *core)
492 {
493         nes_debug(NES_DBG_CM, "---------------------------------------------\n");
494         nes_debug(NES_DBG_CM, "CM Core  -- (core = %p )\n", core);
495         if (!core)
496                 return;
497         nes_debug(NES_DBG_CM, "---------------------------------------------\n");
498
499         nes_debug(NES_DBG_CM, "State         : %u \n", core->state);
500
501         nes_debug(NES_DBG_CM, "Listen Nodes  : %u \n", atomic_read(&core->listen_node_cnt));
502         nes_debug(NES_DBG_CM, "Active Nodes  : %u \n", atomic_read(&core->node_cnt));
503
504         nes_debug(NES_DBG_CM, "core          : %p \n", core);
505
506         nes_debug(NES_DBG_CM, "-------------- end core ---------------\n");
507 }
508
509 /**
510  * cm_build_mpa_frame - build a MPA V1 frame or MPA V2 frame
511  */
512 static int cm_build_mpa_frame(struct nes_cm_node *cm_node, u8 **start_buff,
513                               u16 *buff_len, u8 *pci_mem, u8 mpa_key)
514 {
515         int ret = 0;
516
517         *start_buff = (pci_mem) ? pci_mem : &cm_node->mpa_frame_buf[0];
518
519         switch (cm_node->mpa_frame_rev) {
520         case IETF_MPA_V1:
521                 *start_buff = (u8 *)*start_buff + sizeof(struct ietf_rtr_msg);
522                 *buff_len = sizeof(struct ietf_mpa_v1) + cm_node->mpa_frame_size;
523                 build_mpa_v1(cm_node, *start_buff, mpa_key);
524                 break;
525         case IETF_MPA_V2:
526                 *buff_len = sizeof(struct ietf_mpa_v2) + cm_node->mpa_frame_size;
527                 build_mpa_v2(cm_node, *start_buff, mpa_key);
528                 break;
529         default:
530                 ret = -EINVAL;
531         }
532         return ret;
533 }
534
535 /**
536  * build_mpa_v2 - build a MPA V2 frame
537  */
538 static void build_mpa_v2(struct nes_cm_node *cm_node,
539                          void *start_addr, u8 mpa_key)
540 {
541         struct ietf_mpa_v2 *mpa_frame = (struct ietf_mpa_v2 *)start_addr;
542         struct ietf_rtr_msg *rtr_msg = &mpa_frame->rtr_msg;
543
544         /* initialize the upper 5 bytes of the frame */
545         build_mpa_v1(cm_node, start_addr, mpa_key);
546         mpa_frame->flags |= IETF_MPA_V2_FLAG; /* set a bit to indicate MPA V2 */
547         mpa_frame->priv_data_len += htons(IETF_RTR_MSG_SIZE);
548
549         /* initialize RTR msg */
550         rtr_msg->ctrl_ird = (cm_node->ird_size > IETF_NO_IRD_ORD) ?
551                             IETF_NO_IRD_ORD : cm_node->ird_size;
552         rtr_msg->ctrl_ord = (cm_node->ord_size > IETF_NO_IRD_ORD) ?
553                             IETF_NO_IRD_ORD : cm_node->ord_size;
554
555         rtr_msg->ctrl_ird |= IETF_PEER_TO_PEER;
556         rtr_msg->ctrl_ird |= IETF_FLPDU_ZERO_LEN;
557
558         switch (mpa_key) {
559         case MPA_KEY_REQUEST:
560                 rtr_msg->ctrl_ord |= IETF_RDMA0_WRITE;
561                 rtr_msg->ctrl_ord |= IETF_RDMA0_READ;
562                 break;
563         case MPA_KEY_REPLY:
564                 switch (cm_node->send_rdma0_op) {
565                 case SEND_RDMA_WRITE_ZERO:
566                         rtr_msg->ctrl_ord |= IETF_RDMA0_WRITE;
567                         break;
568                 case SEND_RDMA_READ_ZERO:
569                         rtr_msg->ctrl_ord |= IETF_RDMA0_READ;
570                         break;
571                 }
572         }
573         rtr_msg->ctrl_ird = htons(rtr_msg->ctrl_ird);
574         rtr_msg->ctrl_ord = htons(rtr_msg->ctrl_ord);
575 }
576
577 /**
578  * build_mpa_v1 - build a MPA V1 frame
579  */
580 static void build_mpa_v1(struct nes_cm_node *cm_node, void *start_addr, u8 mpa_key)
581 {
582         struct ietf_mpa_v1 *mpa_frame = (struct ietf_mpa_v1 *)start_addr;
583
584         switch (mpa_key) {
585         case MPA_KEY_REQUEST:
586                 memcpy(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE);
587                 break;
588         case MPA_KEY_REPLY:
589                 memcpy(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
590                 break;
591         }
592         mpa_frame->flags = IETF_MPA_FLAGS_CRC;
593         mpa_frame->rev = cm_node->mpa_frame_rev;
594         mpa_frame->priv_data_len = htons(cm_node->mpa_frame_size);
595 }
596
597 static void build_rdma0_msg(struct nes_cm_node *cm_node, struct nes_qp **nesqp_addr)
598 {
599         u64 u64temp;
600         struct nes_qp *nesqp = *nesqp_addr;
601         struct nes_hw_qp_wqe *wqe = &nesqp->hwqp.sq_vbase[0];
602
603         u64temp = (unsigned long)nesqp;
604         u64temp |= NES_SW_CONTEXT_ALIGN >> 1;
605         set_wqe_64bit_value(wqe->wqe_words, NES_IWARP_SQ_WQE_COMP_CTX_LOW_IDX, u64temp);
606
607         wqe->wqe_words[NES_IWARP_SQ_WQE_FRAG0_LOW_IDX] = 0;
608         wqe->wqe_words[NES_IWARP_SQ_WQE_FRAG0_HIGH_IDX] = 0;
609
610         switch (cm_node->send_rdma0_op) {
611         case SEND_RDMA_WRITE_ZERO:
612                 nes_debug(NES_DBG_CM, "Sending first write.\n");
613                 wqe->wqe_words[NES_IWARP_SQ_WQE_MISC_IDX] =
614                         cpu_to_le32(NES_IWARP_SQ_OP_RDMAW);
615                 wqe->wqe_words[NES_IWARP_SQ_WQE_TOTAL_PAYLOAD_IDX] = 0;
616                 wqe->wqe_words[NES_IWARP_SQ_WQE_LENGTH0_IDX] = 0;
617                 wqe->wqe_words[NES_IWARP_SQ_WQE_STAG0_IDX] = 0;
618                 break;
619
620         case SEND_RDMA_READ_ZERO:
621         default:
622                 if (cm_node->send_rdma0_op != SEND_RDMA_READ_ZERO) {
623                         printk(KERN_ERR "%s[%u]: Unsupported RDMA0 len operation=%u\n",
624                                  __func__, __LINE__, cm_node->send_rdma0_op);
625                         WARN_ON(1);
626                 }
627                 nes_debug(NES_DBG_CM, "Sending first rdma operation.\n");
628                 wqe->wqe_words[NES_IWARP_SQ_WQE_MISC_IDX] =
629                         cpu_to_le32(NES_IWARP_SQ_OP_RDMAR);
630                 wqe->wqe_words[NES_IWARP_SQ_WQE_RDMA_TO_LOW_IDX] = 1;
631                 wqe->wqe_words[NES_IWARP_SQ_WQE_RDMA_TO_HIGH_IDX] = 0;
632                 wqe->wqe_words[NES_IWARP_SQ_WQE_RDMA_LENGTH_IDX] = 0;
633                 wqe->wqe_words[NES_IWARP_SQ_WQE_RDMA_STAG_IDX] = 1;
634                 wqe->wqe_words[NES_IWARP_SQ_WQE_STAG0_IDX] = 1;
635                 break;
636         }
637
638         if (nesqp->sq_kmapped) {
639                 nesqp->sq_kmapped = 0;
640                 kunmap(nesqp->page);
641         }
642
643         /*use the reserved spot on the WQ for the extra first WQE*/
644         nesqp->nesqp_context->ird_ord_sizes &= cpu_to_le32(~(NES_QPCONTEXT_ORDIRD_LSMM_PRESENT |
645                                                              NES_QPCONTEXT_ORDIRD_WRPDU |
646                                                              NES_QPCONTEXT_ORDIRD_ALSMM));
647         nesqp->skip_lsmm = 1;
648         nesqp->hwqp.sq_tail = 0;
649 }
650
651 /**
652  * schedule_nes_timer
653  * note - cm_node needs to be protected before calling this. Encase in:
654  *                      rem_ref_cm_node(cm_core, cm_node);add_ref_cm_node(cm_node);
655  */
656 int schedule_nes_timer(struct nes_cm_node *cm_node, struct sk_buff *skb,
657                        enum nes_timer_type type, int send_retrans,
658                        int close_when_complete)
659 {
660         unsigned long flags;
661         struct nes_cm_core *cm_core = cm_node->cm_core;
662         struct nes_timer_entry *new_send;
663         int ret = 0;
664         u32 was_timer_set;
665
666         new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
667         if (!new_send)
668                 return -ENOMEM;
669
670         /* new_send->timetosend = currenttime */
671         new_send->retrycount = NES_DEFAULT_RETRYS;
672         new_send->retranscount = NES_DEFAULT_RETRANS;
673         new_send->skb = skb;
674         new_send->timetosend = jiffies;
675         new_send->type = type;
676         new_send->netdev = cm_node->netdev;
677         new_send->send_retrans = send_retrans;
678         new_send->close_when_complete = close_when_complete;
679
680         if (type == NES_TIMER_TYPE_CLOSE) {
681                 new_send->timetosend += (HZ / 10);
682                 if (cm_node->recv_entry) {
683                         kfree(new_send);
684                         WARN_ON(1);
685                         return -EINVAL;
686                 }
687                 cm_node->recv_entry = new_send;
688         }
689
690         if (type == NES_TIMER_TYPE_SEND) {
691                 new_send->seq_num = ntohl(tcp_hdr(skb)->seq);
692                 atomic_inc(&new_send->skb->users);
693                 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
694                 cm_node->send_entry = new_send;
695                 add_ref_cm_node(cm_node);
696                 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
697                 new_send->timetosend = jiffies + NES_RETRY_TIMEOUT;
698
699                 ret = nes_nic_cm_xmit(new_send->skb, cm_node->netdev);
700                 if (ret != NETDEV_TX_OK) {
701                         nes_debug(NES_DBG_CM, "Error sending packet %p "
702                                   "(jiffies = %lu)\n", new_send, jiffies);
703                         new_send->timetosend = jiffies;
704                         ret = NETDEV_TX_OK;
705                 } else {
706                         cm_packets_sent++;
707                         if (!send_retrans) {
708                                 cleanup_retrans_entry(cm_node);
709                                 if (close_when_complete)
710                                         rem_ref_cm_node(cm_core, cm_node);
711                                 return ret;
712                         }
713                 }
714         }
715
716         was_timer_set = timer_pending(&cm_core->tcp_timer);
717
718         if (!was_timer_set) {
719                 cm_core->tcp_timer.expires = new_send->timetosend;
720                 add_timer(&cm_core->tcp_timer);
721         }
722
723         return ret;
724 }
725
726 static void nes_retrans_expired(struct nes_cm_node *cm_node)
727 {
728         struct iw_cm_id *cm_id = cm_node->cm_id;
729         enum nes_cm_node_state state = cm_node->state;
730         cm_node->state = NES_CM_STATE_CLOSED;
731
732         switch (state) {
733         case NES_CM_STATE_SYN_RCVD:
734         case NES_CM_STATE_CLOSING:
735                 rem_ref_cm_node(cm_node->cm_core, cm_node);
736                 break;
737         case NES_CM_STATE_LAST_ACK:
738         case NES_CM_STATE_FIN_WAIT1:
739                 if (cm_node->cm_id)
740                         cm_id->rem_ref(cm_id);
741                 send_reset(cm_node, NULL);
742                 break;
743         default:
744                 add_ref_cm_node(cm_node);
745                 send_reset(cm_node, NULL);
746                 create_event(cm_node, NES_CM_EVENT_ABORTED);
747         }
748 }
749
750 static void handle_recv_entry(struct nes_cm_node *cm_node, u32 rem_node)
751 {
752         struct nes_timer_entry *recv_entry = cm_node->recv_entry;
753         struct iw_cm_id *cm_id = cm_node->cm_id;
754         struct nes_qp *nesqp;
755         unsigned long qplockflags;
756
757         if (!recv_entry)
758                 return;
759         nesqp = (struct nes_qp *)recv_entry->skb;
760         if (nesqp) {
761                 spin_lock_irqsave(&nesqp->lock, qplockflags);
762                 if (nesqp->cm_id) {
763                         nes_debug(NES_DBG_CM, "QP%u: cm_id = %p, "
764                                   "refcount = %d: HIT A "
765                                   "NES_TIMER_TYPE_CLOSE with something "
766                                   "to do!!!\n", nesqp->hwqp.qp_id, cm_id,
767                                   atomic_read(&nesqp->refcount));
768                         nesqp->hw_tcp_state = NES_AEQE_TCP_STATE_CLOSED;
769                         nesqp->last_aeq = NES_AEQE_AEID_RESET_SENT;
770                         nesqp->ibqp_state = IB_QPS_ERR;
771                         spin_unlock_irqrestore(&nesqp->lock, qplockflags);
772                         nes_cm_disconn(nesqp);
773                 } else {
774                         spin_unlock_irqrestore(&nesqp->lock, qplockflags);
775                         nes_debug(NES_DBG_CM, "QP%u: cm_id = %p, "
776                                   "refcount = %d: HIT A "
777                                   "NES_TIMER_TYPE_CLOSE with nothing "
778                                   "to do!!!\n", nesqp->hwqp.qp_id, cm_id,
779                                   atomic_read(&nesqp->refcount));
780                 }
781         } else if (rem_node) {
782                 /* TIME_WAIT state */
783                 rem_ref_cm_node(cm_node->cm_core, cm_node);
784         }
785         if (cm_node->cm_id)
786                 cm_id->rem_ref(cm_id);
787         kfree(recv_entry);
788         cm_node->recv_entry = NULL;
789 }
790
791 /**
792  * nes_cm_timer_tick
793  */
794 static void nes_cm_timer_tick(unsigned long pass)
795 {
796         unsigned long flags;
797         unsigned long nexttimeout = jiffies + NES_LONG_TIME;
798         struct nes_cm_node *cm_node;
799         struct nes_timer_entry *send_entry, *recv_entry;
800         struct list_head *list_core_temp;
801         struct list_head *list_node;
802         struct nes_cm_core *cm_core = g_cm_core;
803         u32 settimer = 0;
804         unsigned long timetosend;
805         int ret = NETDEV_TX_OK;
806
807         struct list_head timer_list;
808
809         INIT_LIST_HEAD(&timer_list);
810         spin_lock_irqsave(&cm_core->ht_lock, flags);
811
812         list_for_each_safe(list_node, list_core_temp,
813                            &cm_core->connected_nodes) {
814                 cm_node = container_of(list_node, struct nes_cm_node, list);
815                 if ((cm_node->recv_entry) || (cm_node->send_entry)) {
816                         add_ref_cm_node(cm_node);
817                         list_add(&cm_node->timer_entry, &timer_list);
818                 }
819         }
820         spin_unlock_irqrestore(&cm_core->ht_lock, flags);
821
822         list_for_each_safe(list_node, list_core_temp, &timer_list) {
823                 cm_node = container_of(list_node, struct nes_cm_node,
824                                        timer_entry);
825                 recv_entry = cm_node->recv_entry;
826
827                 if (recv_entry) {
828                         if (time_after(recv_entry->timetosend, jiffies)) {
829                                 if (nexttimeout > recv_entry->timetosend ||
830                                     !settimer) {
831                                         nexttimeout = recv_entry->timetosend;
832                                         settimer = 1;
833                                 }
834                         } else {
835                                 handle_recv_entry(cm_node, 1);
836                         }
837                 }
838
839                 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
840                 do {
841                         send_entry = cm_node->send_entry;
842                         if (!send_entry)
843                                 break;
844                         if (time_after(send_entry->timetosend, jiffies)) {
845                                 if (cm_node->state != NES_CM_STATE_TSA) {
846                                         if ((nexttimeout >
847                                              send_entry->timetosend) ||
848                                             !settimer) {
849                                                 nexttimeout =
850                                                         send_entry->timetosend;
851                                                 settimer = 1;
852                                         }
853                                 } else {
854                                         free_retrans_entry(cm_node);
855                                 }
856                                 break;
857                         }
858
859                         if ((cm_node->state == NES_CM_STATE_TSA) ||
860                             (cm_node->state == NES_CM_STATE_CLOSED)) {
861                                 free_retrans_entry(cm_node);
862                                 break;
863                         }
864
865                         if (!send_entry->retranscount ||
866                             !send_entry->retrycount) {
867                                 cm_packets_dropped++;
868                                 free_retrans_entry(cm_node);
869
870                                 spin_unlock_irqrestore(
871                                         &cm_node->retrans_list_lock, flags);
872                                 nes_retrans_expired(cm_node);
873                                 cm_node->state = NES_CM_STATE_CLOSED;
874                                 spin_lock_irqsave(&cm_node->retrans_list_lock,
875                                                   flags);
876                                 break;
877                         }
878                         atomic_inc(&send_entry->skb->users);
879                         cm_packets_retrans++;
880                         nes_debug(NES_DBG_CM, "Retransmitting send_entry %p "
881                                   "for node %p, jiffies = %lu, time to send = "
882                                   "%lu, retranscount = %u, send_entry->seq_num = "
883                                   "0x%08X, cm_node->tcp_cntxt.rem_ack_num = "
884                                   "0x%08X\n", send_entry, cm_node, jiffies,
885                                   send_entry->timetosend,
886                                   send_entry->retranscount,
887                                   send_entry->seq_num,
888                                   cm_node->tcp_cntxt.rem_ack_num);
889
890                         spin_unlock_irqrestore(&cm_node->retrans_list_lock,
891                                                flags);
892                         ret = nes_nic_cm_xmit(send_entry->skb, cm_node->netdev);
893                         spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
894                         if (ret != NETDEV_TX_OK) {
895                                 nes_debug(NES_DBG_CM, "rexmit failed for "
896                                           "node=%p\n", cm_node);
897                                 cm_packets_bounced++;
898                                 send_entry->retrycount--;
899                                 nexttimeout = jiffies + NES_SHORT_TIME;
900                                 settimer = 1;
901                                 break;
902                         } else {
903                                 cm_packets_sent++;
904                         }
905                         nes_debug(NES_DBG_CM, "Packet Sent: retrans count = "
906                                   "%u, retry count = %u.\n",
907                                   send_entry->retranscount,
908                                   send_entry->retrycount);
909                         if (send_entry->send_retrans) {
910                                 send_entry->retranscount--;
911                                 timetosend = (NES_RETRY_TIMEOUT <<
912                                               (NES_DEFAULT_RETRANS - send_entry->retranscount));
913
914                                 send_entry->timetosend = jiffies +
915                                                          min(timetosend, NES_MAX_TIMEOUT);
916                                 if (nexttimeout > send_entry->timetosend ||
917                                     !settimer) {
918                                         nexttimeout = send_entry->timetosend;
919                                         settimer = 1;
920                                 }
921                         } else {
922                                 int close_when_complete;
923                                 close_when_complete =
924                                         send_entry->close_when_complete;
925                                 nes_debug(NES_DBG_CM, "cm_node=%p state=%d\n",
926                                           cm_node, cm_node->state);
927                                 free_retrans_entry(cm_node);
928                                 if (close_when_complete)
929                                         rem_ref_cm_node(cm_node->cm_core,
930                                                         cm_node);
931                         }
932                 } while (0);
933
934                 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
935                 rem_ref_cm_node(cm_node->cm_core, cm_node);
936         }
937
938         if (settimer) {
939                 if (!timer_pending(&cm_core->tcp_timer)) {
940                         cm_core->tcp_timer.expires = nexttimeout;
941                         add_timer(&cm_core->tcp_timer);
942                 }
943         }
944 }
945
946
947 /**
948  * send_syn
949  */
950 static int send_syn(struct nes_cm_node *cm_node, u32 sendack,
951                     struct sk_buff *skb)
952 {
953         int ret;
954         int flags = SET_SYN;
955         char optionsbuffer[sizeof(struct option_mss) +
956                            sizeof(struct option_windowscale) + sizeof(struct option_base) +
957                            TCP_OPTIONS_PADDING];
958
959         int optionssize = 0;
960         /* Sending MSS option */
961         union all_known_options *options;
962
963         if (!cm_node)
964                 return -EINVAL;
965
966         options = (union all_known_options *)&optionsbuffer[optionssize];
967         options->as_mss.optionnum = OPTION_NUMBER_MSS;
968         options->as_mss.length = sizeof(struct option_mss);
969         options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
970         optionssize += sizeof(struct option_mss);
971
972         options = (union all_known_options *)&optionsbuffer[optionssize];
973         options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
974         options->as_windowscale.length = sizeof(struct option_windowscale);
975         options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
976         optionssize += sizeof(struct option_windowscale);
977
978         if (sendack && !(NES_DRV_OPT_SUPRESS_OPTION_BC & nes_drv_opt)) {
979                 options = (union all_known_options *)&optionsbuffer[optionssize];
980                 options->as_base.optionnum = OPTION_NUMBER_WRITE0;
981                 options->as_base.length = sizeof(struct option_base);
982                 optionssize += sizeof(struct option_base);
983                 /* we need the size to be a multiple of 4 */
984                 options = (union all_known_options *)&optionsbuffer[optionssize];
985                 options->as_end = 1;
986                 optionssize += 1;
987                 options = (union all_known_options *)&optionsbuffer[optionssize];
988                 options->as_end = 1;
989                 optionssize += 1;
990         }
991
992         options = (union all_known_options *)&optionsbuffer[optionssize];
993         options->as_end = OPTION_NUMBER_END;
994         optionssize += 1;
995
996         if (!skb)
997                 skb = dev_alloc_skb(MAX_CM_BUFFER);
998         if (!skb) {
999                 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
1000                 return -1;
1001         }
1002
1003         if (sendack)
1004                 flags |= SET_ACK;
1005
1006         form_cm_frame(skb, cm_node, optionsbuffer, optionssize, NULL, 0, flags);
1007         ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
1008
1009         return ret;
1010 }
1011
1012
1013 /**
1014  * send_reset
1015  */
1016 static int send_reset(struct nes_cm_node *cm_node, struct sk_buff *skb)
1017 {
1018         int ret;
1019         int flags = SET_RST | SET_ACK;
1020
1021         if (!skb)
1022                 skb = dev_alloc_skb(MAX_CM_BUFFER);
1023         if (!skb) {
1024                 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
1025                 return -ENOMEM;
1026         }
1027
1028         form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, flags);
1029         ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 0, 1);
1030
1031         return ret;
1032 }
1033
1034
1035 /**
1036  * send_ack
1037  */
1038 static int send_ack(struct nes_cm_node *cm_node, struct sk_buff *skb)
1039 {
1040         int ret;
1041
1042         if (!skb)
1043                 skb = dev_alloc_skb(MAX_CM_BUFFER);
1044
1045         if (!skb) {
1046                 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
1047                 return -1;
1048         }
1049
1050         form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, SET_ACK);
1051         ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 0, 0);
1052
1053         return ret;
1054 }
1055
1056
1057 /**
1058  * send_fin
1059  */
1060 static int send_fin(struct nes_cm_node *cm_node, struct sk_buff *skb)
1061 {
1062         int ret;
1063
1064         /* if we didn't get a frame get one */
1065         if (!skb)
1066                 skb = dev_alloc_skb(MAX_CM_BUFFER);
1067
1068         if (!skb) {
1069                 nes_debug(NES_DBG_CM, "Failed to get a Free pkt\n");
1070                 return -1;
1071         }
1072
1073         form_cm_frame(skb, cm_node, NULL, 0, NULL, 0, SET_ACK | SET_FIN);
1074         ret = schedule_nes_timer(cm_node, skb, NES_TIMER_TYPE_SEND, 1, 0);
1075
1076         return ret;
1077 }
1078
1079
1080 /**
1081  * find_node - find a cm node that matches the reference cm node
1082  */
1083 static struct nes_cm_node *find_node(struct nes_cm_core *cm_core,
1084                                      u16 rem_port, nes_addr_t rem_addr, u16 loc_port, nes_addr_t loc_addr)
1085 {
1086         unsigned long flags;
1087         struct list_head *hte;
1088         struct nes_cm_node *cm_node;
1089
1090         /* get a handle on the hte */
1091         hte = &cm_core->connected_nodes;
1092
1093         /* walk list and find cm_node associated with this session ID */
1094         spin_lock_irqsave(&cm_core->ht_lock, flags);
1095         list_for_each_entry(cm_node, hte, list) {
1096                 /* compare quad, return node handle if a match */
1097                 nes_debug(NES_DBG_CM, "finding node %x:%x =? %x:%x ^ %x:%x =? %x:%x\n",
1098                           cm_node->loc_addr, cm_node->loc_port,
1099                           loc_addr, loc_port,
1100                           cm_node->rem_addr, cm_node->rem_port,
1101                           rem_addr, rem_port);
1102                 if ((cm_node->loc_addr == loc_addr) && (cm_node->loc_port == loc_port) &&
1103                     (cm_node->rem_addr == rem_addr) && (cm_node->rem_port == rem_port)) {
1104                         add_ref_cm_node(cm_node);
1105                         spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1106                         return cm_node;
1107                 }
1108         }
1109         spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1110
1111         /* no owner node */
1112         return NULL;
1113 }
1114
1115
1116 /**
1117  * find_listener - find a cm node listening on this addr-port pair
1118  */
1119 static struct nes_cm_listener *find_listener(struct nes_cm_core *cm_core,
1120                                              nes_addr_t dst_addr, u16 dst_port, enum nes_cm_listener_state listener_state)
1121 {
1122         unsigned long flags;
1123         struct nes_cm_listener *listen_node;
1124
1125         /* walk list and find cm_node associated with this session ID */
1126         spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1127         list_for_each_entry(listen_node, &cm_core->listen_list.list, list) {
1128                 /* compare node pair, return node handle if a match */
1129                 if (((listen_node->loc_addr == dst_addr) ||
1130                      listen_node->loc_addr == 0x00000000) &&
1131                     (listen_node->loc_port == dst_port) &&
1132                     (listener_state & listen_node->listener_state)) {
1133                         atomic_inc(&listen_node->ref_count);
1134                         spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1135                         return listen_node;
1136                 }
1137         }
1138         spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1139
1140         /* no listener */
1141         return NULL;
1142 }
1143
1144
1145 /**
1146  * add_hte_node - add a cm node to the hash table
1147  */
1148 static int add_hte_node(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
1149 {
1150         unsigned long flags;
1151         struct list_head *hte;
1152
1153         if (!cm_node || !cm_core)
1154                 return -EINVAL;
1155
1156         nes_debug(NES_DBG_CM, "Adding Node %p to Active Connection HT\n",
1157                   cm_node);
1158
1159         spin_lock_irqsave(&cm_core->ht_lock, flags);
1160
1161         /* get a handle on the hash table element (list head for this slot) */
1162         hte = &cm_core->connected_nodes;
1163         list_add_tail(&cm_node->list, hte);
1164         atomic_inc(&cm_core->ht_node_cnt);
1165
1166         spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1167
1168         return 0;
1169 }
1170
1171
1172 /**
1173  * mini_cm_dec_refcnt_listen
1174  */
1175 static int mini_cm_dec_refcnt_listen(struct nes_cm_core *cm_core,
1176                                      struct nes_cm_listener *listener, int free_hanging_nodes)
1177 {
1178         int ret = -EINVAL;
1179         int err = 0;
1180         unsigned long flags;
1181         struct list_head *list_pos = NULL;
1182         struct list_head *list_temp = NULL;
1183         struct nes_cm_node *cm_node = NULL;
1184         struct list_head reset_list;
1185
1186         nes_debug(NES_DBG_CM, "attempting listener= %p free_nodes= %d, "
1187                   "refcnt=%d\n", listener, free_hanging_nodes,
1188                   atomic_read(&listener->ref_count));
1189         /* free non-accelerated child nodes for this listener */
1190         INIT_LIST_HEAD(&reset_list);
1191         if (free_hanging_nodes) {
1192                 spin_lock_irqsave(&cm_core->ht_lock, flags);
1193                 list_for_each_safe(list_pos, list_temp,
1194                                    &g_cm_core->connected_nodes) {
1195                         cm_node = container_of(list_pos, struct nes_cm_node,
1196                                                list);
1197                         if ((cm_node->listener == listener) &&
1198                             (!cm_node->accelerated)) {
1199                                 add_ref_cm_node(cm_node);
1200                                 list_add(&cm_node->reset_entry, &reset_list);
1201                         }
1202                 }
1203                 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1204         }
1205
1206         list_for_each_safe(list_pos, list_temp, &reset_list) {
1207                 cm_node = container_of(list_pos, struct nes_cm_node,
1208                                        reset_entry);
1209                 {
1210                         struct nes_cm_node *loopback = cm_node->loopbackpartner;
1211                         enum nes_cm_node_state old_state;
1212                         if (NES_CM_STATE_FIN_WAIT1 <= cm_node->state) {
1213                                 rem_ref_cm_node(cm_node->cm_core, cm_node);
1214                         } else {
1215                                 if (!loopback) {
1216                                         cleanup_retrans_entry(cm_node);
1217                                         err = send_reset(cm_node, NULL);
1218                                         if (err) {
1219                                                 cm_node->state =
1220                                                         NES_CM_STATE_CLOSED;
1221                                                 WARN_ON(1);
1222                                         } else {
1223                                                 old_state = cm_node->state;
1224                                                 cm_node->state = NES_CM_STATE_LISTENER_DESTROYED;
1225                                                 if (old_state != NES_CM_STATE_MPAREQ_RCVD)
1226                                                         rem_ref_cm_node(
1227                                                                 cm_node->cm_core,
1228                                                                 cm_node);
1229                                         }
1230                                 } else {
1231                                         struct nes_cm_event event;
1232
1233                                         event.cm_node = loopback;
1234                                         event.cm_info.rem_addr =
1235                                                         loopback->rem_addr;
1236                                         event.cm_info.loc_addr =
1237                                                         loopback->loc_addr;
1238                                         event.cm_info.rem_port =
1239                                                         loopback->rem_port;
1240                                         event.cm_info.loc_port =
1241                                                          loopback->loc_port;
1242                                         event.cm_info.cm_id = loopback->cm_id;
1243                                         add_ref_cm_node(loopback);
1244                                         loopback->state = NES_CM_STATE_CLOSED;
1245                                         cm_event_connect_error(&event);
1246                                         cm_node->state = NES_CM_STATE_LISTENER_DESTROYED;
1247
1248                                         rem_ref_cm_node(cm_node->cm_core,
1249                                                          cm_node);
1250
1251                                 }
1252                         }
1253                 }
1254         }
1255
1256         spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1257         if (!atomic_dec_return(&listener->ref_count)) {
1258                 list_del(&listener->list);
1259
1260                 /* decrement our listen node count */
1261                 atomic_dec(&cm_core->listen_node_cnt);
1262
1263                 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1264
1265                 if (listener->nesvnic)
1266                         nes_manage_apbvt(listener->nesvnic, listener->loc_port,
1267                                          PCI_FUNC(listener->nesvnic->nesdev->pcidev->devfn), NES_MANAGE_APBVT_DEL);
1268
1269                 nes_debug(NES_DBG_CM, "destroying listener (%p)\n", listener);
1270
1271                 kfree(listener);
1272                 listener = NULL;
1273                 ret = 0;
1274                 atomic_inc(&cm_listens_destroyed);
1275         } else {
1276                 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1277         }
1278         if (listener) {
1279                 if (atomic_read(&listener->pend_accepts_cnt) > 0)
1280                         nes_debug(NES_DBG_CM, "destroying listener (%p)"
1281                                   " with non-zero pending accepts=%u\n",
1282                                   listener, atomic_read(&listener->pend_accepts_cnt));
1283         }
1284
1285         return ret;
1286 }
1287
1288
1289 /**
1290  * mini_cm_del_listen
1291  */
1292 static int mini_cm_del_listen(struct nes_cm_core *cm_core,
1293                               struct nes_cm_listener *listener)
1294 {
1295         listener->listener_state = NES_CM_LISTENER_PASSIVE_STATE;
1296         listener->cm_id = NULL; /* going to be destroyed pretty soon */
1297         return mini_cm_dec_refcnt_listen(cm_core, listener, 1);
1298 }
1299
1300
1301 /**
1302  * mini_cm_accelerated
1303  */
1304 static inline int mini_cm_accelerated(struct nes_cm_core *cm_core,
1305                                       struct nes_cm_node *cm_node)
1306 {
1307         u32 was_timer_set;
1308
1309         cm_node->accelerated = 1;
1310
1311         if (cm_node->accept_pend) {
1312                 BUG_ON(!cm_node->listener);
1313                 atomic_dec(&cm_node->listener->pend_accepts_cnt);
1314                 cm_node->accept_pend = 0;
1315                 BUG_ON(atomic_read(&cm_node->listener->pend_accepts_cnt) < 0);
1316         }
1317
1318         was_timer_set = timer_pending(&cm_core->tcp_timer);
1319         if (!was_timer_set) {
1320                 cm_core->tcp_timer.expires = jiffies + NES_SHORT_TIME;
1321                 add_timer(&cm_core->tcp_timer);
1322         }
1323
1324         return 0;
1325 }
1326
1327
1328 /**
1329  * nes_addr_resolve_neigh
1330  */
1331 static int nes_addr_resolve_neigh(struct nes_vnic *nesvnic, u32 dst_ip, int arpindex)
1332 {
1333         struct rtable *rt;
1334         struct neighbour *neigh;
1335         int rc = arpindex;
1336         struct net_device *netdev;
1337         struct nes_adapter *nesadapter = nesvnic->nesdev->nesadapter;
1338
1339         rt = ip_route_output(&init_net, htonl(dst_ip), 0, 0, 0);
1340         if (IS_ERR(rt)) {
1341                 printk(KERN_ERR "%s: ip_route_output_key failed for 0x%08X\n",
1342                        __func__, dst_ip);
1343                 return rc;
1344         }
1345
1346         if (netif_is_bond_slave(nesvnic->netdev))
1347                 netdev = nesvnic->netdev->master;
1348         else
1349                 netdev = nesvnic->netdev;
1350
1351         neigh = neigh_lookup(&arp_tbl, &rt->rt_gateway, netdev);
1352         if (neigh) {
1353                 if (neigh->nud_state & NUD_VALID) {
1354                         nes_debug(NES_DBG_CM, "Neighbor MAC address for 0x%08X"
1355                                   " is %pM, Gateway is 0x%08X \n", dst_ip,
1356                                   neigh->ha, ntohl(rt->rt_gateway));
1357
1358                         if (arpindex >= 0) {
1359                                 if (!memcmp(nesadapter->arp_table[arpindex].mac_addr,
1360                                             neigh->ha, ETH_ALEN)) {
1361                                         /* Mac address same as in nes_arp_table */
1362                                         neigh_release(neigh);
1363                                         ip_rt_put(rt);
1364                                         return rc;
1365                                 }
1366
1367                                 nes_manage_arp_cache(nesvnic->netdev,
1368                                                      nesadapter->arp_table[arpindex].mac_addr,
1369                                                      dst_ip, NES_ARP_DELETE);
1370                         }
1371
1372                         nes_manage_arp_cache(nesvnic->netdev, neigh->ha,
1373                                              dst_ip, NES_ARP_ADD);
1374                         rc = nes_arp_table(nesvnic->nesdev, dst_ip, NULL,
1375                                            NES_ARP_RESOLVE);
1376                 }
1377                 neigh_release(neigh);
1378         }
1379
1380         if ((neigh == NULL) || (!(neigh->nud_state & NUD_VALID))) {
1381                 rcu_read_lock();
1382                 neigh_event_send(dst_get_neighbour(&rt->dst), NULL);
1383                 rcu_read_unlock();
1384         }
1385         ip_rt_put(rt);
1386         return rc;
1387 }
1388
1389 /**
1390  * make_cm_node - create a new instance of a cm node
1391  */
1392 static struct nes_cm_node *make_cm_node(struct nes_cm_core *cm_core,
1393                                         struct nes_vnic *nesvnic, struct nes_cm_info *cm_info,
1394                                         struct nes_cm_listener *listener)
1395 {
1396         struct nes_cm_node *cm_node;
1397         struct timespec ts;
1398         int oldarpindex = 0;
1399         int arpindex = 0;
1400         struct nes_device *nesdev;
1401         struct nes_adapter *nesadapter;
1402
1403         /* create an hte and cm_node for this instance */
1404         cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
1405         if (!cm_node)
1406                 return NULL;
1407
1408         /* set our node specific transport info */
1409         cm_node->loc_addr = cm_info->loc_addr;
1410         cm_node->rem_addr = cm_info->rem_addr;
1411         cm_node->loc_port = cm_info->loc_port;
1412         cm_node->rem_port = cm_info->rem_port;
1413
1414         cm_node->mpa_frame_rev = mpa_version;
1415         cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
1416         cm_node->ird_size = IETF_NO_IRD_ORD;
1417         cm_node->ord_size = IETF_NO_IRD_ORD;
1418
1419         nes_debug(NES_DBG_CM, "Make node addresses : loc = %pI4:%x, rem = %pI4:%x\n",
1420                   &cm_node->loc_addr, cm_node->loc_port,
1421                   &cm_node->rem_addr, cm_node->rem_port);
1422         cm_node->listener = listener;
1423         cm_node->netdev = nesvnic->netdev;
1424         cm_node->cm_id = cm_info->cm_id;
1425         memcpy(cm_node->loc_mac, nesvnic->netdev->dev_addr, ETH_ALEN);
1426
1427         nes_debug(NES_DBG_CM, "listener=%p, cm_id=%p\n", cm_node->listener,
1428                   cm_node->cm_id);
1429
1430         spin_lock_init(&cm_node->retrans_list_lock);
1431
1432         cm_node->loopbackpartner = NULL;
1433         atomic_set(&cm_node->ref_count, 1);
1434         /* associate our parent CM core */
1435         cm_node->cm_core = cm_core;
1436         cm_node->tcp_cntxt.loc_id = NES_CM_DEF_LOCAL_ID;
1437         cm_node->tcp_cntxt.rcv_wscale = NES_CM_DEFAULT_RCV_WND_SCALE;
1438         cm_node->tcp_cntxt.rcv_wnd = NES_CM_DEFAULT_RCV_WND_SCALED >>
1439                                      NES_CM_DEFAULT_RCV_WND_SCALE;
1440         ts = current_kernel_time();
1441         cm_node->tcp_cntxt.loc_seq_num = htonl(ts.tv_nsec);
1442         cm_node->tcp_cntxt.mss = nesvnic->max_frame_size - sizeof(struct iphdr) -
1443                                  sizeof(struct tcphdr) - ETH_HLEN - VLAN_HLEN;
1444         cm_node->tcp_cntxt.rcv_nxt = 0;
1445         /* get a unique session ID , add thread_id to an upcounter to handle race */
1446         atomic_inc(&cm_core->node_cnt);
1447         cm_node->conn_type = cm_info->conn_type;
1448         cm_node->apbvt_set = 0;
1449         cm_node->accept_pend = 0;
1450
1451         cm_node->nesvnic = nesvnic;
1452         /* get some device handles, for arp lookup */
1453         nesdev = nesvnic->nesdev;
1454         nesadapter = nesdev->nesadapter;
1455
1456         cm_node->loopbackpartner = NULL;
1457
1458         /* get the mac addr for the remote node */
1459         if (ipv4_is_loopback(htonl(cm_node->rem_addr))) {
1460                 arpindex = nes_arp_table(nesdev, ntohl(nesvnic->local_ipaddr), NULL, NES_ARP_RESOLVE);
1461         } else {
1462                 oldarpindex = nes_arp_table(nesdev, cm_node->rem_addr, NULL, NES_ARP_RESOLVE);
1463                 arpindex = nes_addr_resolve_neigh(nesvnic, cm_info->rem_addr, oldarpindex);
1464         }
1465         if (arpindex < 0) {
1466                 kfree(cm_node);
1467                 return NULL;
1468         }
1469
1470         /* copy the mac addr to node context */
1471         memcpy(cm_node->rem_mac, nesadapter->arp_table[arpindex].mac_addr, ETH_ALEN);
1472         nes_debug(NES_DBG_CM, "Remote mac addr from arp table: %pM\n",
1473                   cm_node->rem_mac);
1474
1475         add_hte_node(cm_core, cm_node);
1476         atomic_inc(&cm_nodes_created);
1477
1478         return cm_node;
1479 }
1480
1481
1482 /**
1483  * add_ref_cm_node - destroy an instance of a cm node
1484  */
1485 static int add_ref_cm_node(struct nes_cm_node *cm_node)
1486 {
1487         atomic_inc(&cm_node->ref_count);
1488         return 0;
1489 }
1490
1491
1492 /**
1493  * rem_ref_cm_node - destroy an instance of a cm node
1494  */
1495 static int rem_ref_cm_node(struct nes_cm_core *cm_core,
1496                            struct nes_cm_node *cm_node)
1497 {
1498         unsigned long flags;
1499         struct nes_qp *nesqp;
1500
1501         if (!cm_node)
1502                 return -EINVAL;
1503
1504         spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
1505         if (atomic_dec_return(&cm_node->ref_count)) {
1506                 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
1507                 return 0;
1508         }
1509         list_del(&cm_node->list);
1510         atomic_dec(&cm_core->ht_node_cnt);
1511         spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
1512
1513         /* if the node is destroyed before connection was accelerated */
1514         if (!cm_node->accelerated && cm_node->accept_pend) {
1515                 BUG_ON(!cm_node->listener);
1516                 atomic_dec(&cm_node->listener->pend_accepts_cnt);
1517                 BUG_ON(atomic_read(&cm_node->listener->pend_accepts_cnt) < 0);
1518         }
1519         WARN_ON(cm_node->send_entry);
1520         if (cm_node->recv_entry)
1521                 handle_recv_entry(cm_node, 0);
1522         if (cm_node->listener) {
1523                 mini_cm_dec_refcnt_listen(cm_core, cm_node->listener, 0);
1524         } else {
1525                 if (cm_node->apbvt_set && cm_node->nesvnic) {
1526                         nes_manage_apbvt(cm_node->nesvnic, cm_node->loc_port,
1527                                          PCI_FUNC(
1528                                                  cm_node->nesvnic->nesdev->pcidev->devfn),
1529                                          NES_MANAGE_APBVT_DEL);
1530                 }
1531         }
1532
1533         atomic_dec(&cm_core->node_cnt);
1534         atomic_inc(&cm_nodes_destroyed);
1535         nesqp = cm_node->nesqp;
1536         if (nesqp) {
1537                 nesqp->cm_node = NULL;
1538                 nes_rem_ref(&nesqp->ibqp);
1539                 cm_node->nesqp = NULL;
1540         }
1541
1542         kfree(cm_node);
1543         return 0;
1544 }
1545
1546 /**
1547  * process_options
1548  */
1549 static int process_options(struct nes_cm_node *cm_node, u8 *optionsloc,
1550                            u32 optionsize, u32 syn_packet)
1551 {
1552         u32 tmp;
1553         u32 offset = 0;
1554         union all_known_options *all_options;
1555         char got_mss_option = 0;
1556
1557         while (offset < optionsize) {
1558                 all_options = (union all_known_options *)(optionsloc + offset);
1559                 switch (all_options->as_base.optionnum) {
1560                 case OPTION_NUMBER_END:
1561                         offset = optionsize;
1562                         break;
1563                 case OPTION_NUMBER_NONE:
1564                         offset += 1;
1565                         continue;
1566                 case OPTION_NUMBER_MSS:
1567                         nes_debug(NES_DBG_CM, "%s: MSS Length: %d Offset: %d "
1568                                   "Size: %d\n", __func__,
1569                                   all_options->as_mss.length, offset, optionsize);
1570                         got_mss_option = 1;
1571                         if (all_options->as_mss.length != 4) {
1572                                 return 1;
1573                         } else {
1574                                 tmp = ntohs(all_options->as_mss.mss);
1575                                 if (tmp > 0 && tmp <
1576                                     cm_node->tcp_cntxt.mss)
1577                                         cm_node->tcp_cntxt.mss = tmp;
1578                         }
1579                         break;
1580                 case OPTION_NUMBER_WINDOW_SCALE:
1581                         cm_node->tcp_cntxt.snd_wscale =
1582                                 all_options->as_windowscale.shiftcount;
1583                         break;
1584                 default:
1585                         nes_debug(NES_DBG_CM, "TCP Option not understood: %x\n",
1586                                   all_options->as_base.optionnum);
1587                         break;
1588                 }
1589                 offset += all_options->as_base.length;
1590         }
1591         if ((!got_mss_option) && (syn_packet))
1592                 cm_node->tcp_cntxt.mss = NES_CM_DEFAULT_MSS;
1593         return 0;
1594 }
1595
1596 static void drop_packet(struct sk_buff *skb)
1597 {
1598         atomic_inc(&cm_accel_dropped_pkts);
1599         dev_kfree_skb_any(skb);
1600 }
1601
1602 static void handle_fin_pkt(struct nes_cm_node *cm_node)
1603 {
1604         nes_debug(NES_DBG_CM, "Received FIN, cm_node = %p, state = %u. "
1605                   "refcnt=%d\n", cm_node, cm_node->state,
1606                   atomic_read(&cm_node->ref_count));
1607         switch (cm_node->state) {
1608         case NES_CM_STATE_SYN_RCVD:
1609         case NES_CM_STATE_SYN_SENT:
1610         case NES_CM_STATE_ESTABLISHED:
1611         case NES_CM_STATE_MPAREJ_RCVD:
1612                 cm_node->tcp_cntxt.rcv_nxt++;
1613                 cleanup_retrans_entry(cm_node);
1614                 cm_node->state = NES_CM_STATE_LAST_ACK;
1615                 send_fin(cm_node, NULL);
1616                 break;
1617         case NES_CM_STATE_MPAREQ_SENT:
1618                 create_event(cm_node, NES_CM_EVENT_ABORTED);
1619                 cm_node->tcp_cntxt.rcv_nxt++;
1620                 cleanup_retrans_entry(cm_node);
1621                 cm_node->state = NES_CM_STATE_CLOSED;
1622                 add_ref_cm_node(cm_node);
1623                 send_reset(cm_node, NULL);
1624                 break;
1625         case NES_CM_STATE_FIN_WAIT1:
1626                 cm_node->tcp_cntxt.rcv_nxt++;
1627                 cleanup_retrans_entry(cm_node);
1628                 cm_node->state = NES_CM_STATE_CLOSING;
1629                 send_ack(cm_node, NULL);
1630                 /* Wait for ACK as this is simultaneous close..
1631                 * After we receive ACK, do not send anything..
1632                 * Just rm the node.. Done.. */
1633                 break;
1634         case NES_CM_STATE_FIN_WAIT2:
1635                 cm_node->tcp_cntxt.rcv_nxt++;
1636                 cleanup_retrans_entry(cm_node);
1637                 cm_node->state = NES_CM_STATE_TIME_WAIT;
1638                 send_ack(cm_node, NULL);
1639                 schedule_nes_timer(cm_node, NULL,  NES_TIMER_TYPE_CLOSE, 1, 0);
1640                 break;
1641         case NES_CM_STATE_TIME_WAIT:
1642                 cm_node->tcp_cntxt.rcv_nxt++;
1643                 cleanup_retrans_entry(cm_node);
1644                 cm_node->state = NES_CM_STATE_CLOSED;
1645                 rem_ref_cm_node(cm_node->cm_core, cm_node);
1646                 break;
1647         case NES_CM_STATE_TSA:
1648         default:
1649                 nes_debug(NES_DBG_CM, "Error Rcvd FIN for node-%p state = %d\n",
1650                         cm_node, cm_node->state);
1651                 break;
1652         }
1653 }
1654
1655
1656 static void handle_rst_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1657         struct tcphdr *tcph)
1658 {
1659
1660         int     reset = 0;      /* whether to send reset in case of err.. */
1661         atomic_inc(&cm_resets_recvd);
1662         nes_debug(NES_DBG_CM, "Received Reset, cm_node = %p, state = %u."
1663                         " refcnt=%d\n", cm_node, cm_node->state,
1664                         atomic_read(&cm_node->ref_count));
1665         cleanup_retrans_entry(cm_node);
1666         switch (cm_node->state) {
1667         case NES_CM_STATE_SYN_SENT:
1668         case NES_CM_STATE_MPAREQ_SENT:
1669                 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1670                         "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1671                         cm_node->listener, cm_node->state);
1672                 switch (cm_node->mpa_frame_rev) {
1673                 case IETF_MPA_V2:
1674                         cm_node->mpa_frame_rev = IETF_MPA_V1;
1675                         /* send a syn and goto syn sent state */
1676                         cm_node->state = NES_CM_STATE_SYN_SENT;
1677                         if (send_syn(cm_node, 0, NULL)) {
1678                                 active_open_err(cm_node, skb, reset);
1679                         }
1680                         break;
1681                 case IETF_MPA_V1:
1682                 default:
1683                         active_open_err(cm_node, skb, reset);
1684                         break;
1685                 }
1686                 break;
1687         case NES_CM_STATE_MPAREQ_RCVD:
1688                 atomic_inc(&cm_node->passive_state);
1689                 dev_kfree_skb_any(skb);
1690                 break;
1691         case NES_CM_STATE_ESTABLISHED:
1692         case NES_CM_STATE_SYN_RCVD:
1693         case NES_CM_STATE_LISTENING:
1694                 nes_debug(NES_DBG_CM, "Bad state %s[%u]\n", __func__, __LINE__);
1695                 passive_open_err(cm_node, skb, reset);
1696                 break;
1697         case NES_CM_STATE_TSA:
1698                 active_open_err(cm_node, skb, reset);
1699                 break;
1700         case NES_CM_STATE_CLOSED:
1701                 drop_packet(skb);
1702                 break;
1703         case NES_CM_STATE_FIN_WAIT2:
1704         case NES_CM_STATE_FIN_WAIT1:
1705         case NES_CM_STATE_LAST_ACK:
1706                 cm_node->cm_id->rem_ref(cm_node->cm_id);
1707         case NES_CM_STATE_TIME_WAIT:
1708                 cm_node->state = NES_CM_STATE_CLOSED;
1709                 rem_ref_cm_node(cm_node->cm_core, cm_node);
1710                 drop_packet(skb);
1711                 break;
1712         default:
1713                 drop_packet(skb);
1714                 break;
1715         }
1716 }
1717
1718
1719 static void handle_rcv_mpa(struct nes_cm_node *cm_node, struct sk_buff *skb)
1720 {
1721         int ret = 0;
1722         int datasize = skb->len;
1723         u8 *dataloc = skb->data;
1724
1725         enum nes_cm_event_type type = NES_CM_EVENT_UNKNOWN;
1726         u32 res_type;
1727
1728         ret = parse_mpa(cm_node, dataloc, &res_type, datasize);
1729         if (ret) {
1730                 nes_debug(NES_DBG_CM, "didn't like MPA Request\n");
1731                 if (cm_node->state == NES_CM_STATE_MPAREQ_SENT) {
1732                         nes_debug(NES_DBG_CM, "%s[%u] create abort for "
1733                                   "cm_node=%p listener=%p state=%d\n", __func__,
1734                                   __LINE__, cm_node, cm_node->listener,
1735                                   cm_node->state);
1736                         active_open_err(cm_node, skb, 1);
1737                 } else {
1738                         passive_open_err(cm_node, skb, 1);
1739                 }
1740                 return;
1741         }
1742
1743         switch (cm_node->state) {
1744         case NES_CM_STATE_ESTABLISHED:
1745                 if (res_type == NES_MPA_REQUEST_REJECT)
1746                         /*BIG problem as we are receiving the MPA.. So should
1747                          * not be REJECT.. This is Passive Open.. We can
1748                          * only receive it Reject for Active Open...*/
1749                         WARN_ON(1);
1750                 cm_node->state = NES_CM_STATE_MPAREQ_RCVD;
1751                 type = NES_CM_EVENT_MPA_REQ;
1752                 atomic_set(&cm_node->passive_state,
1753                            NES_PASSIVE_STATE_INDICATED);
1754                 break;
1755         case NES_CM_STATE_MPAREQ_SENT:
1756                 cleanup_retrans_entry(cm_node);
1757                 if (res_type == NES_MPA_REQUEST_REJECT) {
1758                         type = NES_CM_EVENT_MPA_REJECT;
1759                         cm_node->state = NES_CM_STATE_MPAREJ_RCVD;
1760                 } else {
1761                         type = NES_CM_EVENT_CONNECTED;
1762                         cm_node->state = NES_CM_STATE_TSA;
1763                 }
1764
1765                 break;
1766         default:
1767                 WARN_ON(1);
1768                 break;
1769         }
1770         dev_kfree_skb_any(skb);
1771         create_event(cm_node, type);
1772 }
1773
1774 static void indicate_pkt_err(struct nes_cm_node *cm_node, struct sk_buff *skb)
1775 {
1776         switch (cm_node->state) {
1777         case NES_CM_STATE_SYN_SENT:
1778         case NES_CM_STATE_MPAREQ_SENT:
1779                 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1780                           "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1781                           cm_node->listener, cm_node->state);
1782                 active_open_err(cm_node, skb, 1);
1783                 break;
1784         case NES_CM_STATE_ESTABLISHED:
1785         case NES_CM_STATE_SYN_RCVD:
1786                 passive_open_err(cm_node, skb, 1);
1787                 break;
1788         case NES_CM_STATE_TSA:
1789         default:
1790                 drop_packet(skb);
1791         }
1792 }
1793
1794 static int check_syn(struct nes_cm_node *cm_node, struct tcphdr *tcph,
1795                      struct sk_buff *skb)
1796 {
1797         int err;
1798
1799         err = ((ntohl(tcph->ack_seq) == cm_node->tcp_cntxt.loc_seq_num)) ? 0 : 1;
1800         if (err)
1801                 active_open_err(cm_node, skb, 1);
1802
1803         return err;
1804 }
1805
1806 static int check_seq(struct nes_cm_node *cm_node, struct tcphdr *tcph,
1807                      struct sk_buff *skb)
1808 {
1809         int err = 0;
1810         u32 seq;
1811         u32 ack_seq;
1812         u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
1813         u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
1814         u32 rcv_wnd;
1815
1816         seq = ntohl(tcph->seq);
1817         ack_seq = ntohl(tcph->ack_seq);
1818         rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
1819         if (ack_seq != loc_seq_num)
1820                 err = 1;
1821         else if (!between(seq, rcv_nxt, (rcv_nxt + rcv_wnd)))
1822                 err = 1;
1823         if (err) {
1824                 nes_debug(NES_DBG_CM, "%s[%u] create abort for cm_node=%p "
1825                           "listener=%p state=%d\n", __func__, __LINE__, cm_node,
1826                           cm_node->listener, cm_node->state);
1827                 indicate_pkt_err(cm_node, skb);
1828                 nes_debug(NES_DBG_CM, "seq ERROR cm_node =%p seq=0x%08X "
1829                           "rcv_nxt=0x%08X rcv_wnd=0x%x\n", cm_node, seq, rcv_nxt,
1830                           rcv_wnd);
1831         }
1832         return err;
1833 }
1834
1835 /*
1836  * handle_syn_pkt() is for Passive node. The syn packet is received when a node
1837  * is created with a listener or it may comein as rexmitted packet which in
1838  * that case will be just dropped.
1839  */
1840 static void handle_syn_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1841                            struct tcphdr *tcph)
1842 {
1843         int ret;
1844         u32 inc_sequence;
1845         int optionsize;
1846
1847         optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1848         skb_trim(skb, 0);
1849         inc_sequence = ntohl(tcph->seq);
1850
1851         switch (cm_node->state) {
1852         case NES_CM_STATE_SYN_SENT:
1853         case NES_CM_STATE_MPAREQ_SENT:
1854                 /* Rcvd syn on active open connection*/
1855                 active_open_err(cm_node, skb, 1);
1856                 break;
1857         case NES_CM_STATE_LISTENING:
1858                 /* Passive OPEN */
1859                 if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
1860                     cm_node->listener->backlog) {
1861                         nes_debug(NES_DBG_CM, "drop syn due to backlog "
1862                                   "pressure \n");
1863                         cm_backlog_drops++;
1864                         passive_open_err(cm_node, skb, 0);
1865                         break;
1866                 }
1867                 ret = handle_tcp_options(cm_node, tcph, skb, optionsize,
1868                                          1);
1869                 if (ret) {
1870                         passive_open_err(cm_node, skb, 0);
1871                         /* drop pkt */
1872                         break;
1873                 }
1874                 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
1875                 BUG_ON(cm_node->send_entry);
1876                 cm_node->accept_pend = 1;
1877                 atomic_inc(&cm_node->listener->pend_accepts_cnt);
1878
1879                 cm_node->state = NES_CM_STATE_SYN_RCVD;
1880                 send_syn(cm_node, 1, skb);
1881                 break;
1882         case NES_CM_STATE_CLOSED:
1883                 cleanup_retrans_entry(cm_node);
1884                 add_ref_cm_node(cm_node);
1885                 send_reset(cm_node, skb);
1886                 break;
1887         case NES_CM_STATE_TSA:
1888         case NES_CM_STATE_ESTABLISHED:
1889         case NES_CM_STATE_FIN_WAIT1:
1890         case NES_CM_STATE_FIN_WAIT2:
1891         case NES_CM_STATE_MPAREQ_RCVD:
1892         case NES_CM_STATE_LAST_ACK:
1893         case NES_CM_STATE_CLOSING:
1894         case NES_CM_STATE_UNKNOWN:
1895         default:
1896                 drop_packet(skb);
1897                 break;
1898         }
1899 }
1900
1901 static void handle_synack_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1902                               struct tcphdr *tcph)
1903 {
1904         int ret;
1905         u32 inc_sequence;
1906         int optionsize;
1907
1908         optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1909         skb_trim(skb, 0);
1910         inc_sequence = ntohl(tcph->seq);
1911         switch (cm_node->state) {
1912         case NES_CM_STATE_SYN_SENT:
1913                 cleanup_retrans_entry(cm_node);
1914                 /* active open */
1915                 if (check_syn(cm_node, tcph, skb))
1916                         return;
1917                 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
1918                 /* setup options */
1919                 ret = handle_tcp_options(cm_node, tcph, skb, optionsize, 0);
1920                 if (ret) {
1921                         nes_debug(NES_DBG_CM, "cm_node=%p tcp_options failed\n",
1922                                   cm_node);
1923                         break;
1924                 }
1925                 cleanup_retrans_entry(cm_node);
1926                 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
1927                 send_mpa_request(cm_node, skb);
1928                 cm_node->state = NES_CM_STATE_MPAREQ_SENT;
1929                 break;
1930         case NES_CM_STATE_MPAREQ_RCVD:
1931                 /* passive open, so should not be here */
1932                 passive_open_err(cm_node, skb, 1);
1933                 break;
1934         case NES_CM_STATE_LISTENING:
1935                 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
1936                 cleanup_retrans_entry(cm_node);
1937                 cm_node->state = NES_CM_STATE_CLOSED;
1938                 send_reset(cm_node, skb);
1939                 break;
1940         case NES_CM_STATE_CLOSED:
1941                 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
1942                 cleanup_retrans_entry(cm_node);
1943                 add_ref_cm_node(cm_node);
1944                 send_reset(cm_node, skb);
1945                 break;
1946         case NES_CM_STATE_ESTABLISHED:
1947         case NES_CM_STATE_FIN_WAIT1:
1948         case NES_CM_STATE_FIN_WAIT2:
1949         case NES_CM_STATE_LAST_ACK:
1950         case NES_CM_STATE_TSA:
1951         case NES_CM_STATE_CLOSING:
1952         case NES_CM_STATE_UNKNOWN:
1953         case NES_CM_STATE_MPAREQ_SENT:
1954         default:
1955                 drop_packet(skb);
1956                 break;
1957         }
1958 }
1959
1960 static int handle_ack_pkt(struct nes_cm_node *cm_node, struct sk_buff *skb,
1961                           struct tcphdr *tcph)
1962 {
1963         int datasize = 0;
1964         u32 inc_sequence;
1965         int ret = 0;
1966         int optionsize;
1967
1968         optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
1969
1970         if (check_seq(cm_node, tcph, skb))
1971                 return -EINVAL;
1972
1973         skb_pull(skb, tcph->doff << 2);
1974         inc_sequence = ntohl(tcph->seq);
1975         datasize = skb->len;
1976         switch (cm_node->state) {
1977         case NES_CM_STATE_SYN_RCVD:
1978                 /* Passive OPEN */
1979                 cleanup_retrans_entry(cm_node);
1980                 ret = handle_tcp_options(cm_node, tcph, skb, optionsize, 1);
1981                 if (ret)
1982                         break;
1983                 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
1984                 cm_node->state = NES_CM_STATE_ESTABLISHED;
1985                 if (datasize) {
1986                         cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
1987                         handle_rcv_mpa(cm_node, skb);
1988                 } else { /* rcvd ACK only */
1989                         dev_kfree_skb_any(skb);
1990                 }
1991                 break;
1992         case NES_CM_STATE_ESTABLISHED:
1993                 /* Passive OPEN */
1994                 cleanup_retrans_entry(cm_node);
1995                 if (datasize) {
1996                         cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
1997                         handle_rcv_mpa(cm_node, skb);
1998                 } else {
1999                         drop_packet(skb);
2000                 }
2001                 break;
2002         case NES_CM_STATE_MPAREQ_SENT:
2003                 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2004                 if (datasize) {
2005                         cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2006                         handle_rcv_mpa(cm_node, skb);
2007                 } else { /* Could be just an ack pkt.. */
2008                         dev_kfree_skb_any(skb);
2009                 }
2010                 break;
2011         case NES_CM_STATE_LISTENING:
2012                 cleanup_retrans_entry(cm_node);
2013                 cm_node->state = NES_CM_STATE_CLOSED;
2014                 send_reset(cm_node, skb);
2015                 break;
2016         case NES_CM_STATE_CLOSED:
2017                 cleanup_retrans_entry(cm_node);
2018                 add_ref_cm_node(cm_node);
2019                 send_reset(cm_node, skb);
2020                 break;
2021         case NES_CM_STATE_LAST_ACK:
2022         case NES_CM_STATE_CLOSING:
2023                 cleanup_retrans_entry(cm_node);
2024                 cm_node->state = NES_CM_STATE_CLOSED;
2025                 cm_node->cm_id->rem_ref(cm_node->cm_id);
2026                 rem_ref_cm_node(cm_node->cm_core, cm_node);
2027                 drop_packet(skb);
2028                 break;
2029         case NES_CM_STATE_FIN_WAIT1:
2030                 cleanup_retrans_entry(cm_node);
2031                 drop_packet(skb);
2032                 cm_node->state = NES_CM_STATE_FIN_WAIT2;
2033                 break;
2034         case NES_CM_STATE_SYN_SENT:
2035         case NES_CM_STATE_FIN_WAIT2:
2036         case NES_CM_STATE_TSA:
2037         case NES_CM_STATE_MPAREQ_RCVD:
2038         case NES_CM_STATE_UNKNOWN:
2039         default:
2040                 cleanup_retrans_entry(cm_node);
2041                 drop_packet(skb);
2042                 break;
2043         }
2044         return ret;
2045 }
2046
2047
2048
2049 static int handle_tcp_options(struct nes_cm_node *cm_node, struct tcphdr *tcph,
2050                               struct sk_buff *skb, int optionsize, int passive)
2051 {
2052         u8 *optionsloc = (u8 *)&tcph[1];
2053
2054         if (optionsize) {
2055                 if (process_options(cm_node, optionsloc, optionsize,
2056                                     (u32)tcph->syn)) {
2057                         nes_debug(NES_DBG_CM, "%s: Node %p, Sending RESET\n",
2058                                   __func__, cm_node);
2059                         if (passive)
2060                                 passive_open_err(cm_node, skb, 1);
2061                         else
2062                                 active_open_err(cm_node, skb, 1);
2063                         return 1;
2064                 }
2065         }
2066
2067         cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
2068                                      cm_node->tcp_cntxt.snd_wscale;
2069
2070         if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
2071                 cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
2072         return 0;
2073 }
2074
2075 /*
2076  * active_open_err() will send reset() if flag set..
2077  * It will also send ABORT event.
2078  */
2079 static void active_open_err(struct nes_cm_node *cm_node, struct sk_buff *skb,
2080                             int reset)
2081 {
2082         cleanup_retrans_entry(cm_node);
2083         if (reset) {
2084                 nes_debug(NES_DBG_CM, "ERROR active err called for cm_node=%p, "
2085                           "state=%d\n", cm_node, cm_node->state);
2086                 add_ref_cm_node(cm_node);
2087                 send_reset(cm_node, skb);
2088         } else {
2089                 dev_kfree_skb_any(skb);
2090         }
2091
2092         cm_node->state = NES_CM_STATE_CLOSED;
2093         create_event(cm_node, NES_CM_EVENT_ABORTED);
2094 }
2095
2096 /*
2097  * passive_open_err() will either do a reset() or will free up the skb and
2098  * remove the cm_node.
2099  */
2100 static void passive_open_err(struct nes_cm_node *cm_node, struct sk_buff *skb,
2101                              int reset)
2102 {
2103         cleanup_retrans_entry(cm_node);
2104         cm_node->state = NES_CM_STATE_CLOSED;
2105         if (reset) {
2106                 nes_debug(NES_DBG_CM, "passive_open_err sending RST for "
2107                           "cm_node=%p state =%d\n", cm_node, cm_node->state);
2108                 send_reset(cm_node, skb);
2109         } else {
2110                 dev_kfree_skb_any(skb);
2111                 rem_ref_cm_node(cm_node->cm_core, cm_node);
2112         }
2113 }
2114
2115 /*
2116  * free_retrans_entry() routines assumes that the retrans_list_lock has
2117  * been acquired before calling.
2118  */
2119 static void free_retrans_entry(struct nes_cm_node *cm_node)
2120 {
2121         struct nes_timer_entry *send_entry;
2122
2123         send_entry = cm_node->send_entry;
2124         if (send_entry) {
2125                 cm_node->send_entry = NULL;
2126                 dev_kfree_skb_any(send_entry->skb);
2127                 kfree(send_entry);
2128                 rem_ref_cm_node(cm_node->cm_core, cm_node);
2129         }
2130 }
2131
2132 static void cleanup_retrans_entry(struct nes_cm_node *cm_node)
2133 {
2134         unsigned long flags;
2135
2136         spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
2137         free_retrans_entry(cm_node);
2138         spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
2139 }
2140
2141 /**
2142  * process_packet
2143  * Returns skb if to be freed, else it will return NULL if already used..
2144  */
2145 static void process_packet(struct nes_cm_node *cm_node, struct sk_buff *skb,
2146                            struct nes_cm_core *cm_core)
2147 {
2148         enum nes_tcpip_pkt_type pkt_type = NES_PKT_TYPE_UNKNOWN;
2149         struct tcphdr *tcph = tcp_hdr(skb);
2150         u32 fin_set = 0;
2151         int ret = 0;
2152
2153         skb_pull(skb, ip_hdr(skb)->ihl << 2);
2154
2155         nes_debug(NES_DBG_CM, "process_packet: cm_node=%p state =%d syn=%d "
2156                   "ack=%d rst=%d fin=%d\n", cm_node, cm_node->state, tcph->syn,
2157                   tcph->ack, tcph->rst, tcph->fin);
2158
2159         if (tcph->rst) {
2160                 pkt_type = NES_PKT_TYPE_RST;
2161         } else if (tcph->syn) {
2162                 pkt_type = NES_PKT_TYPE_SYN;
2163                 if (tcph->ack)
2164                         pkt_type = NES_PKT_TYPE_SYNACK;
2165         } else if (tcph->ack) {
2166                 pkt_type = NES_PKT_TYPE_ACK;
2167         }
2168         if (tcph->fin)
2169                 fin_set = 1;
2170
2171         switch (pkt_type) {
2172         case NES_PKT_TYPE_SYN:
2173                 handle_syn_pkt(cm_node, skb, tcph);
2174                 break;
2175         case NES_PKT_TYPE_SYNACK:
2176                 handle_synack_pkt(cm_node, skb, tcph);
2177                 break;
2178         case NES_PKT_TYPE_ACK:
2179                 ret = handle_ack_pkt(cm_node, skb, tcph);
2180                 if (fin_set && !ret)
2181                         handle_fin_pkt(cm_node);
2182                 break;
2183         case NES_PKT_TYPE_RST:
2184                 handle_rst_pkt(cm_node, skb, tcph);
2185                 break;
2186         default:
2187                 if ((fin_set) && (!check_seq(cm_node, tcph, skb)))
2188                         handle_fin_pkt(cm_node);
2189                 drop_packet(skb);
2190                 break;
2191         }
2192 }
2193
2194 /**
2195  * mini_cm_listen - create a listen node with params
2196  */
2197 static struct nes_cm_listener *mini_cm_listen(struct nes_cm_core *cm_core,
2198                                               struct nes_vnic *nesvnic, struct nes_cm_info *cm_info)
2199 {
2200         struct nes_cm_listener *listener;
2201         unsigned long flags;
2202
2203         nes_debug(NES_DBG_CM, "Search for 0x%08x : 0x%04x\n",
2204                   cm_info->loc_addr, cm_info->loc_port);
2205
2206         /* cannot have multiple matching listeners */
2207         listener = find_listener(cm_core, htonl(cm_info->loc_addr),
2208                                  htons(cm_info->loc_port), NES_CM_LISTENER_EITHER_STATE);
2209         if (listener && listener->listener_state == NES_CM_LISTENER_ACTIVE_STATE) {
2210                 /* find automatically incs ref count ??? */
2211                 atomic_dec(&listener->ref_count);
2212                 nes_debug(NES_DBG_CM, "Not creating listener since it already exists\n");
2213                 return NULL;
2214         }
2215
2216         if (!listener) {
2217                 /* create a CM listen node (1/2 node to compare incoming traffic to) */
2218                 listener = kzalloc(sizeof(*listener), GFP_ATOMIC);
2219                 if (!listener) {
2220                         nes_debug(NES_DBG_CM, "Not creating listener memory allocation failed\n");
2221                         return NULL;
2222                 }
2223
2224                 listener->loc_addr = htonl(cm_info->loc_addr);
2225                 listener->loc_port = htons(cm_info->loc_port);
2226                 listener->reused_node = 0;
2227
2228                 atomic_set(&listener->ref_count, 1);
2229         }
2230         /* pasive case */
2231         /* find already inc'ed the ref count */
2232         else {
2233                 listener->reused_node = 1;
2234         }
2235
2236         listener->cm_id = cm_info->cm_id;
2237         atomic_set(&listener->pend_accepts_cnt, 0);
2238         listener->cm_core = cm_core;
2239         listener->nesvnic = nesvnic;
2240         atomic_inc(&cm_core->node_cnt);
2241
2242         listener->conn_type = cm_info->conn_type;
2243         listener->backlog = cm_info->backlog;
2244         listener->listener_state = NES_CM_LISTENER_ACTIVE_STATE;
2245
2246         if (!listener->reused_node) {
2247                 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
2248                 list_add(&listener->list, &cm_core->listen_list.list);
2249                 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
2250                 atomic_inc(&cm_core->listen_node_cnt);
2251         }
2252
2253         nes_debug(NES_DBG_CM, "Api - listen(): addr=0x%08X, port=0x%04x,"
2254                   " listener = %p, backlog = %d, cm_id = %p.\n",
2255                   cm_info->loc_addr, cm_info->loc_port,
2256                   listener, listener->backlog, listener->cm_id);
2257
2258         return listener;
2259 }
2260
2261
2262 /**
2263  * mini_cm_connect - make a connection node with params
2264  */
2265 static struct nes_cm_node *mini_cm_connect(struct nes_cm_core *cm_core,
2266                                            struct nes_vnic *nesvnic, u16 private_data_len,
2267                                            void *private_data, struct nes_cm_info *cm_info)
2268 {
2269         int ret = 0;
2270         struct nes_cm_node *cm_node;
2271         struct nes_cm_listener *loopbackremotelistener;
2272         struct nes_cm_node *loopbackremotenode;
2273         struct nes_cm_info loopback_cm_info;
2274         u8 *start_buff;
2275
2276         /* create a CM connection node */
2277         cm_node = make_cm_node(cm_core, nesvnic, cm_info, NULL);
2278         if (!cm_node)
2279                 return NULL;
2280
2281         /* set our node side to client (active) side */
2282         cm_node->tcp_cntxt.client = 1;
2283         cm_node->tcp_cntxt.rcv_wscale = NES_CM_DEFAULT_RCV_WND_SCALE;
2284
2285         if (cm_info->loc_addr == cm_info->rem_addr) {
2286                 loopbackremotelistener = find_listener(cm_core,
2287                                                        ntohl(nesvnic->local_ipaddr), cm_node->rem_port,
2288                                                        NES_CM_LISTENER_ACTIVE_STATE);
2289                 if (loopbackremotelistener == NULL) {
2290                         create_event(cm_node, NES_CM_EVENT_ABORTED);
2291                 } else {
2292                         loopback_cm_info = *cm_info;
2293                         loopback_cm_info.loc_port = cm_info->rem_port;
2294                         loopback_cm_info.rem_port = cm_info->loc_port;
2295                         loopback_cm_info.cm_id = loopbackremotelistener->cm_id;
2296                         loopbackremotenode = make_cm_node(cm_core, nesvnic,
2297                                                           &loopback_cm_info, loopbackremotelistener);
2298                         if (!loopbackremotenode) {
2299                                 rem_ref_cm_node(cm_node->cm_core, cm_node);
2300                                 return NULL;
2301                         }
2302                         atomic_inc(&cm_loopbacks);
2303                         loopbackremotenode->loopbackpartner = cm_node;
2304                         loopbackremotenode->tcp_cntxt.rcv_wscale =
2305                                 NES_CM_DEFAULT_RCV_WND_SCALE;
2306                         cm_node->loopbackpartner = loopbackremotenode;
2307                         memcpy(loopbackremotenode->mpa_frame_buf, private_data,
2308                                private_data_len);
2309                         loopbackremotenode->mpa_frame_size = private_data_len;
2310
2311                         /* we are done handling this state. */
2312                         /* set node to a TSA state */
2313                         cm_node->state = NES_CM_STATE_TSA;
2314                         cm_node->tcp_cntxt.rcv_nxt =
2315                                 loopbackremotenode->tcp_cntxt.loc_seq_num;
2316                         loopbackremotenode->tcp_cntxt.rcv_nxt =
2317                                 cm_node->tcp_cntxt.loc_seq_num;
2318                         cm_node->tcp_cntxt.max_snd_wnd =
2319                                 loopbackremotenode->tcp_cntxt.rcv_wnd;
2320                         loopbackremotenode->tcp_cntxt.max_snd_wnd =
2321                                 cm_node->tcp_cntxt.rcv_wnd;
2322                         cm_node->tcp_cntxt.snd_wnd =
2323                                 loopbackremotenode->tcp_cntxt.rcv_wnd;
2324                         loopbackremotenode->tcp_cntxt.snd_wnd =
2325                                 cm_node->tcp_cntxt.rcv_wnd;
2326                         cm_node->tcp_cntxt.snd_wscale =
2327                                 loopbackremotenode->tcp_cntxt.rcv_wscale;
2328                         loopbackremotenode->tcp_cntxt.snd_wscale =
2329                                 cm_node->tcp_cntxt.rcv_wscale;
2330                         loopbackremotenode->state = NES_CM_STATE_MPAREQ_RCVD;
2331                         create_event(loopbackremotenode, NES_CM_EVENT_MPA_REQ);
2332                 }
2333                 return cm_node;
2334         }
2335
2336         start_buff = &cm_node->mpa_frame_buf[0] + sizeof(struct ietf_mpa_v2);
2337         cm_node->mpa_frame_size = private_data_len;
2338
2339         memcpy(start_buff, private_data, private_data_len);
2340
2341         /* send a syn and goto syn sent state */
2342         cm_node->state = NES_CM_STATE_SYN_SENT;
2343         ret = send_syn(cm_node, 0, NULL);
2344
2345         if (ret) {
2346                 /* error in sending the syn free up the cm_node struct */
2347                 nes_debug(NES_DBG_CM, "Api - connect() FAILED: dest "
2348                           "addr=0x%08X, port=0x%04x, cm_node=%p, cm_id = %p.\n",
2349                           cm_node->rem_addr, cm_node->rem_port, cm_node,
2350                           cm_node->cm_id);
2351                 rem_ref_cm_node(cm_node->cm_core, cm_node);
2352                 cm_node = NULL;
2353         }
2354
2355         if (cm_node) {
2356                 nes_debug(NES_DBG_CM, "Api - connect(): dest addr=0x%08X,"
2357                           "port=0x%04x, cm_node=%p, cm_id = %p.\n",
2358                           cm_node->rem_addr, cm_node->rem_port, cm_node,
2359                           cm_node->cm_id);
2360         }
2361
2362         return cm_node;
2363 }
2364
2365
/**
 * mini_cm_accept - accept a connection
 * @cm_core: unused
 * @cm_node: unused
 *
 * Stub; this function is never called.  Always reports success (0).
 */
static int mini_cm_accept(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
{
	/* nothing to do */
	return 0;
}
2374
2375
2376 /**
2377  * mini_cm_reject - reject and teardown a connection
2378  */
2379 static int mini_cm_reject(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
2380 {
2381         int ret = 0;
2382         int err = 0;
2383         int passive_state;
2384         struct nes_cm_event event;
2385         struct iw_cm_id *cm_id = cm_node->cm_id;
2386         struct nes_cm_node *loopback = cm_node->loopbackpartner;
2387
2388         nes_debug(NES_DBG_CM, "%s cm_node=%p type=%d state=%d\n",
2389                   __func__, cm_node, cm_node->tcp_cntxt.client, cm_node->state);
2390
2391         if (cm_node->tcp_cntxt.client)
2392                 return ret;
2393         cleanup_retrans_entry(cm_node);
2394
2395         if (!loopback) {
2396                 passive_state = atomic_add_return(1, &cm_node->passive_state);
2397                 if (passive_state == NES_SEND_RESET_EVENT) {
2398                         cm_node->state = NES_CM_STATE_CLOSED;
2399                         rem_ref_cm_node(cm_core, cm_node);
2400                 } else {
2401                         if (cm_node->state == NES_CM_STATE_LISTENER_DESTROYED) {
2402                                 rem_ref_cm_node(cm_core, cm_node);
2403                         } else {
2404                                 ret = send_mpa_reject(cm_node);
2405                                 if (ret) {
2406                                         cm_node->state = NES_CM_STATE_CLOSED;
2407                                         err = send_reset(cm_node, NULL);
2408                                         if (err)
2409                                                 WARN_ON(1);
2410                                 } else {
2411                                         cm_id->add_ref(cm_id);
2412                                 }
2413                         }
2414                 }
2415         } else {
2416                 cm_node->cm_id = NULL;
2417                 if (cm_node->state == NES_CM_STATE_LISTENER_DESTROYED) {
2418                         rem_ref_cm_node(cm_core, cm_node);
2419                         rem_ref_cm_node(cm_core, loopback);
2420                 } else {
2421                         event.cm_node = loopback;
2422                         event.cm_info.rem_addr = loopback->rem_addr;
2423                         event.cm_info.loc_addr = loopback->loc_addr;
2424                         event.cm_info.rem_port = loopback->rem_port;
2425                         event.cm_info.loc_port = loopback->loc_port;
2426                         event.cm_info.cm_id = loopback->cm_id;
2427                         cm_event_mpa_reject(&event);
2428                         rem_ref_cm_node(cm_core, cm_node);
2429                         loopback->state = NES_CM_STATE_CLOSING;
2430
2431                         cm_id = loopback->cm_id;
2432                         rem_ref_cm_node(cm_core, loopback);
2433                         cm_id->rem_ref(cm_id);
2434                 }
2435         }
2436
2437         return ret;
2438 }
2439
2440
2441 /**
2442  * mini_cm_close
2443  */
2444 static int mini_cm_close(struct nes_cm_core *cm_core, struct nes_cm_node *cm_node)
2445 {
2446         int ret = 0;
2447
2448         if (!cm_core || !cm_node)
2449                 return -EINVAL;
2450
2451         switch (cm_node->state) {
2452         case NES_CM_STATE_SYN_RCVD:
2453         case NES_CM_STATE_SYN_SENT:
2454         case NES_CM_STATE_ONE_SIDE_ESTABLISHED:
2455         case NES_CM_STATE_ESTABLISHED:
2456         case NES_CM_STATE_ACCEPTING:
2457         case NES_CM_STATE_MPAREQ_SENT:
2458         case NES_CM_STATE_MPAREQ_RCVD:
2459                 cleanup_retrans_entry(cm_node);
2460                 send_reset(cm_node, NULL);
2461                 break;
2462         case NES_CM_STATE_CLOSE_WAIT:
2463                 cm_node->state = NES_CM_STATE_LAST_ACK;
2464                 send_fin(cm_node, NULL);
2465                 break;
2466         case NES_CM_STATE_FIN_WAIT1:
2467         case NES_CM_STATE_FIN_WAIT2:
2468         case NES_CM_STATE_LAST_ACK:
2469         case NES_CM_STATE_TIME_WAIT:
2470         case NES_CM_STATE_CLOSING:
2471                 ret = -1;
2472                 break;
2473         case NES_CM_STATE_LISTENING:
2474                 cleanup_retrans_entry(cm_node);
2475                 send_reset(cm_node, NULL);
2476                 break;
2477         case NES_CM_STATE_MPAREJ_RCVD:
2478         case NES_CM_STATE_UNKNOWN:
2479         case NES_CM_STATE_INITED:
2480         case NES_CM_STATE_CLOSED:
2481         case NES_CM_STATE_LISTENER_DESTROYED:
2482                 ret = rem_ref_cm_node(cm_core, cm_node);
2483                 break;
2484         case NES_CM_STATE_TSA:
2485                 if (cm_node->send_entry)
2486                         printk(KERN_ERR "ERROR Close got called from STATE_TSA "
2487                                "send_entry=%p\n", cm_node->send_entry);
2488                 ret = rem_ref_cm_node(cm_core, cm_node);
2489                 break;
2490         }
2491         return ret;
2492 }
2493
2494
2495 /**
2496  * recv_pkt - recv an ETHERNET packet, and process it through CM
2497  * node state machine
2498  */
2499 static int mini_cm_recv_pkt(struct nes_cm_core *cm_core,
2500                             struct nes_vnic *nesvnic, struct sk_buff *skb)
2501 {
2502         struct nes_cm_node *cm_node = NULL;
2503         struct nes_cm_listener *listener = NULL;
2504         struct iphdr *iph;
2505         struct tcphdr *tcph;
2506         struct nes_cm_info nfo;
2507         int skb_handled = 1;
2508         __be32 tmp_daddr, tmp_saddr;
2509
2510         if (!skb)
2511                 return 0;
2512         if (skb->len < sizeof(struct iphdr) + sizeof(struct tcphdr))
2513                 return 0;
2514
2515         iph = (struct iphdr *)skb->data;
2516         tcph = (struct tcphdr *)(skb->data + sizeof(struct iphdr));
2517
2518         nfo.loc_addr = ntohl(iph->daddr);
2519         nfo.loc_port = ntohs(tcph->dest);
2520         nfo.rem_addr = ntohl(iph->saddr);
2521         nfo.rem_port = ntohs(tcph->source);
2522
2523         tmp_daddr = cpu_to_be32(iph->daddr);
2524         tmp_saddr = cpu_to_be32(iph->saddr);
2525
2526         nes_debug(NES_DBG_CM, "Received packet: dest=%pI4:0x%04X src=%pI4:0x%04X\n",
2527                   &tmp_daddr, tcph->dest, &tmp_saddr, tcph->source);
2528
2529         do {
2530                 cm_node = find_node(cm_core,
2531                                     nfo.rem_port, nfo.rem_addr,
2532                                     nfo.loc_port, nfo.loc_addr);
2533
2534                 if (!cm_node) {
2535                         /* Only type of packet accepted are for */
2536                         /* the PASSIVE open (syn only) */
2537                         if ((!tcph->syn) || (tcph->ack)) {
2538                                 skb_handled = 0;
2539                                 break;
2540                         }
2541                         listener = find_listener(cm_core, nfo.loc_addr,
2542                                                  nfo.loc_port,
2543                                                  NES_CM_LISTENER_ACTIVE_STATE);
2544                         if (!listener) {
2545                                 nfo.cm_id = NULL;
2546                                 nfo.conn_type = 0;
2547                                 nes_debug(NES_DBG_CM, "Unable to find listener for the pkt\n");
2548                                 skb_handled = 0;
2549                                 break;
2550                         }
2551                         nfo.cm_id = listener->cm_id;
2552                         nfo.conn_type = listener->conn_type;
2553                         cm_node = make_cm_node(cm_core, nesvnic, &nfo,
2554                                                listener);
2555                         if (!cm_node) {
2556                                 nes_debug(NES_DBG_CM, "Unable to allocate "
2557                                           "node\n");
2558                                 cm_packets_dropped++;
2559                                 atomic_dec(&listener->ref_count);
2560                                 dev_kfree_skb_any(skb);
2561                                 break;
2562                         }
2563                         if (!tcph->rst && !tcph->fin) {
2564                                 cm_node->state = NES_CM_STATE_LISTENING;
2565                         } else {
2566                                 cm_packets_dropped++;
2567                                 rem_ref_cm_node(cm_core, cm_node);
2568                                 dev_kfree_skb_any(skb);
2569                                 break;
2570                         }
2571                         add_ref_cm_node(cm_node);
2572                 } else if (cm_node->state == NES_CM_STATE_TSA) {
2573                         if (cm_node->nesqp->pau_mode)
2574                                 nes_queue_mgt_skbs(skb, nesvnic, cm_node->nesqp);
2575                         else {
2576                                 rem_ref_cm_node(cm_core, cm_node);
2577                                 atomic_inc(&cm_accel_dropped_pkts);
2578                                 dev_kfree_skb_any(skb);
2579                         }
2580                         break;
2581                 }
2582                 skb_reset_network_header(skb);
2583                 skb_set_transport_header(skb, sizeof(*tcph));
2584                 skb->len = ntohs(iph->tot_len);
2585                 process_packet(cm_node, skb, cm_core);
2586                 rem_ref_cm_node(cm_core, cm_node);
2587         } while (0);
2588         return skb_handled;
2589 }
2590
2591
2592 /**
2593  * nes_cm_alloc_core - allocate a top level instance of a cm core
2594  */
2595 static struct nes_cm_core *nes_cm_alloc_core(void)
2596 {
2597         struct nes_cm_core *cm_core;
2598
2599         /* setup the CM core */
2600         /* alloc top level core control structure */
2601         cm_core = kzalloc(sizeof(*cm_core), GFP_KERNEL);
2602         if (!cm_core)
2603                 return NULL;
2604
2605         INIT_LIST_HEAD(&cm_core->connected_nodes);
2606         init_timer(&cm_core->tcp_timer);
2607         cm_core->tcp_timer.function = nes_cm_timer_tick;
2608
2609         cm_core->mtu = NES_CM_DEFAULT_MTU;
2610         cm_core->state = NES_CM_STATE_INITED;
2611         cm_core->free_tx_pkt_max = NES_CM_DEFAULT_FREE_PKTS;
2612
2613         atomic_set(&cm_core->events_posted, 0);
2614
2615         cm_core->api = &nes_cm_api;
2616
2617         spin_lock_init(&cm_core->ht_lock);
2618         spin_lock_init(&cm_core->listen_list_lock);
2619
2620         INIT_LIST_HEAD(&cm_core->listen_list.list);
2621
2622         nes_debug(NES_DBG_CM, "Init CM Core completed -- cm_core=%p\n", cm_core);
2623
2624         nes_debug(NES_DBG_CM, "Enable QUEUE EVENTS\n");
2625         cm_core->event_wq = create_singlethread_workqueue("nesewq");
2626         cm_core->post_event = nes_cm_post_event;
2627         nes_debug(NES_DBG_CM, "Enable QUEUE DISCONNECTS\n");
2628         cm_core->disconn_wq = create_singlethread_workqueue("nesdwq");
2629
2630         print_core(cm_core);
2631         return cm_core;
2632 }
2633
2634
2635 /**
2636  * mini_cm_dealloc_core - deallocate a top level instance of a cm core
2637  */
2638 static int mini_cm_dealloc_core(struct nes_cm_core *cm_core)
2639 {
2640         nes_debug(NES_DBG_CM, "De-Alloc CM Core (%p)\n", cm_core);
2641
2642         if (!cm_core)
2643                 return -EINVAL;
2644
2645         barrier();
2646
2647         if (timer_pending(&cm_core->tcp_timer))
2648                 del_timer(&cm_core->tcp_timer);
2649
2650         destroy_workqueue(cm_core->event_wq);
2651         destroy_workqueue(cm_core->disconn_wq);
2652         nes_debug(NES_DBG_CM, "\n");
2653         kfree(cm_core);
2654
2655         return 0;
2656 }
2657
2658
2659 /**
2660  * mini_cm_get
2661  */
2662 static int mini_cm_get(struct nes_cm_core *cm_core)
2663 {
2664         return cm_core->state;
2665 }
2666
2667
2668 /**
2669  * mini_cm_set
2670  */
2671 static int mini_cm_set(struct nes_cm_core *cm_core, u32 type, u32 value)
2672 {
2673         int ret = 0;
2674
2675         switch (type) {
2676         case NES_CM_SET_PKT_SIZE:
2677                 cm_core->mtu = value;
2678                 break;
2679         case NES_CM_SET_FREE_PKT_Q_SIZE:
2680                 cm_core->free_tx_pkt_max = value;
2681                 break;
2682         default:
2683                 /* unknown set option */
2684                 ret = -EINVAL;
2685         }
2686
2687         return ret;
2688 }
2689
2690
2691 /**
2692  * nes_cm_init_tsa_conn setup HW; MPA frames must be
2693  * successfully exchanged when this is called
2694  */
2695 static int nes_cm_init_tsa_conn(struct nes_qp *nesqp, struct nes_cm_node *cm_node)
2696 {
2697         int ret = 0;
2698
2699         if (!nesqp)
2700                 return -EINVAL;
2701
2702         nesqp->nesqp_context->misc |= cpu_to_le32(NES_QPCONTEXT_MISC_IPV4 |
2703                                                   NES_QPCONTEXT_MISC_NO_NAGLE | NES_QPCONTEXT_MISC_DO_NOT_FRAG |
2704                                                   NES_QPCONTEXT_MISC_DROS);
2705
2706         if (cm_node->tcp_cntxt.snd_wscale || cm_node->tcp_cntxt.rcv_wscale)
2707                 nesqp->nesqp_context->misc |= cpu_to_le32(NES_QPCONTEXT_MISC_WSCALE);
2708
2709         nesqp->nesqp_context->misc2 |= cpu_to_le32(64 << NES_QPCONTEXT_MISC2_TTL_SHIFT);
2710
2711         nesqp->nesqp_context->mss |= cpu_to_le32(((u32)cm_node->tcp_cntxt.mss) << 16);
2712
2713         nesqp->nesqp_context->tcp_state_flow_label |= cpu_to_le32(
2714                 (u32)NES_QPCONTEXT_TCPSTATE_EST << NES_QPCONTEXT_TCPFLOW_TCP_STATE_SHIFT);
2715
2716         nesqp->nesqp_context->pd_index_wscale |= cpu_to_le32(
2717                 (cm_node->tcp_cntxt.snd_wscale << NES_QPCONTEXT_PDWSCALE_SND_WSCALE_SHIFT) &
2718                 NES_QPCONTEXT_PDWSCALE_SND_WSCALE_MASK);
2719
2720         nesqp->nesqp_context->pd_index_wscale |= cpu_to_le32(
2721                 (cm_node->tcp_cntxt.rcv_wscale << NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_SHIFT) &
2722                 NES_QPCONTEXT_PDWSCALE_RCV_WSCALE_MASK);
2723
2724         nesqp->nesqp_context->keepalive = cpu_to_le32(0x80);
2725         nesqp->nesqp_context->ts_recent = 0;
2726         nesqp->nesqp_context->ts_age = 0;
2727         nesqp->nesqp_context->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2728         nesqp->nesqp_context->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
2729         nesqp->nesqp_context->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
2730         nesqp->nesqp_context->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
2731                                                     cm_node->tcp_cntxt.rcv_wscale);
2732         nesqp->nesqp_context->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2733         nesqp->nesqp_context->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2734         nesqp->nesqp_context->srtt = 0;
2735         nesqp->nesqp_context->rttvar = cpu_to_le32(0x6);
2736         nesqp->nesqp_context->ssthresh = cpu_to_le32(0x3FFFC000);
2737         nesqp->nesqp_context->cwnd = cpu_to_le32(2 * cm_node->tcp_cntxt.mss);
2738         nesqp->nesqp_context->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
2739         nesqp->nesqp_context->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
2740         nesqp->nesqp_context->max_snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
2741
2742         nes_debug(NES_DBG_CM, "QP%u: rcv_nxt = 0x%08X, snd_nxt = 0x%08X,"
2743                   " Setting MSS to %u, PDWscale = 0x%08X, rcv_wnd = %u, context misc = 0x%08X.\n",
2744                   nesqp->hwqp.qp_id, le32_to_cpu(nesqp->nesqp_context->rcv_nxt),
2745                   le32_to_cpu(nesqp->nesqp_context->snd_nxt),
2746                   cm_node->tcp_cntxt.mss, le32_to_cpu(nesqp->nesqp_context->pd_index_wscale),
2747                   le32_to_cpu(nesqp->nesqp_context->rcv_wnd),
2748                   le32_to_cpu(nesqp->nesqp_context->misc));
2749         nes_debug(NES_DBG_CM, "  snd_wnd  = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->snd_wnd));
2750         nes_debug(NES_DBG_CM, "  snd_cwnd = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->cwnd));
2751         nes_debug(NES_DBG_CM, "  max_swnd = 0x%08X.\n", le32_to_cpu(nesqp->nesqp_context->max_snd_wnd));
2752
2753         nes_debug(NES_DBG_CM, "Change cm_node state to TSA\n");
2754         cm_node->state = NES_CM_STATE_TSA;
2755
2756         return ret;
2757 }
2758
2759
2760 /**
2761  * nes_cm_disconn
2762  */
2763 int nes_cm_disconn(struct nes_qp *nesqp)
2764 {
2765         struct disconn_work *work;
2766
2767         work = kzalloc(sizeof *work, GFP_ATOMIC);
2768         if (!work)
2769                 return -ENOMEM;  /* Timer will clean up */
2770
2771         nes_add_ref(&nesqp->ibqp);
2772         work->nesqp = nesqp;
2773         INIT_WORK(&work->work, nes_disconnect_worker);
2774         queue_work(g_cm_core->disconn_wq, &work->work);
2775         return 0;
2776 }
2777
2778
2779 /**
2780  * nes_disconnect_worker
2781  */
2782 static void nes_disconnect_worker(struct work_struct *work)
2783 {
2784         struct disconn_work *dwork = container_of(work, struct disconn_work, work);
2785         struct nes_qp *nesqp = dwork->nesqp;
2786
2787         kfree(dwork);
2788         nes_debug(NES_DBG_CM, "processing AEQE id 0x%04X for QP%u.\n",
2789                   nesqp->last_aeq, nesqp->hwqp.qp_id);
2790         nes_cm_disconn_true(nesqp);
2791         nes_rem_ref(&nesqp->ibqp);
2792 }
2793
2794
2795 /**
2796  * nes_cm_disconn_true
2797  */
2798 static int nes_cm_disconn_true(struct nes_qp *nesqp)
2799 {
2800         unsigned long flags;
2801         int ret = 0;
2802         struct iw_cm_id *cm_id;
2803         struct iw_cm_event cm_event;
2804         struct nes_vnic *nesvnic;
2805         u16 last_ae;
2806         u8 original_hw_tcp_state;
2807         u8 original_ibqp_state;
2808         int disconn_status = 0;
2809         int issue_disconn = 0;
2810         int issue_close = 0;
2811         int issue_flush = 0;
2812         u32 flush_q = NES_CQP_FLUSH_RQ;
2813         struct ib_event ibevent;
2814
2815         if (!nesqp) {
2816                 nes_debug(NES_DBG_CM, "disconnect_worker nesqp is NULL\n");
2817                 return -1;
2818         }
2819
2820         spin_lock_irqsave(&nesqp->lock, flags);
2821         cm_id = nesqp->cm_id;
2822         /* make sure we havent already closed this connection */
2823         if (!cm_id) {
2824                 nes_debug(NES_DBG_CM, "QP%u disconnect_worker cmid is NULL\n",
2825                           nesqp->hwqp.qp_id);
2826                 spin_unlock_irqrestore(&nesqp->lock, flags);
2827                 return -1;
2828         }
2829
2830         nesvnic = to_nesvnic(nesqp->ibqp.device);
2831         nes_debug(NES_DBG_CM, "Disconnecting QP%u\n", nesqp->hwqp.qp_id);
2832
2833         original_hw_tcp_state = nesqp->hw_tcp_state;
2834         original_ibqp_state = nesqp->ibqp_state;
2835         last_ae = nesqp->last_aeq;
2836
2837         if (nesqp->term_flags) {
2838                 issue_disconn = 1;
2839                 issue_close = 1;
2840                 nesqp->cm_id = NULL;
2841                 if (nesqp->flush_issued == 0) {
2842                         nesqp->flush_issued = 1;
2843                         issue_flush = 1;
2844                 }
2845         } else if ((original_hw_tcp_state == NES_AEQE_TCP_STATE_CLOSE_WAIT) ||
2846                         ((original_ibqp_state == IB_QPS_RTS) &&
2847                         (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET))) {
2848                 issue_disconn = 1;
2849                 if (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET)
2850                         disconn_status = -ECONNRESET;
2851         }
2852
2853         if (((original_hw_tcp_state == NES_AEQE_TCP_STATE_CLOSED) ||
2854                  (original_hw_tcp_state == NES_AEQE_TCP_STATE_TIME_WAIT) ||
2855                  (last_ae == NES_AEQE_AEID_RDMAP_ROE_BAD_LLP_CLOSE) ||
2856                  (last_ae == NES_AEQE_AEID_LLP_CONNECTION_RESET))) {
2857                 issue_close = 1;
2858                 nesqp->cm_id = NULL;
2859                 if (nesqp->flush_issued == 0) {
2860                         nesqp->flush_issued = 1;
2861                         issue_flush = 1;
2862                 }
2863         }
2864
2865         spin_unlock_irqrestore(&nesqp->lock, flags);
2866
2867         if ((issue_flush) && (nesqp->destroyed == 0)) {
2868                 /* Flush the queue(s) */
2869                 if (nesqp->hw_iwarp_state >= NES_AEQE_IWARP_STATE_TERMINATE)
2870                         flush_q |= NES_CQP_FLUSH_SQ;
2871                 flush_wqes(nesvnic->nesdev, nesqp, flush_q, 1);
2872
2873                 if (nesqp->term_flags) {
2874                         ibevent.device = nesqp->ibqp.device;
2875                         ibevent.event = nesqp->terminate_eventtype;
2876                         ibevent.element.qp = &nesqp->ibqp;
2877                         nesqp->ibqp.event_handler(&ibevent, nesqp->ibqp.qp_context);
2878                 }
2879         }
2880
2881         if ((cm_id) && (cm_id->event_handler)) {
2882                 if (issue_disconn) {
2883                         atomic_inc(&cm_disconnects);
2884                         cm_event.event = IW_CM_EVENT_DISCONNECT;
2885                         cm_event.status = disconn_status;
2886                         cm_event.local_addr = cm_id->local_addr;
2887                         cm_event.remote_addr = cm_id->remote_addr;
2888                         cm_event.private_data = NULL;
2889                         cm_event.private_data_len = 0;
2890
2891                         nes_debug(NES_DBG_CM, "Generating a CM Disconnect Event"
2892                                   " for  QP%u, SQ Head = %u, SQ Tail = %u. "
2893                                   "cm_id = %p, refcount = %u.\n",
2894                                   nesqp->hwqp.qp_id, nesqp->hwqp.sq_head,
2895                                   nesqp->hwqp.sq_tail, cm_id,
2896                                   atomic_read(&nesqp->refcount));
2897
2898                         ret = cm_id->event_handler(cm_id, &cm_event);
2899                         if (ret)
2900                                 nes_debug(NES_DBG_CM, "OFA CM event_handler "
2901                                           "returned, ret=%d\n", ret);
2902                 }
2903
2904                 if (issue_close) {
2905                         atomic_inc(&cm_closes);
2906                         nes_disconnect(nesqp, 1);
2907
2908                         cm_id->provider_data = nesqp;
2909                         /* Send up the close complete event */
2910                         cm_event.event = IW_CM_EVENT_CLOSE;
2911                         cm_event.status = 0;
2912                         cm_event.provider_data = cm_id->provider_data;
2913                         cm_event.local_addr = cm_id->local_addr;
2914                         cm_event.remote_addr = cm_id->remote_addr;
2915                         cm_event.private_data = NULL;
2916                         cm_event.private_data_len = 0;
2917
2918                         ret = cm_id->event_handler(cm_id, &cm_event);
2919                         if (ret)
2920                                 nes_debug(NES_DBG_CM, "OFA CM event_handler returned, ret=%d\n", ret);
2921
2922                         cm_id->rem_ref(cm_id);
2923                 }
2924         }
2925
2926         return 0;
2927 }
2928
2929
2930 /**
2931  * nes_disconnect
2932  */
2933 static int nes_disconnect(struct nes_qp *nesqp, int abrupt)
2934 {
2935         int ret = 0;
2936         struct nes_vnic *nesvnic;
2937         struct nes_device *nesdev;
2938         struct nes_ib_device *nesibdev;
2939
2940         nesvnic = to_nesvnic(nesqp->ibqp.device);
2941         if (!nesvnic)
2942                 return -EINVAL;
2943
2944         nesdev = nesvnic->nesdev;
2945         nesibdev = nesvnic->nesibdev;
2946
2947         nes_debug(NES_DBG_CM, "netdev refcnt = %u.\n",
2948                         netdev_refcnt_read(nesvnic->netdev));
2949
2950         if (nesqp->active_conn) {
2951
2952                 /* indicate this connection is NOT active */
2953                 nesqp->active_conn = 0;
2954         } else {
2955                 /* Need to free the Last Streaming Mode Message */