1/*******************************************************************************
2*
3* Copyright (c) 2015-2016 Intel Corporation.  All rights reserved.
4*
5* This software is available to you under a choice of one of two
6* licenses.  You may choose to be licensed under the terms of the GNU
7* General Public License (GPL) Version 2, available from the file
8* COPYING in the main directory of this source tree, or the
9* OpenFabrics.org BSD license below:
10*
11*   Redistribution and use in source and binary forms, with or
12*   without modification, are permitted provided that the following
13*   conditions are met:
14*
15*    - Redistributions of source code must retain the above
16*	copyright notice, this list of conditions and the following
17*	disclaimer.
18*
19*    - Redistributions in binary form must reproduce the above
20*	copyright notice, this list of conditions and the following
21*	disclaimer in the documentation and/or other materials
22*	provided with the distribution.
23*
24* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31* SOFTWARE.
32*
33*******************************************************************************/
34
35#include <linux/atomic.h>
36#include <linux/ip.h>
37#include <linux/tcp.h>
38#include <linux/init.h>
39#include <linux/if_arp.h>
40#include <linux/if_vlan.h>
41#include <linux/notifier.h>
42#include <linux/net.h>
43#include <linux/types.h>
44#include <linux/timer.h>
45#include <linux/time.h>
46#include <linux/delay.h>
47#include <linux/etherdevice.h>
48#include <linux/netdevice.h>
49#include <linux/random.h>
50#include <linux/list.h>
51#include <linux/threads.h>
52#include <linux/highmem.h>
53#include <net/arp.h>
54#include <net/ndisc.h>
55#include <net/neighbour.h>
56#include <net/route.h>
57#include <net/addrconf.h>
58#include <net/ip6_route.h>
59#include <net/ip_fib.h>
60#include <net/secure_seq.h>
61#include <net/tcp.h>
62#include <asm/checksum.h>
63
64#include "i40iw.h"
65
66static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *);
67static void i40iw_cm_post_event(struct i40iw_cm_event *event);
68static void i40iw_disconnect_worker(struct work_struct *work);
69
70/**
71 * i40iw_free_sqbuf - put back puda buffer if refcount = 0
72 * @vsi: pointer to vsi structure
73 * @buf: puda buffer to free
74 */
75void i40iw_free_sqbuf(struct i40iw_sc_vsi *vsi, void *bufp)
76{
77	struct i40iw_puda_buf *buf = (struct i40iw_puda_buf *)bufp;
78	struct i40iw_puda_rsrc *ilq = vsi->ilq;
79
80	if (!atomic_dec_return(&buf->refcount))
81		i40iw_puda_ret_bufpool(ilq, buf);
82}
83
84/**
85 * i40iw_derive_hw_ird_setting - Calculate IRD
86 *
87 * @cm_ird: IRD of connection's node
88 *
89 * The ird from the connection is rounded to a supported HW
90 * setting (2,8,32,64) and then encoded for ird_size field of
91 * qp_ctx
92 */
93static u8 i40iw_derive_hw_ird_setting(u16 cm_ird)
94{
95	u8 encoded_ird_size;
96
97	/* ird_size field is encoded in qp_ctx */
98	switch (cm_ird ? roundup_pow_of_two(cm_ird) : 0) {
99	case I40IW_HW_IRD_SETTING_64:
100		encoded_ird_size = 3;
101		break;
102	case I40IW_HW_IRD_SETTING_32:
103	case I40IW_HW_IRD_SETTING_16:
104		encoded_ird_size = 2;
105		break;
106	case I40IW_HW_IRD_SETTING_8:
107	case I40IW_HW_IRD_SETTING_4:
108		encoded_ird_size = 1;
109		break;
110	case I40IW_HW_IRD_SETTING_2:
111	default:
112		encoded_ird_size = 0;
113		break;
114	}
115	return encoded_ird_size;
116}
117
118/**
119 * i40iw_record_ird_ord - Record IRD/ORD passed in
120 * @cm_node: connection's node
121 * @conn_ird: connection IRD
122 * @conn_ord: connection ORD
123 */
124static void i40iw_record_ird_ord(struct i40iw_cm_node *cm_node, u32 conn_ird,
125				 u32 conn_ord)
126{
127	if (conn_ird > I40IW_MAX_IRD_SIZE)
128		conn_ird = I40IW_MAX_IRD_SIZE;
129
130	if (conn_ord > I40IW_MAX_ORD_SIZE)
131		conn_ord = I40IW_MAX_ORD_SIZE;
132	else if (!conn_ord && cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO)
133		conn_ord = 1;
134
135	cm_node->ird_size = conn_ird;
136	cm_node->ord_size = conn_ord;
137}
138
139/**
140 * i40iw_copy_ip_ntohl - change network to host ip
141 * @dst: host ip
142 * @src: big endian
143 */
144void i40iw_copy_ip_ntohl(u32 *dst, __be32 *src)
145{
146	*dst++ = ntohl(*src++);
147	*dst++ = ntohl(*src++);
148	*dst++ = ntohl(*src++);
149	*dst = ntohl(*src);
150}
151
152/**
153 * i40iw_copy_ip_htonl - change host addr to network ip
154 * @dst: host ip
155 * @src: little endian
156 */
157static inline void i40iw_copy_ip_htonl(__be32 *dst, u32 *src)
158{
159	*dst++ = htonl(*src++);
160	*dst++ = htonl(*src++);
161	*dst++ = htonl(*src++);
162	*dst = htonl(*src);
163}
164
165/**
166 * i40iw_fill_sockaddr4 - get addr info for passive connection
167 * @cm_node: connection's node
168 * @event: upper layer's cm event
169 */
170static inline void i40iw_fill_sockaddr4(struct i40iw_cm_node *cm_node,
171					struct iw_cm_event *event)
172{
173	struct sockaddr_in *laddr = (struct sockaddr_in *)&event->local_addr;
174	struct sockaddr_in *raddr = (struct sockaddr_in *)&event->remote_addr;
175
176	laddr->sin_family = AF_INET;
177	raddr->sin_family = AF_INET;
178
179	laddr->sin_port = htons(cm_node->loc_port);
180	raddr->sin_port = htons(cm_node->rem_port);
181
182	laddr->sin_addr.s_addr = htonl(cm_node->loc_addr[0]);
183	raddr->sin_addr.s_addr = htonl(cm_node->rem_addr[0]);
184}
185
186/**
187 * i40iw_fill_sockaddr6 - get ipv6 addr info for passive side
188 * @cm_node: connection's node
189 * @event: upper layer's cm event
190 */
191static inline void i40iw_fill_sockaddr6(struct i40iw_cm_node *cm_node,
192					struct iw_cm_event *event)
193{
194	struct sockaddr_in6 *laddr6 = (struct sockaddr_in6 *)&event->local_addr;
195	struct sockaddr_in6 *raddr6 = (struct sockaddr_in6 *)&event->remote_addr;
196
197	laddr6->sin6_family = AF_INET6;
198	raddr6->sin6_family = AF_INET6;
199
200	laddr6->sin6_port = htons(cm_node->loc_port);
201	raddr6->sin6_port = htons(cm_node->rem_port);
202
203	i40iw_copy_ip_htonl(laddr6->sin6_addr.in6_u.u6_addr32,
204			    cm_node->loc_addr);
205	i40iw_copy_ip_htonl(raddr6->sin6_addr.in6_u.u6_addr32,
206			    cm_node->rem_addr);
207}
208
209/**
210 * i40iw_get_addr_info
211 * @cm_node: contains ip/tcp info
212 * @cm_info: to get a copy of the cm_node ip/tcp info
213*/
214static void i40iw_get_addr_info(struct i40iw_cm_node *cm_node,
215				struct i40iw_cm_info *cm_info)
216{
217	cm_info->ipv4 = cm_node->ipv4;
218	cm_info->vlan_id = cm_node->vlan_id;
219	memcpy(cm_info->loc_addr, cm_node->loc_addr, sizeof(cm_info->loc_addr));
220	memcpy(cm_info->rem_addr, cm_node->rem_addr, sizeof(cm_info->rem_addr));
221	cm_info->loc_port = cm_node->loc_port;
222	cm_info->rem_port = cm_node->rem_port;
223	cm_info->user_pri = cm_node->user_pri;
224}
225
226/**
227 * i40iw_get_cmevent_info - for cm event upcall
228 * @cm_node: connection's node
229 * @cm_id: upper layers cm struct for the event
230 * @event: upper layer's cm event
231 */
232static inline void i40iw_get_cmevent_info(struct i40iw_cm_node *cm_node,
233					  struct iw_cm_id *cm_id,
234					  struct iw_cm_event *event)
235{
236	memcpy(&event->local_addr, &cm_id->m_local_addr,
237	       sizeof(event->local_addr));
238	memcpy(&event->remote_addr, &cm_id->m_remote_addr,
239	       sizeof(event->remote_addr));
240	if (cm_node) {
241		event->private_data = (void *)cm_node->pdata_buf;
242		event->private_data_len = (u8)cm_node->pdata.size;
243		event->ird = cm_node->ird_size;
244		event->ord = cm_node->ord_size;
245	}
246}
247
248/**
249 * i40iw_send_cm_event - upcall cm's event handler
250 * @cm_node: connection's node
251 * @cm_id: upper layer's cm info struct
252 * @type: Event type to indicate
253 * @status: status for the event type
254 */
255static int i40iw_send_cm_event(struct i40iw_cm_node *cm_node,
256			       struct iw_cm_id *cm_id,
257			       enum iw_cm_event_type type,
258			       int status)
259{
260	struct iw_cm_event event;
261
262	memset(&event, 0, sizeof(event));
263	event.event = type;
264	event.status = status;
265	switch (type) {
266	case IW_CM_EVENT_CONNECT_REQUEST:
267		if (cm_node->ipv4)
268			i40iw_fill_sockaddr4(cm_node, &event);
269		else
270			i40iw_fill_sockaddr6(cm_node, &event);
271		event.provider_data = (void *)cm_node;
272		event.private_data = (void *)cm_node->pdata_buf;
273		event.private_data_len = (u8)cm_node->pdata.size;
274		event.ird = cm_node->ird_size;
275		break;
276	case IW_CM_EVENT_CONNECT_REPLY:
277		i40iw_get_cmevent_info(cm_node, cm_id, &event);
278		break;
279	case IW_CM_EVENT_ESTABLISHED:
280		event.ird = cm_node->ird_size;
281		event.ord = cm_node->ord_size;
282		break;
283	case IW_CM_EVENT_DISCONNECT:
284		break;
285	case IW_CM_EVENT_CLOSE:
286		break;
287	default:
288		i40iw_pr_err("event type received type = %d\n", type);
289		return -1;
290	}
291	return cm_id->event_handler(cm_id, &event);
292}
293
294/**
295 * i40iw_create_event - create cm event
296 * @cm_node: connection's node
297 * @type: Event type to generate
298 */
299static struct i40iw_cm_event *i40iw_create_event(struct i40iw_cm_node *cm_node,
300						 enum i40iw_cm_event_type type)
301{
302	struct i40iw_cm_event *event;
303
304	if (!cm_node->cm_id)
305		return NULL;
306
307	event = kzalloc(sizeof(*event), GFP_ATOMIC);
308
309	if (!event)
310		return NULL;
311
312	event->type = type;
313	event->cm_node = cm_node;
314	memcpy(event->cm_info.rem_addr, cm_node->rem_addr, sizeof(event->cm_info.rem_addr));
315	memcpy(event->cm_info.loc_addr, cm_node->loc_addr, sizeof(event->cm_info.loc_addr));
316	event->cm_info.rem_port = cm_node->rem_port;
317	event->cm_info.loc_port = cm_node->loc_port;
318	event->cm_info.cm_id = cm_node->cm_id;
319
320	i40iw_debug(cm_node->dev,
321		    I40IW_DEBUG_CM,
322		    "node=%p event=%p type=%u dst=%pI4 src=%pI4\n",
323		    cm_node,
324		    event,
325		    type,
326		    event->cm_info.loc_addr,
327		    event->cm_info.rem_addr);
328
329	i40iw_cm_post_event(event);
330	return event;
331}
332
333/**
334 * i40iw_free_retrans_entry - free send entry
335 * @cm_node: connection's node
336 */
337static void i40iw_free_retrans_entry(struct i40iw_cm_node *cm_node)
338{
339	struct i40iw_device *iwdev = cm_node->iwdev;
340	struct i40iw_timer_entry *send_entry;
341
342	send_entry = cm_node->send_entry;
343	if (send_entry) {
344		cm_node->send_entry = NULL;
345		i40iw_free_sqbuf(&iwdev->vsi, (void *)send_entry->sqbuf);
346		kfree(send_entry);
347		atomic_dec(&cm_node->ref_count);
348	}
349}
350
351/**
352 * i40iw_cleanup_retrans_entry - free send entry with lock
353 * @cm_node: connection's node
354 */
355static void i40iw_cleanup_retrans_entry(struct i40iw_cm_node *cm_node)
356{
357	unsigned long flags;
358
359	spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
360	i40iw_free_retrans_entry(cm_node);
361	spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
362}
363
364/**
365 * i40iw_form_cm_frame - get a free packet and build frame
366 * @cm_node: connection's node ionfo to use in frame
367 * @options: pointer to options info
368 * @hdr: pointer mpa header
369 * @pdata: pointer to private data
370 * @flags:  indicates FIN or ACK
371 */
372static struct i40iw_puda_buf *i40iw_form_cm_frame(struct i40iw_cm_node *cm_node,
373						  struct i40iw_kmem_info *options,
374						  struct i40iw_kmem_info *hdr,
375						  struct i40iw_kmem_info *pdata,
376						  u8 flags)
377{
378	struct i40iw_puda_buf *sqbuf;
379	struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
380	u8 *buf;
381
382	struct tcphdr *tcph;
383	struct iphdr *iph;
384	struct ipv6hdr *ip6h;
385	struct ethhdr *ethh;
386	u16 packetsize;
387	u16 eth_hlen = ETH_HLEN;
388	u32 opts_len = 0;
389	u32 pd_len = 0;
390	u32 hdr_len = 0;
391	u16 vtag;
392
393	sqbuf = i40iw_puda_get_bufpool(vsi->ilq);
394	if (!sqbuf)
395		return NULL;
396	buf = sqbuf->mem.va;
397
398	if (options)
399		opts_len = (u32)options->size;
400
401	if (hdr)
402		hdr_len = hdr->size;
403
404	if (pdata)
405		pd_len = pdata->size;
406
407	if (cm_node->vlan_id <= VLAN_VID_MASK)
408		eth_hlen += 4;
409
410	if (cm_node->ipv4)
411		packetsize = sizeof(*iph) + sizeof(*tcph);
412	else
413		packetsize = sizeof(*ip6h) + sizeof(*tcph);
414	packetsize += opts_len + hdr_len + pd_len;
415
416	memset(buf, 0x00, eth_hlen + packetsize);
417
418	sqbuf->totallen = packetsize + eth_hlen;
419	sqbuf->maclen = eth_hlen;
420	sqbuf->tcphlen = sizeof(*tcph) + opts_len;
421	sqbuf->scratch = (void *)cm_node;
422
423	ethh = (struct ethhdr *)buf;
424	buf += eth_hlen;
425
426	if (cm_node->ipv4) {
427		sqbuf->ipv4 = true;
428
429		iph = (struct iphdr *)buf;
430		buf += sizeof(*iph);
431		tcph = (struct tcphdr *)buf;
432		buf += sizeof(*tcph);
433
434		ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
435		ether_addr_copy(ethh->h_source, cm_node->loc_mac);
436		if (cm_node->vlan_id <= VLAN_VID_MASK) {
437			((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
438			vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
439			((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
440
441			((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IP);
442		} else {
443			ethh->h_proto = htons(ETH_P_IP);
444		}
445
446		iph->version = IPVERSION;
447		iph->ihl = 5;	/* 5 * 4Byte words, IP headr len */
448		iph->tos = cm_node->tos;
449		iph->tot_len = htons(packetsize);
450		iph->id = htons(++cm_node->tcp_cntxt.loc_id);
451
452		iph->frag_off = htons(0x4000);
453		iph->ttl = 0x40;
454		iph->protocol = IPPROTO_TCP;
455		iph->saddr = htonl(cm_node->loc_addr[0]);
456		iph->daddr = htonl(cm_node->rem_addr[0]);
457	} else {
458		sqbuf->ipv4 = false;
459		ip6h = (struct ipv6hdr *)buf;
460		buf += sizeof(*ip6h);
461		tcph = (struct tcphdr *)buf;
462		buf += sizeof(*tcph);
463
464		ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
465		ether_addr_copy(ethh->h_source, cm_node->loc_mac);
466		if (cm_node->vlan_id <= VLAN_VID_MASK) {
467			((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
468			vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
469			((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
470			((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IPV6);
471		} else {
472			ethh->h_proto = htons(ETH_P_IPV6);
473		}
474		ip6h->version = 6;
475		ip6h->priority = cm_node->tos >> 4;
476		ip6h->flow_lbl[0] = cm_node->tos << 4;
477		ip6h->flow_lbl[1] = 0;
478		ip6h->flow_lbl[2] = 0;
479		ip6h->payload_len = htons(packetsize - sizeof(*ip6h));
480		ip6h->nexthdr = 6;
481		ip6h->hop_limit = 128;
482		i40iw_copy_ip_htonl(ip6h->saddr.in6_u.u6_addr32,
483				    cm_node->loc_addr);
484		i40iw_copy_ip_htonl(ip6h->daddr.in6_u.u6_addr32,
485				    cm_node->rem_addr);
486	}
487
488	tcph->source = htons(cm_node->loc_port);
489	tcph->dest = htons(cm_node->rem_port);
490
491	tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
492
493	if (flags & SET_ACK) {
494		cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
495		tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
496		tcph->ack = 1;
497	} else {
498		tcph->ack_seq = 0;
499	}
500
501	if (flags & SET_SYN) {
502		cm_node->tcp_cntxt.loc_seq_num++;
503		tcph->syn = 1;
504	} else {
505		cm_node->tcp_cntxt.loc_seq_num += hdr_len + pd_len;
506	}
507
508	if (flags & SET_FIN) {
509		cm_node->tcp_cntxt.loc_seq_num++;
510		tcph->fin = 1;
511	}
512
513	if (flags & SET_RST)
514		tcph->rst = 1;
515
516	tcph->doff = (u16)((sizeof(*tcph) + opts_len + 3) >> 2);
517	sqbuf->tcphlen = tcph->doff << 2;
518	tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
519	tcph->urg_ptr = 0;
520
521	if (opts_len) {
522		memcpy(buf, options->addr, opts_len);
523		buf += opts_len;
524	}
525
526	if (hdr_len) {
527		memcpy(buf, hdr->addr, hdr_len);
528		buf += hdr_len;
529	}
530
531	if (pdata && pdata->addr)
532		memcpy(buf, pdata->addr, pdata->size);
533
534	atomic_set(&sqbuf->refcount, 1);
535
536	return sqbuf;
537}
538
539/**
540 * i40iw_send_reset - Send RST packet
541 * @cm_node: connection's node
542 */
543int i40iw_send_reset(struct i40iw_cm_node *cm_node)
544{
545	struct i40iw_puda_buf *sqbuf;
546	int flags = SET_RST | SET_ACK;
547
548	sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, flags);
549	if (!sqbuf) {
550		i40iw_pr_err("no sqbuf\n");
551		return -1;
552	}
553
554	return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 0, 1);
555}
556
557/**
558 * i40iw_active_open_err - send event for active side cm error
559 * @cm_node: connection's node
560 * @reset: Flag to send reset or not
561 */
562static void i40iw_active_open_err(struct i40iw_cm_node *cm_node, bool reset)
563{
564	i40iw_cleanup_retrans_entry(cm_node);
565	cm_node->cm_core->stats_connect_errs++;
566	if (reset) {
567		i40iw_debug(cm_node->dev,
568			    I40IW_DEBUG_CM,
569			    "%s cm_node=%p state=%d\n",
570			    __func__,
571			    cm_node,
572			    cm_node->state);
573		atomic_inc(&cm_node->ref_count);
574		i40iw_send_reset(cm_node);
575	}
576
577	cm_node->state = I40IW_CM_STATE_CLOSED;
578	i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
579}
580
581/**
582 * i40iw_passive_open_err - handle passive side cm error
583 * @cm_node: connection's node
584 * @reset: send reset or just free cm_node
585 */
586static void i40iw_passive_open_err(struct i40iw_cm_node *cm_node, bool reset)
587{
588	i40iw_cleanup_retrans_entry(cm_node);
589	cm_node->cm_core->stats_passive_errs++;
590	cm_node->state = I40IW_CM_STATE_CLOSED;
591	i40iw_debug(cm_node->dev,
592		    I40IW_DEBUG_CM,
593		    "%s cm_node=%p state =%d\n",
594		    __func__,
595		    cm_node,
596		    cm_node->state);
597	if (reset)
598		i40iw_send_reset(cm_node);
599	else
600		i40iw_rem_ref_cm_node(cm_node);
601}
602
603/**
604 * i40iw_event_connect_error - to create connect error event
605 * @event: cm information for connect event
606 */
607static void i40iw_event_connect_error(struct i40iw_cm_event *event)
608{
609	struct i40iw_qp *iwqp;
610	struct iw_cm_id *cm_id;
611
612	cm_id = event->cm_node->cm_id;
613	if (!cm_id)
614		return;
615
616	iwqp = cm_id->provider_data;
617
618	if (!iwqp || !iwqp->iwdev)
619		return;
620
621	iwqp->cm_id = NULL;
622	cm_id->provider_data = NULL;
623	i40iw_send_cm_event(event->cm_node, cm_id,
624			    IW_CM_EVENT_CONNECT_REPLY,
625			    -ECONNRESET);
626	cm_id->rem_ref(cm_id);
627	i40iw_rem_ref_cm_node(event->cm_node);
628}
629
630/**
631 * i40iw_process_options
632 * @cm_node: connection's node
633 * @optionsloc: point to start of options
634 * @optionsize: size of all options
635 * @syn_packet: flag if syn packet
636 */
637static int i40iw_process_options(struct i40iw_cm_node *cm_node,
638				 u8 *optionsloc,
639				 u32 optionsize,
640				 u32 syn_packet)
641{
642	u32 tmp;
643	u32 offset = 0;
644	union all_known_options *all_options;
645	char got_mss_option = 0;
646
647	while (offset < optionsize) {
648		all_options = (union all_known_options *)(optionsloc + offset);
649		switch (all_options->as_base.optionnum) {
650		case OPTION_NUMBER_END:
651			offset = optionsize;
652			break;
653		case OPTION_NUMBER_NONE:
654			offset += 1;
655			continue;
656		case OPTION_NUMBER_MSS:
657			i40iw_debug(cm_node->dev,
658				    I40IW_DEBUG_CM,
659				    "%s: MSS Length: %d Offset: %d Size: %d\n",
660				    __func__,
661				    all_options->as_mss.length,
662				    offset,
663				    optionsize);
664			got_mss_option = 1;
665			if (all_options->as_mss.length != 4)
666				return -1;
667			tmp = ntohs(all_options->as_mss.mss);
668			if (tmp > 0 && tmp < cm_node->tcp_cntxt.mss)
669				cm_node->tcp_cntxt.mss = tmp;
670			break;
671		case OPTION_NUMBER_WINDOW_SCALE:
672			cm_node->tcp_cntxt.snd_wscale =
673			    all_options->as_windowscale.shiftcount;
674			break;
675		default:
676			i40iw_debug(cm_node->dev,
677				    I40IW_DEBUG_CM,
678				    "TCP Option not understood: %x\n",
679				    all_options->as_base.optionnum);
680			break;
681		}
682		offset += all_options->as_base.length;
683	}
684	if (!got_mss_option && syn_packet)
685		cm_node->tcp_cntxt.mss = I40IW_CM_DEFAULT_MSS;
686	return 0;
687}
688
689/**
690 * i40iw_handle_tcp_options -
691 * @cm_node: connection's node
692 * @tcph: pointer tcp header
693 * @optionsize: size of options rcvd
694 * @passive: active or passive flag
695 */
696static int i40iw_handle_tcp_options(struct i40iw_cm_node *cm_node,
697				    struct tcphdr *tcph,
698				    int optionsize,
699				    int passive)
700{
701	u8 *optionsloc = (u8 *)&tcph[1];
702
703	if (optionsize) {
704		if (i40iw_process_options(cm_node,
705					  optionsloc,
706					  optionsize,
707					  (u32)tcph->syn)) {
708			i40iw_debug(cm_node->dev,
709				    I40IW_DEBUG_CM,
710				    "%s: Node %p, Sending RESET\n",
711				    __func__,
712				    cm_node);
713			if (passive)
714				i40iw_passive_open_err(cm_node, true);
715			else
716				i40iw_active_open_err(cm_node, true);
717			return -1;
718		}
719	}
720
721	cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
722	    cm_node->tcp_cntxt.snd_wscale;
723
724	if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
725		cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
726	return 0;
727}
728
729/**
730 * i40iw_build_mpa_v1 - build a MPA V1 frame
731 * @cm_node: connection's node
732 * @mpa_key: to do read0 or write0
733 */
734static void i40iw_build_mpa_v1(struct i40iw_cm_node *cm_node,
735			       void *start_addr,
736			       u8 mpa_key)
737{
738	struct ietf_mpa_v1 *mpa_frame = (struct ietf_mpa_v1 *)start_addr;
739
740	switch (mpa_key) {
741	case MPA_KEY_REQUEST:
742		memcpy(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE);
743		break;
744	case MPA_KEY_REPLY:
745		memcpy(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
746		break;
747	default:
748		break;
749	}
750	mpa_frame->flags = IETF_MPA_FLAGS_CRC;
751	mpa_frame->rev = cm_node->mpa_frame_rev;
752	mpa_frame->priv_data_len = htons(cm_node->pdata.size);
753}
754
755/**
756 * i40iw_build_mpa_v2 - build a MPA V2 frame
757 * @cm_node: connection's node
758 * @start_addr: buffer start address
759 * @mpa_key: to do read0 or write0
760 */
761static void i40iw_build_mpa_v2(struct i40iw_cm_node *cm_node,
762			       void *start_addr,
763			       u8 mpa_key)
764{
765	struct ietf_mpa_v2 *mpa_frame = (struct ietf_mpa_v2 *)start_addr;
766	struct ietf_rtr_msg *rtr_msg = &mpa_frame->rtr_msg;
767	u16 ctrl_ird, ctrl_ord;
768
769	/* initialize the upper 5 bytes of the frame */
770	i40iw_build_mpa_v1(cm_node, start_addr, mpa_key);
771	mpa_frame->flags |= IETF_MPA_V2_FLAG;
772	mpa_frame->priv_data_len += htons(IETF_RTR_MSG_SIZE);
773
774	/* initialize RTR msg */
775	if (cm_node->mpav2_ird_ord == IETF_NO_IRD_ORD) {
776		ctrl_ird = IETF_NO_IRD_ORD;
777		ctrl_ord = IETF_NO_IRD_ORD;
778	} else {
779		ctrl_ird = (cm_node->ird_size > IETF_NO_IRD_ORD) ?
780			IETF_NO_IRD_ORD : cm_node->ird_size;
781		ctrl_ord = (cm_node->ord_size > IETF_NO_IRD_ORD) ?
782			IETF_NO_IRD_ORD : cm_node->ord_size;
783	}
784
785	ctrl_ird |= IETF_PEER_TO_PEER;
786
787	switch (mpa_key) {
788	case MPA_KEY_REQUEST:
789		ctrl_ord |= IETF_RDMA0_WRITE;
790		ctrl_ord |= IETF_RDMA0_READ;
791		break;
792	case MPA_KEY_REPLY:
793		switch (cm_node->send_rdma0_op) {
794		case SEND_RDMA_WRITE_ZERO:
795			ctrl_ord |= IETF_RDMA0_WRITE;
796			break;
797		case SEND_RDMA_READ_ZERO:
798			ctrl_ord |= IETF_RDMA0_READ;
799			break;
800		}
801		break;
802	default:
803		break;
804	}
805	rtr_msg->ctrl_ird = htons(ctrl_ird);
806	rtr_msg->ctrl_ord = htons(ctrl_ord);
807}
808
809/**
810 * i40iw_cm_build_mpa_frame - build mpa frame for mpa version 1 or version 2
811 * @cm_node: connection's node
812 * @mpa: mpa: data buffer
813 * @mpa_key: to do read0 or write0
814 */
815static int i40iw_cm_build_mpa_frame(struct i40iw_cm_node *cm_node,
816				    struct i40iw_kmem_info *mpa,
817				    u8 mpa_key)
818{
819	int hdr_len = 0;
820
821	switch (cm_node->mpa_frame_rev) {
822	case IETF_MPA_V1:
823		hdr_len = sizeof(struct ietf_mpa_v1);
824		i40iw_build_mpa_v1(cm_node, mpa->addr, mpa_key);
825		break;
826	case IETF_MPA_V2:
827		hdr_len = sizeof(struct ietf_mpa_v2);
828		i40iw_build_mpa_v2(cm_node, mpa->addr, mpa_key);
829		break;
830	default:
831		break;
832	}
833
834	return hdr_len;
835}
836
837/**
838 * i40iw_send_mpa_request - active node send mpa request to passive node
839 * @cm_node: connection's node
840 */
841static int i40iw_send_mpa_request(struct i40iw_cm_node *cm_node)
842{
843	struct i40iw_puda_buf *sqbuf;
844
845	if (!cm_node) {
846		i40iw_pr_err("cm_node == NULL\n");
847		return -1;
848	}
849
850	cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
851	cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
852							 &cm_node->mpa_hdr,
853							 MPA_KEY_REQUEST);
854	if (!cm_node->mpa_hdr.size) {
855		i40iw_pr_err("mpa size = %d\n", cm_node->mpa_hdr.size);
856		return -1;
857	}
858
859	sqbuf = i40iw_form_cm_frame(cm_node,
860				    NULL,
861				    &cm_node->mpa_hdr,
862				    &cm_node->pdata,
863				    SET_ACK);
864	if (!sqbuf) {
865		i40iw_pr_err("sq_buf == NULL\n");
866		return -1;
867	}
868	return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
869}
870
871/**
872 * i40iw_send_mpa_reject -
873 * @cm_node: connection's node
874 * @pdata: reject data for connection
875 * @plen: length of reject data
876 */
877static int i40iw_send_mpa_reject(struct i40iw_cm_node *cm_node,
878				 const void *pdata,
879				 u8 plen)
880{
881	struct i40iw_puda_buf *sqbuf;
882	struct i40iw_kmem_info priv_info;
883
884	cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
885	cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
886							 &cm_node->mpa_hdr,
887							 MPA_KEY_REPLY);
888
889	cm_node->mpa_frame.flags |= IETF_MPA_FLAGS_REJECT;
890	priv_info.addr = (void *)pdata;
891	priv_info.size = plen;
892
893	sqbuf = i40iw_form_cm_frame(cm_node,
894				    NULL,
895				    &cm_node->mpa_hdr,
896				    &priv_info,
897				    SET_ACK | SET_FIN);
898	if (!sqbuf) {
899		i40iw_pr_err("no sqbuf\n");
900		return -ENOMEM;
901	}
902	cm_node->state = I40IW_CM_STATE_FIN_WAIT1;
903	return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
904}
905
906/**
907 * recv_mpa - process an IETF MPA frame
908 * @cm_node: connection's node
909 * @buffer: Data pointer
910 * @type: to return accept or reject
911 * @len: Len of mpa buffer
912 */
913static int i40iw_parse_mpa(struct i40iw_cm_node *cm_node, u8 *buffer, u32 *type, u32 len)
914{
915	struct ietf_mpa_v1 *mpa_frame;
916	struct ietf_mpa_v2 *mpa_v2_frame;
917	struct ietf_rtr_msg *rtr_msg;
918	int mpa_hdr_len;
919	int priv_data_len;
920
921	*type = I40IW_MPA_REQUEST_ACCEPT;
922
923	if (len < sizeof(struct ietf_mpa_v1)) {
924		i40iw_pr_err("ietf buffer small (%x)\n", len);
925		return -1;
926	}
927
928	mpa_frame = (struct ietf_mpa_v1 *)buffer;
929	mpa_hdr_len = sizeof(struct ietf_mpa_v1);
930	priv_data_len = ntohs(mpa_frame->priv_data_len);
931
932	if (priv_data_len > IETF_MAX_PRIV_DATA_LEN) {
933		i40iw_pr_err("large pri_data %d\n", priv_data_len);
934		return -1;
935	}
936	if (mpa_frame->rev != IETF_MPA_V1 && mpa_frame->rev != IETF_MPA_V2) {
937		i40iw_pr_err("unsupported mpa rev = %d\n", mpa_frame->rev);
938		return -1;
939	}
940	if (mpa_frame->rev > cm_node->mpa_frame_rev) {
941		i40iw_pr_err("rev %d\n", mpa_frame->rev);
942		return -1;
943	}
944	cm_node->mpa_frame_rev = mpa_frame->rev;
945
946	if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
947		if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE)) {
948			i40iw_pr_err("Unexpected MPA Key received\n");
949			return -1;
950		}
951	} else {
952		if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE)) {
953			i40iw_pr_err("Unexpected MPA Key received\n");
954			return -1;
955		}
956	}
957
958	if (priv_data_len + mpa_hdr_len > len) {
959		i40iw_pr_err("ietf buffer len(%x + %x != %x)\n",
960			     priv_data_len, mpa_hdr_len, len);
961		return -1;
962	}
963	if (len > MAX_CM_BUFFER) {
964		i40iw_pr_err("ietf buffer large len = %d\n", len);
965		return -1;
966	}
967
968	switch (mpa_frame->rev) {
969	case IETF_MPA_V2:{
970			u16 ird_size;
971			u16 ord_size;
972			u16 ctrl_ord;
973			u16 ctrl_ird;
974
975			mpa_v2_frame = (struct ietf_mpa_v2 *)buffer;
976			mpa_hdr_len += IETF_RTR_MSG_SIZE;
977			rtr_msg = &mpa_v2_frame->rtr_msg;
978
979			/* parse rtr message */
980			ctrl_ord = ntohs(rtr_msg->ctrl_ord);
981			ctrl_ird = ntohs(rtr_msg->ctrl_ird);
982			ird_size = ctrl_ird & IETF_NO_IRD_ORD;
983			ord_size = ctrl_ord & IETF_NO_IRD_ORD;
984
985			if (!(ctrl_ird & IETF_PEER_TO_PEER))
986				return -1;
987
988			if (ird_size == IETF_NO_IRD_ORD || ord_size == IETF_NO_IRD_ORD) {
989				cm_node->mpav2_ird_ord = IETF_NO_IRD_ORD;
990				goto negotiate_done;
991			}
992
993			if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
994				/* responder */
995				if (!ord_size && (ctrl_ord & IETF_RDMA0_READ))
996					cm_node->ird_size = 1;
997				if (cm_node->ord_size > ird_size)
998					cm_node->ord_size = ird_size;
999			} else {
1000				/* initiator */
1001				if (!ird_size && (ctrl_ord & IETF_RDMA0_READ))
1002					return -1;
1003				if (cm_node->ord_size > ird_size)
1004					cm_node->ord_size = ird_size;
1005
1006				if (cm_node->ird_size < ord_size)
1007					/* no resources available */
1008					return -1;
1009			}
1010
1011negotiate_done:
1012			if (ctrl_ord & IETF_RDMA0_READ)
1013				cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
1014			else if (ctrl_ord & IETF_RDMA0_WRITE)
1015				cm_node->send_rdma0_op = SEND_RDMA_WRITE_ZERO;
1016			else	/* Not supported RDMA0 operation */
1017				return -1;
1018			i40iw_debug(cm_node->dev, I40IW_DEBUG_CM,
1019				    "MPAV2: Negotiated ORD: %d, IRD: %d\n",
1020				    cm_node->ord_size, cm_node->ird_size);
1021			break;
1022		}
1023		break;
1024	case IETF_MPA_V1:
1025	default:
1026		break;
1027	}
1028
1029	memcpy(cm_node->pdata_buf, buffer + mpa_hdr_len, priv_data_len);
1030	cm_node->pdata.size = priv_data_len;
1031
1032	if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
1033		*type = I40IW_MPA_REQUEST_REJECT;
1034
1035	if (mpa_frame->flags & IETF_MPA_FLAGS_MARKERS)
1036		cm_node->snd_mark_en = true;
1037
1038	return 0;
1039}
1040
/**
 * i40iw_schedule_cm_timer - queue a send or close entry on a cm node
 * @cm_node: connection's node
 * @sqbuf: buffer to send
 * @type: if it is send or close
 * @send_retrans: if rexmits to be done
 * @close_when_complete: is cm_node to be removed
 *
 * For I40IW_TIMER_TYPE_SEND the buffer is handed to the ilq for
 * transmission immediately; when @send_retrans is zero the entry is
 * torn down again right away (and a node reference is dropped if
 * @close_when_complete is set) and the timer is not touched.
 * For I40IW_TIMER_TYPE_CLOSE the entry is stored as the node's
 * close_entry, due in HZ / 10 jiffies.
 * In the remaining cases the cm_core tcp_timer is armed if it is not
 * already pending.
 *
 * Return: 0 on success, -ENOMEM when the entry cannot be allocated
 * (the sqbuf is released unless @type is close), -EINVAL when a close
 * entry already exists.
 *
 * note - cm_node needs to be protected before calling this. Encase in:
 *		i40iw_rem_ref_cm_node(cm_core, cm_node);
 *		i40iw_schedule_cm_timer(...)
 *		atomic_inc(&cm_node->ref_count);
 * NOTE(review): the order above reads reversed (release before the
 * call, take after) and the rem_ref call shown takes two arguments
 * while the function declared in this file takes one - confirm the
 * intended usage against the callers.
 */
int i40iw_schedule_cm_timer(struct i40iw_cm_node *cm_node,
			    struct i40iw_puda_buf *sqbuf,
			    enum i40iw_timer_type type,
			    int send_retrans,
			    int close_when_complete)
{
	struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
	struct i40iw_cm_core *cm_core = cm_node->cm_core;
	struct i40iw_timer_entry *new_send;
	int ret = 0;
	u32 was_timer_set;
	unsigned long flags;

	new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
	if (!new_send) {
		/* a send owns its sqbuf reference; give it back on failure */
		if (type != I40IW_TIMER_TYPE_CLOSE)
			i40iw_free_sqbuf(vsi, (void *)sqbuf);
		return -ENOMEM;
	}
	new_send->retrycount = I40IW_DEFAULT_RETRYS;
	new_send->retranscount = I40IW_DEFAULT_RETRANS;
	new_send->sqbuf = sqbuf;
	new_send->timetosend = jiffies;
	new_send->type = type;
	new_send->send_retrans = send_retrans;
	new_send->close_when_complete = close_when_complete;

	if (type == I40IW_TIMER_TYPE_CLOSE) {
		new_send->timetosend += (HZ / 10);
		/* only one close entry may be outstanding per node */
		if (cm_node->close_entry) {
			kfree(new_send);
			i40iw_pr_err("already close entry\n");
			return -EINVAL;
		}
		cm_node->close_entry = new_send;
	}

	if (type == I40IW_TIMER_TYPE_SEND) {
		/* attach the entry and take the node reference it holds */
		spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
		cm_node->send_entry = new_send;
		atomic_inc(&cm_node->ref_count);
		spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
		new_send->timetosend = jiffies + I40IW_RETRY_TIMEOUT;

		/* extra buffer reference for the transmit itself */
		atomic_inc(&sqbuf->refcount);
		i40iw_puda_send_buf(vsi->ilq, sqbuf);
		if (!send_retrans) {
			/* one-shot send: nothing to retransmit, drop the entry now */
			i40iw_cleanup_retrans_entry(cm_node);
			if (close_when_complete)
				i40iw_rem_ref_cm_node(cm_node);
			return ret;
		}
	}

	/* arm the shared tcp timer unless it is already pending */
	spin_lock_irqsave(&cm_core->ht_lock, flags);
	was_timer_set = timer_pending(&cm_core->tcp_timer);

	if (!was_timer_set) {
		cm_core->tcp_timer.expires = new_send->timetosend;
		add_timer(&cm_core->tcp_timer);
	}
	spin_unlock_irqrestore(&cm_core->ht_lock, flags);

	return ret;
}
1119
1120/**
1121 * i40iw_retrans_expired - Could not rexmit the packet
1122 * @cm_node: connection's node
1123 */
1124static void i40iw_retrans_expired(struct i40iw_cm_node *cm_node)
1125{
1126	struct iw_cm_id *cm_id = cm_node->cm_id;
1127	enum i40iw_cm_node_state state = cm_node->state;
1128
1129	cm_node->state = I40IW_CM_STATE_CLOSED;
1130	switch (state) {
1131	case I40IW_CM_STATE_SYN_RCVD:
1132	case I40IW_CM_STATE_CLOSING:
1133		i40iw_rem_ref_cm_node(cm_node);
1134		break;
1135	case I40IW_CM_STATE_FIN_WAIT1:
1136	case I40IW_CM_STATE_LAST_ACK:
1137		if (cm_node->cm_id)
1138			cm_id->rem_ref(cm_id);
1139		i40iw_send_reset(cm_node);
1140		break;
1141	default:
1142		atomic_inc(&cm_node->ref_count);
1143		i40iw_send_reset(cm_node);
1144		i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
1145		break;
1146	}
1147}
1148
1149/**
1150 * i40iw_handle_close_entry - for handling retry/timeouts
1151 * @cm_node: connection's node
1152 * @rem_node: flag for remove cm_node
1153 */
1154static void i40iw_handle_close_entry(struct i40iw_cm_node *cm_node, u32 rem_node)
1155{
1156	struct i40iw_timer_entry *close_entry = cm_node->close_entry;
1157	struct iw_cm_id *cm_id = cm_node->cm_id;
1158	struct i40iw_qp *iwqp;
1159	unsigned long flags;
1160
1161	if (!close_entry)
1162		return;
1163	iwqp = (struct i40iw_qp *)close_entry->sqbuf;
1164	if (iwqp) {
1165		spin_lock_irqsave(&iwqp->lock, flags);
1166		if (iwqp->cm_id) {
1167			iwqp->hw_tcp_state = I40IW_TCP_STATE_CLOSED;
1168			iwqp->hw_iwarp_state = I40IW_QP_STATE_ERROR;
1169			iwqp->last_aeq = I40IW_AE_RESET_SENT;
1170			iwqp->ibqp_state = IB_QPS_ERR;
1171			spin_unlock_irqrestore(&iwqp->lock, flags);
1172			i40iw_cm_disconn(iwqp);
1173		} else {
1174			spin_unlock_irqrestore(&iwqp->lock, flags);
1175		}
1176	} else if (rem_node) {
1177		/* TIME_WAIT state */
1178		i40iw_rem_ref_cm_node(cm_node);
1179	}
1180	if (cm_id)
1181		cm_id->rem_ref(cm_id);
1182	kfree(close_entry);
1183	cm_node->close_entry = NULL;
1184}
1185
1186/**
1187 * i40iw_build_timer_list - Add cm_nodes to timer list
1188 * @timer_list: ptr to timer list
1189 * @hte: ptr to accelerated or non-accelerated list
1190 */
1191static void i40iw_build_timer_list(struct list_head *timer_list,
1192				   struct list_head *hte)
1193{
1194	struct i40iw_cm_node *cm_node;
1195	struct list_head *list_core_temp, *list_node;
1196
1197	list_for_each_safe(list_node, list_core_temp, hte) {
1198		cm_node = container_of(list_node, struct i40iw_cm_node, list);
1199		if (cm_node->close_entry || cm_node->send_entry) {
1200			atomic_inc(&cm_node->ref_count);
1201			list_add(&cm_node->timer_entry, timer_list);
1202		}
1203	}
1204}
1205
/**
 * i40iw_cm_timer_tick - system's timer expired callback
 * @t: the expired timer; it is the tcp_timer member of the owning cm_core
 *
 * Collects every cm_node with a pending close or send entry, processes
 * expired entries (close handling, retransmission, retry exhaustion) and
 * re-arms the timer for the nearest entry that is still outstanding.
 */
static void i40iw_cm_timer_tick(struct timer_list *t)
{
	unsigned long nexttimeout = jiffies + I40IW_LONG_TIME;
	struct i40iw_cm_node *cm_node;
	struct i40iw_timer_entry *send_entry, *close_entry;
	struct list_head *list_core_temp;
	struct i40iw_sc_vsi *vsi;
	struct list_head *list_node;
	struct i40iw_cm_core *cm_core = from_timer(cm_core, t, tcp_timer);
	u32 settimer = 0;
	unsigned long timetosend;
	unsigned long flags;

	struct list_head timer_list;

	INIT_LIST_HEAD(&timer_list);

	/*
	 * Snapshot the nodes that need servicing while holding ht_lock;
	 * i40iw_build_timer_list() takes a reference on each one, which is
	 * dropped at the "done" label below.
	 */
	spin_lock_irqsave(&cm_core->ht_lock, flags);
	i40iw_build_timer_list(&timer_list, &cm_core->non_accelerated_list);
	i40iw_build_timer_list(&timer_list, &cm_core->accelerated_list);
	spin_unlock_irqrestore(&cm_core->ht_lock, flags);

	list_for_each_safe(list_node, list_core_temp, &timer_list) {
		cm_node = container_of(list_node,
				       struct i40iw_cm_node,
				       timer_entry);
		close_entry = cm_node->close_entry;

		if (close_entry) {
			if (time_after(close_entry->timetosend, jiffies)) {
				/* not due yet: remember the earliest deadline */
				if (nexttimeout > close_entry->timetosend ||
				    !settimer) {
					nexttimeout = close_entry->timetosend;
					settimer = 1;
				}
			} else {
				i40iw_handle_close_entry(cm_node, 1);
			}
		}

		spin_lock_irqsave(&cm_node->retrans_list_lock, flags);

		send_entry = cm_node->send_entry;
		if (!send_entry)
			goto done;
		if (time_after(send_entry->timetosend, jiffies)) {
			/* send entry not due yet */
			if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
				if ((nexttimeout > send_entry->timetosend) ||
				    !settimer) {
					nexttimeout = send_entry->timetosend;
					settimer = 1;
				}
			} else {
				/* offloaded node: the pending entry is simply dropped */
				i40iw_free_retrans_entry(cm_node);
			}
			goto done;
		}

		/* entry is due, but the node no longer needs retransmission */
		if ((cm_node->state == I40IW_CM_STATE_OFFLOADED) ||
		    (cm_node->state == I40IW_CM_STATE_CLOSED)) {
			i40iw_free_retrans_entry(cm_node);
			goto done;
		}

		if (!send_entry->retranscount || !send_entry->retrycount) {
			/* out of retries: give up on this packet */
			i40iw_free_retrans_entry(cm_node);

			/* retrans_list_lock is released around the expiry handling */
			spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
			i40iw_retrans_expired(cm_node);
			cm_node->state = I40IW_CM_STATE_CLOSED;
			spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
			goto done;
		}
		spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);

		vsi = &cm_node->iwdev->vsi;

		/* resend only if the peer has not acknowledged yet */
		if (!cm_node->ack_rcvd) {
			atomic_inc(&send_entry->sqbuf->refcount);
			i40iw_puda_send_buf(vsi->ilq, send_entry->sqbuf);
			cm_node->cm_core->stats_pkt_retrans++;
		}
		spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
		if (send_entry->send_retrans) {
			/*
			 * Back off: the retry interval is shifted left once
			 * more for every retransmission already used, capped
			 * at I40IW_MAX_TIMEOUT.
			 */
			send_entry->retranscount--;
			timetosend = (I40IW_RETRY_TIMEOUT <<
				      (I40IW_DEFAULT_RETRANS -
				       send_entry->retranscount));

			send_entry->timetosend = jiffies +
			    min(timetosend, I40IW_MAX_TIMEOUT);
			if (nexttimeout > send_entry->timetosend || !settimer) {
				nexttimeout = send_entry->timetosend;
				settimer = 1;
			}
		} else {
			int close_when_complete;

			/* read the flag before the entry is freed */
			close_when_complete = send_entry->close_when_complete;
			i40iw_debug(cm_node->dev,
				    I40IW_DEBUG_CM,
				    "cm_node=%p state=%d\n",
				    cm_node,
				    cm_node->state);
			i40iw_free_retrans_entry(cm_node);
			if (close_when_complete)
				i40iw_rem_ref_cm_node(cm_node);
		}
done:
		spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
		/* drop the reference taken by i40iw_build_timer_list() */
		i40iw_rem_ref_cm_node(cm_node);
	}

	/* re-arm for the nearest outstanding entry unless already pending */
	if (settimer) {
		spin_lock_irqsave(&cm_core->ht_lock, flags);
		if (!timer_pending(&cm_core->tcp_timer)) {
			cm_core->tcp_timer.expires = nexttimeout;
			add_timer(&cm_core->tcp_timer);
		}
		spin_unlock_irqrestore(&cm_core->ht_lock, flags);
	}
}
1332
1333/**
1334 * i40iw_send_syn - send SYN packet
1335 * @cm_node: connection's node
1336 * @sendack: flag to set ACK bit or not
1337 */
1338int i40iw_send_syn(struct i40iw_cm_node *cm_node, u32 sendack)
1339{
1340	struct i40iw_puda_buf *sqbuf;
1341	int flags = SET_SYN;
1342	char optionsbuffer[sizeof(struct option_mss) +
1343			   sizeof(struct option_windowscale) +
1344			   sizeof(struct option_base) + TCP_OPTIONS_PADDING];
1345	struct i40iw_kmem_info opts;
1346
1347	int optionssize = 0;
1348	/* Sending MSS option */
1349	union all_known_options *options;
1350
1351	opts.addr = optionsbuffer;
1352	if (!cm_node) {
1353		i40iw_pr_err("no cm_node\n");
1354		return -EINVAL;
1355	}
1356
1357	options = (union all_known_options *)&optionsbuffer[optionssize];
1358	options->as_mss.optionnum = OPTION_NUMBER_MSS;
1359	options->as_mss.length = sizeof(struct option_mss);
1360	options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
1361	optionssize += sizeof(struct option_mss);
1362
1363	options = (union all_known_options *)&optionsbuffer[optionssize];
1364	options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
1365	options->as_windowscale.length = sizeof(struct option_windowscale);
1366	options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
1367	optionssize += sizeof(struct option_windowscale);
1368	options = (union all_known_options *)&optionsbuffer[optionssize];
1369	options->as_end = OPTION_NUMBER_END;
1370	optionssize += 1;
1371
1372	if (sendack)
1373		flags |= SET_ACK;
1374
1375	opts.size = optionssize;
1376
1377	sqbuf = i40iw_form_cm_frame(cm_node, &opts, NULL, NULL, flags);
1378	if (!sqbuf) {
1379		i40iw_pr_err("no sqbuf\n");
1380		return -1;
1381	}
1382	return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1383}
1384
1385/**
1386 * i40iw_send_ack - Send ACK packet
1387 * @cm_node: connection's node
1388 */
1389static void i40iw_send_ack(struct i40iw_cm_node *cm_node)
1390{
1391	struct i40iw_puda_buf *sqbuf;
1392	struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1393
1394	sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK);
1395	if (sqbuf)
1396		i40iw_puda_send_buf(vsi->ilq, sqbuf);
1397	else
1398		i40iw_pr_err("no sqbuf\n");
1399}
1400
1401/**
1402 * i40iw_send_fin - Send FIN pkt
1403 * @cm_node: connection's node
1404 */
1405static int i40iw_send_fin(struct i40iw_cm_node *cm_node)
1406{
1407	struct i40iw_puda_buf *sqbuf;
1408
1409	sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK | SET_FIN);
1410	if (!sqbuf) {
1411		i40iw_pr_err("no sqbuf\n");
1412		return -1;
1413	}
1414	return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1415}
1416
1417/**
1418 * i40iw_find_node - find a cm node that matches the reference cm node
1419 * @cm_core: cm's core
1420 * @rem_port: remote tcp port num
1421 * @rem_addr: remote ip addr
1422 * @loc_port: local tcp port num
1423 * @loc_addr: loc ip addr
1424 * @add_refcnt: flag to increment refcount of cm_node
1425 * @accelerated_list: flag for accelerated vs non-accelerated list to search
1426 */
1427struct i40iw_cm_node *i40iw_find_node(struct i40iw_cm_core *cm_core,
1428				      u16 rem_port,
1429				      u32 *rem_addr,
1430				      u16 loc_port,
1431				      u32 *loc_addr,
1432				      bool add_refcnt,
1433				      bool accelerated_list)
1434{
1435	struct list_head *hte;
1436	struct i40iw_cm_node *cm_node;
1437	unsigned long flags;
1438
1439	hte = accelerated_list ?
1440	      &cm_core->accelerated_list : &cm_core->non_accelerated_list;
1441
1442	/* walk list and find cm_node associated with this session ID */
1443	spin_lock_irqsave(&cm_core->ht_lock, flags);
1444	list_for_each_entry(cm_node, hte, list) {
1445		if (!memcmp(cm_node->loc_addr, loc_addr, sizeof(cm_node->loc_addr)) &&
1446		    (cm_node->loc_port == loc_port) &&
1447		    !memcmp(cm_node->rem_addr, rem_addr, sizeof(cm_node->rem_addr)) &&
1448		    (cm_node->rem_port == rem_port)) {
1449			if (add_refcnt)
1450				atomic_inc(&cm_node->ref_count);
1451			spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1452			return cm_node;
1453		}
1454	}
1455	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1456
1457	/* no owner node */
1458	return NULL;
1459}
1460
1461/**
1462 * i40iw_find_listener - find a cm node listening on this addr-port pair
1463 * @cm_core: cm's core
1464 * @dst_port: listener tcp port num
1465 * @dst_addr: listener ip addr
1466 * @listener_state: state to match with listen node's
1467 */
1468static struct i40iw_cm_listener *i40iw_find_listener(
1469						     struct i40iw_cm_core *cm_core,
1470						     u32 *dst_addr,
1471						     u16 dst_port,
1472						     u16 vlan_id,
1473						     enum i40iw_cm_listener_state
1474						     listener_state)
1475{
1476	struct i40iw_cm_listener *listen_node;
1477	static const u32 ip_zero[4] = { 0, 0, 0, 0 };
1478	u32 listen_addr[4];
1479	u16 listen_port;
1480	unsigned long flags;
1481
1482	/* walk list and find cm_node associated with this session ID */
1483	spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1484	list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1485		memcpy(listen_addr, listen_node->loc_addr, sizeof(listen_addr));
1486		listen_port = listen_node->loc_port;
1487		/* compare node pair, return node handle if a match */
1488		if ((!memcmp(listen_addr, dst_addr, sizeof(listen_addr)) ||
1489		     !memcmp(listen_addr, ip_zero, sizeof(listen_addr))) &&
1490		     (listen_port == dst_port) &&
1491		     (listener_state & listen_node->listener_state)) {
1492			atomic_inc(&listen_node->ref_count);
1493			spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1494			return listen_node;
1495		}
1496	}
1497	spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1498	return NULL;
1499}
1500
1501/**
1502 * i40iw_add_hte_node - add a cm node to the hash table
1503 * @cm_core: cm's core
1504 * @cm_node: connection's node
1505 */
1506static void i40iw_add_hte_node(struct i40iw_cm_core *cm_core,
1507			       struct i40iw_cm_node *cm_node)
1508{
1509	unsigned long flags;
1510
1511	if (!cm_node || !cm_core) {
1512		i40iw_pr_err("cm_node or cm_core == NULL\n");
1513		return;
1514	}
1515
1516	spin_lock_irqsave(&cm_core->ht_lock, flags);
1517	list_add_tail(&cm_node->list, &cm_core->non_accelerated_list);
1518	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1519}
1520
1521/**
1522 * i40iw_find_port - find port that matches reference port
1523 * @hte: ptr to accelerated or non-accelerated list
1524 * @accelerated_list: flag for accelerated vs non-accelerated list
1525 */
1526static bool i40iw_find_port(struct list_head *hte, u16 port)
1527{
1528	struct i40iw_cm_node *cm_node;
1529
1530	list_for_each_entry(cm_node, hte, list) {
1531		if (cm_node->loc_port == port)
1532			return true;
1533	}
1534	return false;
1535}
1536
1537/**
1538 * i40iw_port_in_use - determine if port is in use
1539 * @cm_core: cm's core
1540 * @port: port number
1541 */
1542bool i40iw_port_in_use(struct i40iw_cm_core *cm_core, u16 port)
1543{
1544	struct i40iw_cm_listener *listen_node;
1545	unsigned long flags;
1546
1547	spin_lock_irqsave(&cm_core->ht_lock, flags);
1548	if (i40iw_find_port(&cm_core->accelerated_list, port) ||
1549	    i40iw_find_port(&cm_core->non_accelerated_list, port)) {
1550		spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1551		return true;
1552	}
1553	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1554
1555	spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1556	list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1557		if (listen_node->loc_port == port) {
1558			spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1559			return true;
1560		}
1561	}
1562	spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1563
1564	return false;
1565}
1566
1567/**
1568 * i40iw_del_multiple_qhash - Remove qhash and child listens
1569 * @iwdev: iWarp device
1570 * @cm_info: CM info for parent listen node
1571 * @cm_parent_listen_node: The parent listen node
1572 */
1573static enum i40iw_status_code i40iw_del_multiple_qhash(
1574						       struct i40iw_device *iwdev,
1575						       struct i40iw_cm_info *cm_info,
1576						       struct i40iw_cm_listener *cm_parent_listen_node)
1577{
1578	struct i40iw_cm_listener *child_listen_node;
1579	enum i40iw_status_code ret = I40IW_ERR_CONFIG;
1580	struct list_head *pos, *tpos;
1581	unsigned long flags;
1582
1583	spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1584	list_for_each_safe(pos, tpos, &cm_parent_listen_node->child_listen_list) {
1585		child_listen_node = list_entry(pos, struct i40iw_cm_listener, child_listen_list);
1586		if (child_listen_node->ipv4)
1587			i40iw_debug(&iwdev->sc_dev,
1588				    I40IW_DEBUG_CM,
1589				    "removing child listen for IP=%pI4, port=%d, vlan=%d\n",
1590				    child_listen_node->loc_addr,
1591				    child_listen_node->loc_port,
1592				    child_listen_node->vlan_id);
1593		else
1594			i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
1595				    "removing child listen for IP=%pI6, port=%d, vlan=%d\n",
1596				    child_listen_node->loc_addr,
1597				    child_listen_node->loc_port,
1598				    child_listen_node->vlan_id);
1599		list_del(pos);
1600		memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1601		       sizeof(cm_info->loc_addr));
1602		cm_info->vlan_id = child_listen_node->vlan_id;
1603		if (child_listen_node->qhash_set) {
1604			ret = i40iw_manage_qhash(iwdev, cm_info,
1605						 I40IW_QHASH_TYPE_TCP_SYN,
1606						 I40IW_QHASH_MANAGE_TYPE_DELETE,
1607						 NULL, false);
1608			child_listen_node->qhash_set = false;
1609		} else {
1610			ret = I40IW_SUCCESS;
1611		}
1612		i40iw_debug(&iwdev->sc_dev,
1613			    I40IW_DEBUG_CM,
1614			    "freed pointer = %p\n",
1615			    child_listen_node);
1616		kfree(child_listen_node);
1617		cm_parent_listen_node->cm_core->stats_listen_nodes_destroyed++;
1618	}
1619	spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1620
1621	return ret;
1622}
1623
1624/**
1625 * i40iw_netdev_vlan_ipv6 - Gets the netdev and vlan
1626 * @addr: local IPv6 address
1627 * @vlan_id: vlan id for the given IPv6 address
1628 *
1629 * Returns the net_device of the IPv6 address and also sets the
1630 * vlan id for that address.
1631 */
1632static struct net_device *i40iw_netdev_vlan_ipv6(u32 *addr, u16 *vlan_id)
1633{
1634	struct net_device *ip_dev = NULL;
1635	struct in6_addr laddr6;
1636
1637	if (!IS_ENABLED(CONFIG_IPV6))
1638		return NULL;
1639	i40iw_copy_ip_htonl(laddr6.in6_u.u6_addr32, addr);
1640	if (vlan_id)
1641		*vlan_id = I40IW_NO_VLAN;
1642	rcu_read_lock();
1643	for_each_netdev_rcu(&init_net, ip_dev) {
1644		if (ipv6_chk_addr(&init_net, &laddr6, ip_dev, 1)) {
1645			if (vlan_id)
1646				*vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1647			break;
1648		}
1649	}
1650	rcu_read_unlock();
1651	return ip_dev;
1652}
1653
1654/**
1655 * i40iw_get_vlan_ipv4 - Returns the vlan_id for IPv4 address
1656 * @addr: local IPv4 address
1657 */
1658static u16 i40iw_get_vlan_ipv4(u32 *addr)
1659{
1660	struct net_device *netdev;
1661	u16 vlan_id = I40IW_NO_VLAN;
1662
1663	netdev = ip_dev_find(&init_net, htonl(addr[0]));
1664	if (netdev) {
1665		vlan_id = rdma_vlan_dev_vlan_id(netdev);
1666		dev_put(netdev);
1667	}
1668	return vlan_id;
1669}
1670
/**
 * i40iw_add_mqh_6 - Adds multiple qhashes for IPv6
 * @iwdev: iWarp device
 * @cm_info: CM info for parent listen node
 * @cm_parent_listen_node: The parent listen node
 *
 * Adds a qhash and a child listen node for every IPv6 address
 * on the adapter and adds the associated qhash filter
 *
 * The netdev list is walked under rtnl_lock. @cm_info's vlan_id and loc_addr
 * and the parent's vlan_id are overwritten for each address visited.
 *
 * Return: I40IW_ERR_NO_MEMORY if a child listener cannot be allocated,
 * otherwise the status of the last i40iw_manage_qhash() call (0 if none was
 * made).
 */
static enum i40iw_status_code i40iw_add_mqh_6(struct i40iw_device *iwdev,
					      struct i40iw_cm_info *cm_info,
					      struct i40iw_cm_listener *cm_parent_listen_node)
{
	struct net_device *ip_dev;
	struct inet6_dev *idev;
	struct inet6_ifaddr *ifp, *tmp;
	enum i40iw_status_code ret = 0;
	struct i40iw_cm_listener *child_listen_node;
	unsigned long flags;

	rtnl_lock();
	for_each_netdev(&init_net, ip_dev) {
		/*
		 * Only consider devices that are up and are either our own
		 * netdev or a vlan device stacked on top of it.
		 */
		if ((((rdma_vlan_dev_vlan_id(ip_dev) < I40IW_NO_VLAN) &&
		      (rdma_vlan_dev_real_dev(ip_dev) == iwdev->netdev)) ||
		     (ip_dev == iwdev->netdev)) && (ip_dev->flags & IFF_UP)) {
			idev = __in6_dev_get(ip_dev);
			if (!idev) {
				/* stops the whole scan; ret keeps its current value */
				i40iw_pr_err("idev == NULL\n");
				break;
			}
			list_for_each_entry_safe(ifp, tmp, &idev->addr_list, if_list) {
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "IP=%pI6, vlan_id=%d, MAC=%pM\n",
					    &ifp->addr,
					    rdma_vlan_dev_vlan_id(ip_dev),
					    ip_dev->dev_addr);
				child_listen_node =
					kzalloc(sizeof(*child_listen_node), GFP_ATOMIC);
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "Allocating child listener %p\n",
					    child_listen_node);
				if (!child_listen_node) {
					ret = I40IW_ERR_NO_MEMORY;
					goto exit;
				}
				cm_info->vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
				cm_parent_listen_node->vlan_id = cm_info->vlan_id;

				/* the child starts out as a full copy of the parent */
				memcpy(child_listen_node, cm_parent_listen_node,
				       sizeof(*child_listen_node));

				/* then gets this interface address as its local address */
				i40iw_copy_ip_ntohl(child_listen_node->loc_addr,
						    ifp->addr.in6_u.u6_addr32);
				memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
				       sizeof(cm_info->loc_addr));

				ret = i40iw_manage_qhash(iwdev, cm_info,
							 I40IW_QHASH_TYPE_TCP_SYN,
							 I40IW_QHASH_MANAGE_TYPE_ADD,
							 NULL, true);
				if (!ret) {
					/* qhash added: link the child under the parent */
					child_listen_node->qhash_set = true;
					spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
					list_add(&child_listen_node->child_listen_list,
						 &cm_parent_listen_node->child_listen_list);
					spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
					cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
				} else {
					/* qhash add failed: drop the child, keep scanning */
					kfree(child_listen_node);
				}
			}
		}
	}
exit:
	rtnl_unlock();
	return ret;
}
1750
1751/**
1752 * i40iw_add_mqh_4 - Adds multiple qhashes for IPv4
1753 * @iwdev: iWarp device
1754 * @cm_info: CM info for parent listen node
1755 * @cm_parent_listen_node: The parent listen node
1756 *
1757 * Adds a qhash and a child listen node for every IPv4 address
1758 * on the adapter and adds the associated qhash filter
1759 */
1760static enum i40iw_status_code i40iw_add_mqh_4(
1761				struct i40iw_device *iwdev,
1762				struct i40iw_cm_info *cm_info,
1763				struct i40iw_cm_listener *cm_parent_listen_node)
1764{
1765	struct net_device *dev;
1766	struct in_device *idev;
1767	struct i40iw_cm_listener *child_listen_node;
1768	enum i40iw_status_code ret = 0;
1769	unsigned long flags;
1770
1771	rtnl_lock();
1772	for_each_netdev(&init_net, dev) {
1773		if ((((rdma_vlan_dev_vlan_id(dev) < I40IW_NO_VLAN) &&
1774		      (rdma_vlan_dev_real_dev(dev) == iwdev->netdev)) ||
1775		    (dev == iwdev->netdev)) && (dev->flags & IFF_UP)) {
1776			const struct in_ifaddr *ifa;
1777
1778			idev = in_dev_get(dev);
1779
1780			in_dev_for_each_ifa_rtnl(ifa, idev) {
1781				i40iw_debug(&iwdev->sc_dev,
1782					    I40IW_DEBUG_CM,
1783					    "Allocating child CM Listener forIP=%pI4, vlan_id=%d, MAC=%pM\n",
1784					    &ifa->ifa_address,
1785					    rdma_vlan_dev_vlan_id(dev),
1786					    dev->dev_addr);
1787				child_listen_node = kzalloc(sizeof(*child_listen_node), GFP_KERNEL);
1788				cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1789				i40iw_debug(&iwdev->sc_dev,
1790					    I40IW_DEBUG_CM,
1791					    "Allocating child listener %p\n",
1792					    child_listen_node);
1793				if (!child_listen_node) {
1794					in_dev_put(idev);
1795					ret = I40IW_ERR_NO_MEMORY;
1796					goto exit;
1797				}
1798				cm_info->vlan_id = rdma_vlan_dev_vlan_id(dev);
1799				cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1800				memcpy(child_listen_node,
1801				       cm_parent_listen_node,
1802				       sizeof(*child_listen_node));
1803
1804				child_listen_node->loc_addr[0] = ntohl(ifa->ifa_address);
1805				memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1806				       sizeof(cm_info->loc_addr));
1807
1808				ret = i40iw_manage_qhash(iwdev,
1809							 cm_info,
1810							 I40IW_QHASH_TYPE_TCP_SYN,
1811							 I40IW_QHASH_MANAGE_TYPE_ADD,
1812							 NULL,
1813							 true);
1814				if (!ret) {
1815					child_listen_node->qhash_set = true;
1816					spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1817					list_add(&child_listen_node->child_listen_list,
1818						 &cm_parent_listen_node->child_listen_list);
1819					spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1820				} else {
1821					kfree(child_listen_node);
1822					cm_parent_listen_node->cm_core->stats_listen_nodes_created--;
1823				}
1824			}
1825
1826			in_dev_put(idev);
1827		}
1828	}
1829exit:
1830	rtnl_unlock();
1831	return ret;
1832}
1833
/**
 * i40iw_dec_refcnt_listen - delete listener and associated cm nodes
 * @cm_core: cm's core
 * @listener: listener whose reference is being dropped
 * @free_hanging_nodes: to free associated cm_nodes
 * @apbvt_del: flag to delete the apbvt
 *
 * Optionally tears down the non-accelerated cm_nodes that belong to
 * @listener, then drops one listener reference. When that was the last
 * reference the listener is unlinked, its qhash/apbvt state is removed and
 * it is freed.
 *
 * Return: 0 if the listener was freed, -EINVAL otherwise.
 */
static int i40iw_dec_refcnt_listen(struct i40iw_cm_core *cm_core,
				   struct i40iw_cm_listener *listener,
				   int free_hanging_nodes, bool apbvt_del)
{
	int ret = -EINVAL;
	int err = 0;
	struct list_head *list_pos;
	struct list_head *list_temp;
	struct i40iw_cm_node *cm_node;
	struct list_head reset_list;
	struct i40iw_cm_info nfo;
	struct i40iw_cm_node *loopback;
	enum i40iw_cm_node_state old_state;
	unsigned long flags;

	/* free non-accelerated child nodes for this listener */
	INIT_LIST_HEAD(&reset_list);
	if (free_hanging_nodes) {
		/*
		 * Collect the affected nodes on a private list under ht_lock,
		 * taking a reference on each; they are processed after the
		 * lock is released.
		 */
		spin_lock_irqsave(&cm_core->ht_lock, flags);
		list_for_each_safe(list_pos,
				   list_temp, &cm_core->non_accelerated_list) {
			cm_node = container_of(list_pos, struct i40iw_cm_node, list);
			if ((cm_node->listener == listener) &&
			    !cm_node->accelerated) {
				atomic_inc(&cm_node->ref_count);
				list_add(&cm_node->reset_entry, &reset_list);
			}
		}
		spin_unlock_irqrestore(&cm_core->ht_lock, flags);
	}

	list_for_each_safe(list_pos, list_temp, &reset_list) {
		cm_node = container_of(list_pos, struct i40iw_cm_node, reset_entry);
		loopback = cm_node->loopbackpartner;
		if (cm_node->state >= I40IW_CM_STATE_FIN_WAIT1) {
			/* no reset is sent in these states; just drop the reference */
			i40iw_rem_ref_cm_node(cm_node);
		} else {
			if (!loopback) {
				i40iw_cleanup_retrans_entry(cm_node);
				err = i40iw_send_reset(cm_node);
				if (err) {
					cm_node->state = I40IW_CM_STATE_CLOSED;
					i40iw_pr_err("send reset\n");
				} else {
					old_state = cm_node->state;
					cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
					/* the reference is kept when the node was in MPAREQ_RCVD */
					if (old_state != I40IW_CM_STATE_MPAREQ_RCVD)
						i40iw_rem_ref_cm_node(cm_node);
				}
			} else {
				struct i40iw_cm_event event;

				/* report a connect error on the loopback partner */
				event.cm_node = loopback;
				memcpy(event.cm_info.rem_addr,
				       loopback->rem_addr, sizeof(event.cm_info.rem_addr));
				memcpy(event.cm_info.loc_addr,
				       loopback->loc_addr, sizeof(event.cm_info.loc_addr));
				event.cm_info.rem_port = loopback->rem_port;
				event.cm_info.loc_port = loopback->loc_port;
				event.cm_info.cm_id = loopback->cm_id;
				event.cm_info.ipv4 = loopback->ipv4;
				atomic_inc(&loopback->ref_count);
				loopback->state = I40IW_CM_STATE_CLOSED;
				i40iw_event_connect_error(&event);
				cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
				i40iw_rem_ref_cm_node(cm_node);
			}
		}
	}

	/* last reference gone: unlink, undo hardware state and free */
	if (!atomic_dec_return(&listener->ref_count)) {
		spin_lock_irqsave(&cm_core->listen_list_lock, flags);
		list_del(&listener->list);
		spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);

		if (listener->iwdev) {
			if (apbvt_del)
				i40iw_manage_apbvt(listener->iwdev,
						   listener->loc_port,
						   I40IW_MANAGE_APBVT_DEL);

			/* only these nfo fields are filled in before use */
			memcpy(nfo.loc_addr, listener->loc_addr, sizeof(nfo.loc_addr));
			nfo.loc_port = listener->loc_port;
			nfo.ipv4 = listener->ipv4;
			nfo.vlan_id = listener->vlan_id;
			nfo.user_pri = listener->user_pri;

			if (!list_empty(&listener->child_listen_list)) {
				/* child listeners carry the qhash entries */
				i40iw_del_multiple_qhash(listener->iwdev, &nfo, listener);
			} else {
				if (listener->qhash_set)
					i40iw_manage_qhash(listener->iwdev,
							   &nfo,
							   I40IW_QHASH_TYPE_TCP_SYN,
							   I40IW_QHASH_MANAGE_TYPE_DELETE,
							   NULL,
							   false);
			}
		}

		cm_core->stats_listen_destroyed++;
		kfree(listener);
		cm_core->stats_listen_nodes_destroyed++;
		/* cleared so the debug block below skips the freed listener */
		listener = NULL;
		ret = 0;
	}

	if (listener) {
		if (atomic_read(&listener->pend_accepts_cnt) > 0)
			i40iw_debug(cm_core->dev,
				    I40IW_DEBUG_CM,
				    "%s: listener (%p) pending accepts=%u\n",
				    __func__,
				    listener,
				    atomic_read(&listener->pend_accepts_cnt));
	}

	return ret;
}
1959
1960/**
1961 * i40iw_cm_del_listen - delete a linstener
1962 * @cm_core: cm's core
1963  * @listener: passive connection's listener
1964 * @apbvt_del: flag to delete apbvt
1965 */
1966static int i40iw_cm_del_listen(struct i40iw_cm_core *cm_core,
1967			       struct i40iw_cm_listener *listener,
1968			       bool apbvt_del)
1969{
1970	listener->listener_state = I40IW_CM_LISTENER_PASSIVE_STATE;
1971	listener->cm_id = NULL;	/* going to be destroyed pretty soon */
1972	return i40iw_dec_refcnt_listen(cm_core, listener, 1, apbvt_del);
1973}
1974
1975/**
1976 * i40iw_addr_resolve_neigh - resolve neighbor address
1977 * @iwdev: iwarp device structure
1978 * @src_ip: local ip address
1979 * @dst_ip: remote ip address
1980 * @arpindex: if there is an arp entry
1981 */
1982static int i40iw_addr_resolve_neigh(struct i40iw_device *iwdev,
1983				    u32 src_ip,
1984				    u32 dst_ip,
1985				    int arpindex)
1986{
1987	struct rtable *rt;
1988	struct neighbour *neigh;
1989	int rc = arpindex;
1990	__be32 dst_ipaddr = htonl(dst_ip);
1991	__be32 src_ipaddr = htonl(src_ip);
1992
1993	rt = ip_route_output(&init_net, dst_ipaddr, src_ipaddr, 0, 0);
1994	if (IS_ERR(rt)) {
1995		i40iw_pr_err("ip_route_output\n");
1996		return rc;
1997	}
1998
1999	neigh = dst_neigh_lookup(&rt->dst, &dst_ipaddr);
2000
2001	rcu_read_lock();
2002	if (neigh) {
2003		if (neigh->nud_state & NUD_VALID) {
2004			if (arpindex >= 0) {
2005				if (ether_addr_equal(iwdev->arp_table[arpindex].mac_addr,
2006						     neigh->ha))
2007					/* Mac address same as arp table */
2008					goto resolve_neigh_exit;
2009				i40iw_manage_arp_cache(iwdev,
2010						       iwdev->arp_table[arpindex].mac_addr,
2011						       &dst_ip,
2012						       true,
2013						       I40IW_ARP_DELETE);
2014			}
2015
2016			i40iw_manage_arp_cache(iwdev, neigh->ha, &dst_ip, true, I40IW_ARP_ADD);
2017			rc = i40iw_arp_table(iwdev, &dst_ip, true, NULL, I40IW_ARP_RESOLVE);
2018		} else {
2019			neigh_event_send(neigh, NULL);
2020		}
2021	}
2022 resolve_neigh_exit:
2023
2024	rcu_read_unlock();
2025	if (neigh)
2026		neigh_release(neigh);
2027
2028	ip_rt_put(rt);
2029	return rc;
2030}
2031
2032/**
2033 * i40iw_get_dst_ipv6
2034 */
2035static struct dst_entry *i40iw_get_dst_ipv6(struct sockaddr_in6 *src_addr,
2036					    struct sockaddr_in6 *dst_addr)
2037{
2038	struct dst_entry *dst;
2039	struct flowi6 fl6;
2040
2041	memset(&fl6, 0, sizeof(fl6));
2042	fl6.daddr = dst_addr->sin6_addr;
2043	fl6.saddr = src_addr->sin6_addr;
2044	if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
2045		fl6.flowi6_oif = dst_addr->sin6_scope_id;
2046
2047	dst = ip6_route_output(&init_net, NULL, &fl6);
2048	return dst;
2049}
2050
2051/**
2052 * i40iw_addr_resolve_neigh_ipv6 - resolve neighbor ipv6 address
2053 * @iwdev: iwarp device structure
2054 * @dst_ip: remote ip address
2055 * @arpindex: if there is an arp entry
2056 */
2057static int i40iw_addr_resolve_neigh_ipv6(struct i40iw_device *iwdev,
2058					 u32 *src,
2059					 u32 *dest,
2060					 int arpindex)
2061{
2062	struct neighbour *neigh;
2063	int rc = arpindex;
2064	struct dst_entry *dst;
2065	struct sockaddr_in6 dst_addr;
2066	struct sockaddr_in6 src_addr;
2067
2068	memset(&dst_addr, 0, sizeof(dst_addr));
2069	dst_addr.sin6_family = AF_INET6;
2070	i40iw_copy_ip_htonl(dst_addr.sin6_addr.in6_u.u6_addr32, dest);
2071	memset(&src_addr, 0, sizeof(src_addr));
2072	src_addr.sin6_family = AF_INET6;
2073	i40iw_copy_ip_htonl(src_addr.sin6_addr.in6_u.u6_addr32, src);
2074	dst = i40iw_get_dst_ipv6(&src_addr, &dst_addr);
2075	if (!dst || dst->error) {
2076		if (dst) {
2077			i40iw_pr_err("ip6_route_output returned dst->error = %d\n",
2078				     dst->error);
2079			dst_release(dst);
2080		}
2081		return rc;
2082	}
2083
2084	neigh = dst_neigh_lookup(dst, dst_addr.sin6_addr.in6_u.u6_addr32);
2085
2086	rcu_read_lock();
2087	if (neigh) {
2088		i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "dst_neigh_lookup MAC=%pM\n", neigh->ha);
2089		if (neigh->nud_state & NUD_VALID) {
2090			if (arpindex >= 0) {
2091				if (ether_addr_equal
2092				    (iwdev->arp_table[arpindex].mac_addr,
2093				     neigh->ha)) {
2094					/* Mac address same as in arp table */
2095					goto resolve_neigh_exit6;
2096				}
2097				i40iw_manage_arp_cache(iwdev,
2098						       iwdev->arp_table[arpindex].mac_addr,
2099						       dest,
2100						       false,
2101						       I40IW_ARP_DELETE);
2102			}
2103			i40iw_manage_arp_cache(iwdev,
2104					       neigh->ha,
2105					       dest,
2106					       false,
2107					       I40IW_ARP_ADD);
2108			rc = i40iw_arp_table(iwdev,
2109					     dest,
2110					     false,
2111					     NULL,
2112					     I40IW_ARP_RESOLVE);
2113		} else {
2114			neigh_event_send(neigh, NULL);
2115		}
2116	}
2117
2118 resolve_neigh_exit6:
2119	rcu_read_unlock();
2120	if (neigh)
2121		neigh_release(neigh);
2122	dst_release(dst);
2123	return rc;
2124}
2125
2126/**
2127 * i40iw_ipv4_is_loopback - check if loopback
2128 * @loc_addr: local addr to compare
2129 * @rem_addr: remote address
2130 */
2131static bool i40iw_ipv4_is_loopback(u32 loc_addr, u32 rem_addr)
2132{
2133	return ipv4_is_loopback(htonl(rem_addr)) || (loc_addr == rem_addr);
2134}
2135
2136/**
2137 * i40iw_ipv6_is_loopback - check if loopback
2138 * @loc_addr: local addr to compare
2139 * @rem_addr: remote address
2140 */
2141static bool i40iw_ipv6_is_loopback(u32 *loc_addr, u32 *rem_addr)
2142{
2143	struct in6_addr raddr6;
2144
2145	i40iw_copy_ip_htonl(raddr6.in6_u.u6_addr32, rem_addr);
2146	return !memcmp(loc_addr, rem_addr, 16) || ipv6_addr_loopback(&raddr6);
2147}
2148
2149/**
2150 * i40iw_make_cm_node - create a new instance of a cm node
2151 * @cm_core: cm's core
2152 * @iwdev: iwarp device structure
2153 * @cm_info: quad info for connection
2154 * @listener: passive connection's listener
2155 */
2156static struct i40iw_cm_node *i40iw_make_cm_node(
2157				   struct i40iw_cm_core *cm_core,
2158				   struct i40iw_device *iwdev,
2159				   struct i40iw_cm_info *cm_info,
2160				   struct i40iw_cm_listener *listener)
2161{
2162	struct i40iw_cm_node *cm_node;
2163	int oldarpindex;
2164	int arpindex;
2165	struct net_device *netdev = iwdev->netdev;
2166
2167	/* create an hte and cm_node for this instance */
2168	cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
2169	if (!cm_node)
2170		return NULL;
2171
2172	/* set our node specific transport info */
2173	cm_node->ipv4 = cm_info->ipv4;
2174	cm_node->vlan_id = cm_info->vlan_id;
2175	if ((cm_node->vlan_id == I40IW_NO_VLAN) && iwdev->dcb)
2176		cm_node->vlan_id = 0;
2177	cm_node->tos = cm_info->tos;
2178	cm_node->user_pri = cm_info->user_pri;
2179	if (listener) {
2180		if (listener->tos != cm_info->tos)
2181			i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB,
2182				    "application TOS[%d] and remote client TOS[%d] mismatch\n",
2183				     listener->tos, cm_info->tos);
2184		cm_node->tos = max(listener->tos, cm_info->tos);
2185		cm_node->user_pri = rt_tos2priority(cm_node->tos);
2186		i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "listener: TOS:[%d] UP:[%d]\n",
2187			    cm_node->tos, cm_node->user_pri);
2188	}
2189	memcpy(cm_node->loc_addr, cm_info->loc_addr, sizeof(cm_node->loc_addr));
2190	memcpy(cm_node->rem_addr, cm_info->rem_addr, sizeof(cm_node->rem_addr));
2191	cm_node->loc_port = cm_info->loc_port;
2192	cm_node->rem_port = cm_info->rem_port;
2193
2194	cm_node->mpa_frame_rev = iwdev->mpa_version;
2195	cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
2196	cm_node->ird_size = I40IW_MAX_IRD_SIZE;
2197	cm_node->ord_size = I40IW_MAX_ORD_SIZE;
2198
2199	cm_node->listener = listener;
2200	cm_node->cm_id = cm_info->cm_id;
2201	ether_addr_copy(cm_node->loc_mac, netdev->dev_addr);
2202	spin_lock_init(&cm_node->retrans_list_lock);
2203	cm_node->ack_rcvd = false;
2204
2205	atomic_set(&cm_node->ref_count, 1);
2206	/* associate our parent CM core */
2207	cm_node->cm_core = cm_core;
2208	cm_node->tcp_cntxt.loc_id = I40IW_CM_DEF_LOCAL_ID;
2209	cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2210	cm_node->tcp_cntxt.rcv_wnd =
2211			I40IW_CM_DEFAULT_RCV_WND_SCALED >> I40IW_CM_DEFAULT_RCV_WND_SCALE;
2212	if (cm_node->ipv4) {
2213		cm_node->tcp_cntxt.loc_seq_num = secure_tcp_seq(htonl(cm_node->loc_addr[0]),
2214							htonl(cm_node->rem_addr[0]),
2215							htons(cm_node->loc_port),
2216							htons(cm_node->rem_port));
2217		cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV4;
2218	} else if (IS_ENABLED(CONFIG_IPV6)) {
2219		__be32 loc[4] = {
2220			htonl(cm_node->loc_addr[0]), htonl(cm_node->loc_addr[1]),
2221			htonl(cm_node->loc_addr[2]), htonl(cm_node->loc_addr[3])
2222		};
2223		__be32 rem[4] = {
2224			htonl(cm_node->rem_addr[0]), htonl(cm_node->rem_addr[1]),
2225			htonl(cm_node->rem_addr[2]), htonl(cm_node->rem_addr[3])
2226		};
2227		cm_node->tcp_cntxt.loc_seq_num = secure_tcpv6_seq(loc, rem,
2228							htons(cm_node->loc_port),
2229							htons(cm_node->rem_port));
2230		cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV6;
2231	}
2232
2233	cm_node->iwdev = iwdev;
2234	cm_node->dev = &iwdev->sc_dev;
2235
2236	if ((cm_node->ipv4 &&
2237	     i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
2238	     (!cm_node->ipv4 && i40iw_ipv6_is_loopback(cm_node->loc_addr,
2239						       cm_node->rem_addr))) {
2240		arpindex = i40iw_arp_table(iwdev,
2241					   cm_node->rem_addr,
2242					   false,
2243					   NULL,
2244					   I40IW_ARP_RESOLVE);
2245	} else {
2246		oldarpindex = i40iw_arp_table(iwdev,
2247					      cm_node->rem_addr,
2248					      false,
2249					      NULL,
2250					      I40IW_ARP_RESOLVE);
2251		if (cm_node->ipv4)
2252			arpindex = i40iw_addr_resolve_neigh(iwdev,
2253							    cm_info->loc_addr[0],
2254							    cm_info->rem_addr[0],
2255							    oldarpindex);
2256		else if (IS_ENABLED(CONFIG_IPV6))
2257			arpindex = i40iw_addr_resolve_neigh_ipv6(iwdev,
2258								 cm_info->loc_addr,
2259								 cm_info->rem_addr,
2260								 oldarpindex);
2261		else
2262			arpindex = -EINVAL;
2263	}
2264	if (arpindex < 0) {
2265		i40iw_pr_err("cm_node arpindex\n");
2266		kfree(cm_node);
2267		return NULL;
2268	}
2269	ether_addr_copy(cm_node->rem_mac, iwdev->arp_table[arpindex].mac_addr);
2270	i40iw_add_hte_node(cm_core, cm_node);
2271	cm_core->stats_nodes_created++;
2272	return cm_node;
2273}
2274
2275/**
2276 * i40iw_rem_ref_cm_node - destroy an instance of a cm node
2277 * @cm_node: connection's node
2278 */
2279static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *cm_node)
2280{
2281	struct i40iw_cm_core *cm_core = cm_node->cm_core;
2282	struct i40iw_qp *iwqp;
2283	struct i40iw_cm_info nfo;
2284	unsigned long flags;
2285
2286	spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
2287	if (atomic_dec_return(&cm_node->ref_count)) {
2288		spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2289		return;
2290	}
2291	list_del(&cm_node->list);
2292	spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2293
2294	/* if the node is destroyed before connection was accelerated */
2295	if (!cm_node->accelerated && cm_node->accept_pend) {
2296		pr_err("node destroyed before established\n");
2297		atomic_dec(&cm_node->listener->pend_accepts_cnt);
2298	}
2299	if (cm_node->close_entry)
2300		i40iw_handle_close_entry(cm_node, 0);
2301	if (cm_node->listener) {
2302		i40iw_dec_refcnt_listen(cm_core, cm_node->listener, 0, true);
2303	} else {
2304		if (cm_node->apbvt_set) {
2305			i40iw_manage_apbvt(cm_node->iwdev,
2306					   cm_node->loc_port,
2307					   I40IW_MANAGE_APBVT_DEL);
2308			cm_node->apbvt_set = 0;
2309		}
2310		i40iw_get_addr_info(cm_node, &nfo);
2311		if (cm_node->qhash_set) {
2312			i40iw_manage_qhash(cm_node->iwdev,
2313					   &nfo,
2314					   I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2315					   I40IW_QHASH_MANAGE_TYPE_DELETE,
2316					   NULL,
2317					   false);
2318			cm_node->qhash_set = 0;
2319		}
2320	}
2321
2322	iwqp = cm_node->iwqp;
2323	if (iwqp) {
2324		iwqp->cm_node = NULL;
2325		i40iw_qp_rem_ref(&iwqp->ibqp);
2326		cm_node->iwqp = NULL;
2327	} else if (cm_node->qhash_set) {
2328		i40iw_get_addr_info(cm_node, &nfo);
2329		i40iw_manage_qhash(cm_node->iwdev,
2330				   &nfo,
2331				   I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2332				   I40IW_QHASH_MANAGE_TYPE_DELETE,
2333				   NULL,
2334				   false);
2335		cm_node->qhash_set = 0;
2336	}
2337
2338	cm_node->cm_core->stats_nodes_destroyed++;
2339	kfree(cm_node);
2340}
2341
2342/**
2343 * i40iw_handle_fin_pkt - FIN packet received
2344 * @cm_node: connection's node
2345 */
2346static void i40iw_handle_fin_pkt(struct i40iw_cm_node *cm_node)
2347{
2348	u32 ret;
2349
2350	switch (cm_node->state) {
2351	case I40IW_CM_STATE_SYN_RCVD:
2352	case I40IW_CM_STATE_SYN_SENT:
2353	case I40IW_CM_STATE_ESTABLISHED:
2354	case I40IW_CM_STATE_MPAREJ_RCVD:
2355		cm_node->tcp_cntxt.rcv_nxt++;
2356		i40iw_cleanup_retrans_entry(cm_node);
2357		cm_node->state = I40IW_CM_STATE_LAST_ACK;
2358		i40iw_send_fin(cm_node);
2359		break;
2360	case I40IW_CM_STATE_MPAREQ_SENT:
2361		i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
2362		cm_node->tcp_cntxt.rcv_nxt++;
2363		i40iw_cleanup_retrans_entry(cm_node);
2364		cm_node->state = I40IW_CM_STATE_CLOSED;
2365		atomic_inc(&cm_node->ref_count);
2366		i40iw_send_reset(cm_node);
2367		break;
2368	case I40IW_CM_STATE_FIN_WAIT1:
2369		cm_node->tcp_cntxt.rcv_nxt++;
2370		i40iw_cleanup_retrans_entry(cm_node);
2371		cm_node->state = I40IW_CM_STATE_CLOSING;
2372		i40iw_send_ack(cm_node);
2373		/*
2374		 * Wait for ACK as this is simultaneous close.
2375		 * After we receive ACK, do not send anything.
2376		 * Just rm the node.
2377		 */
2378		break;
2379	case I40IW_CM_STATE_FIN_WAIT2:
2380		cm_node->tcp_cntxt.rcv_nxt++;
2381		i40iw_cleanup_retrans_entry(cm_node);
2382		cm_node->state = I40IW_CM_STATE_TIME_WAIT;
2383		i40iw_send_ack(cm_node);
2384		ret =
2385		    i40iw_schedule_cm_timer(cm_node, NULL, I40IW_TIMER_TYPE_CLOSE, 1, 0);
2386		if (ret)
2387			i40iw_pr_err("node %p state = %d\n", cm_node, cm_node->state);
2388		break;
2389	case I40IW_CM_STATE_TIME_WAIT:
2390		cm_node->tcp_cntxt.rcv_nxt++;
2391		i40iw_cleanup_retrans_entry(cm_node);
2392		cm_node->state = I40IW_CM_STATE_CLOSED;
2393		i40iw_rem_ref_cm_node(cm_node);
2394		break;
2395	case I40IW_CM_STATE_OFFLOADED:
2396	default:
2397		i40iw_pr_err("bad state node %p state = %d\n", cm_node, cm_node->state);
2398		break;
2399	}
2400}
2401
2402/**
2403 * i40iw_handle_rst_pkt - process received RST packet
2404 * @cm_node: connection's node
2405 * @rbuf: receive buffer
2406 */
2407static void i40iw_handle_rst_pkt(struct i40iw_cm_node *cm_node,
2408				 struct i40iw_puda_buf *rbuf)
2409{
2410	i40iw_cleanup_retrans_entry(cm_node);
2411	switch (cm_node->state) {
2412	case I40IW_CM_STATE_SYN_SENT:
2413	case I40IW_CM_STATE_MPAREQ_SENT:
2414		switch (cm_node->mpa_frame_rev) {
2415		case IETF_MPA_V2:
2416			cm_node->mpa_frame_rev = IETF_MPA_V1;
2417			/* send a syn and goto syn sent state */
2418			cm_node->state = I40IW_CM_STATE_SYN_SENT;
2419			if (i40iw_send_syn(cm_node, 0))
2420				i40iw_active_open_err(cm_node, false);
2421			break;
2422		case IETF_MPA_V1:
2423		default:
2424			i40iw_active_open_err(cm_node, false);
2425			break;
2426		}
2427		break;
2428	case I40IW_CM_STATE_MPAREQ_RCVD:
2429		atomic_add_return(1, &cm_node->passive_state);
2430		break;
2431	case I40IW_CM_STATE_ESTABLISHED:
2432	case I40IW_CM_STATE_SYN_RCVD:
2433	case I40IW_CM_STATE_LISTENING:
2434		i40iw_pr_err("Bad state state = %d\n", cm_node->state);
2435		i40iw_passive_open_err(cm_node, false);
2436		break;
2437	case I40IW_CM_STATE_OFFLOADED:
2438		i40iw_active_open_err(cm_node, false);
2439		break;
2440	case I40IW_CM_STATE_CLOSED:
2441		break;
2442	case I40IW_CM_STATE_FIN_WAIT2:
2443	case I40IW_CM_STATE_FIN_WAIT1:
2444	case I40IW_CM_STATE_LAST_ACK:
2445		cm_node->cm_id->rem_ref(cm_node->cm_id);
2446		fallthrough;
2447	case I40IW_CM_STATE_TIME_WAIT:
2448		cm_node->state = I40IW_CM_STATE_CLOSED;
2449		i40iw_rem_ref_cm_node(cm_node);
2450		break;
2451	default:
2452		break;
2453	}
2454}
2455
2456/**
2457 * i40iw_handle_rcv_mpa - Process a recv'd mpa buffer
2458 * @cm_node: connection's node
2459 * @rbuf: receive buffer
2460 */
2461static void i40iw_handle_rcv_mpa(struct i40iw_cm_node *cm_node,
2462				 struct i40iw_puda_buf *rbuf)
2463{
2464	int ret;
2465	int datasize = rbuf->datalen;
2466	u8 *dataloc = rbuf->data;
2467
2468	enum i40iw_cm_event_type type = I40IW_CM_EVENT_UNKNOWN;
2469	u32 res_type;
2470
2471	ret = i40iw_parse_mpa(cm_node, dataloc, &res_type, datasize);
2472	if (ret) {
2473		if (cm_node->state == I40IW_CM_STATE_MPAREQ_SENT)
2474			i40iw_active_open_err(cm_node, true);
2475		else
2476			i40iw_passive_open_err(cm_node, true);
2477		return;
2478	}
2479
2480	switch (cm_node->state) {
2481	case I40IW_CM_STATE_ESTABLISHED:
2482		if (res_type == I40IW_MPA_REQUEST_REJECT)
2483			i40iw_pr_err("state for reject\n");
2484		cm_node->state = I40IW_CM_STATE_MPAREQ_RCVD;
2485		type = I40IW_CM_EVENT_MPA_REQ;
2486		i40iw_send_ack(cm_node);	/* ACK received MPA request */
2487		atomic_set(&cm_node->passive_state,
2488			   I40IW_PASSIVE_STATE_INDICATED);
2489		break;
2490	case I40IW_CM_STATE_MPAREQ_SENT:
2491		i40iw_cleanup_retrans_entry(cm_node);
2492		if (res_type == I40IW_MPA_REQUEST_REJECT) {
2493			type = I40IW_CM_EVENT_MPA_REJECT;
2494			cm_node->state = I40IW_CM_STATE_MPAREJ_RCVD;
2495		} else {
2496			type = I40IW_CM_EVENT_CONNECTED;
2497			cm_node->state = I40IW_CM_STATE_OFFLOADED;
2498		}
2499		i40iw_send_ack(cm_node);
2500		break;
2501	default:
2502		pr_err("%s wrong cm_node state =%d\n", __func__, cm_node->state);
2503		break;
2504	}
2505	i40iw_create_event(cm_node, type);
2506}
2507
2508/**
2509 * i40iw_indicate_pkt_err - Send up err event to cm
2510 * @cm_node: connection's node
2511 */
2512static void i40iw_indicate_pkt_err(struct i40iw_cm_node *cm_node)
2513{
2514	switch (cm_node->state) {
2515	case I40IW_CM_STATE_SYN_SENT:
2516	case I40IW_CM_STATE_MPAREQ_SENT:
2517		i40iw_active_open_err(cm_node, true);
2518		break;
2519	case I40IW_CM_STATE_ESTABLISHED:
2520	case I40IW_CM_STATE_SYN_RCVD:
2521		i40iw_passive_open_err(cm_node, true);
2522		break;
2523	case I40IW_CM_STATE_OFFLOADED:
2524	default:
2525		break;
2526	}
2527}
2528
2529/**
2530 * i40iw_check_syn - Check for error on received syn ack
2531 * @cm_node: connection's node
2532 * @tcph: pointer tcp header
2533 */
2534static int i40iw_check_syn(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2535{
2536	int err = 0;
2537
2538	if (ntohl(tcph->ack_seq) != cm_node->tcp_cntxt.loc_seq_num) {
2539		err = 1;
2540		i40iw_active_open_err(cm_node, true);
2541	}
2542	return err;
2543}
2544
2545/**
2546 * i40iw_check_seq - check seq numbers if OK
2547 * @cm_node: connection's node
2548 * @tcph: pointer tcp header
2549 */
2550static int i40iw_check_seq(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2551{
2552	int err = 0;
2553	u32 seq;
2554	u32 ack_seq;
2555	u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
2556	u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
2557	u32 rcv_wnd;
2558
2559	seq = ntohl(tcph->seq);
2560	ack_seq = ntohl(tcph->ack_seq);
2561	rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
2562	if (ack_seq != loc_seq_num)
2563		err = -1;
2564	else if (!between(seq, rcv_nxt, (rcv_nxt + rcv_wnd)))
2565		err = -1;
2566	if (err) {
2567		i40iw_pr_err("seq number\n");
2568		i40iw_indicate_pkt_err(cm_node);
2569	}
2570	return err;
2571}
2572
2573/**
2574 * i40iw_handle_syn_pkt - is for Passive node
2575 * @cm_node: connection's node
2576 * @rbuf: receive buffer
2577 */
2578static void i40iw_handle_syn_pkt(struct i40iw_cm_node *cm_node,
2579				 struct i40iw_puda_buf *rbuf)
2580{
2581	struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2582	int ret;
2583	u32 inc_sequence;
2584	int optionsize;
2585	struct i40iw_cm_info nfo;
2586
2587	optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2588	inc_sequence = ntohl(tcph->seq);
2589
2590	switch (cm_node->state) {
2591	case I40IW_CM_STATE_SYN_SENT:
2592	case I40IW_CM_STATE_MPAREQ_SENT:
2593		/* Rcvd syn on active open connection */
2594		i40iw_active_open_err(cm_node, 1);
2595		break;
2596	case I40IW_CM_STATE_LISTENING:
2597		/* Passive OPEN */
2598		if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
2599		    cm_node->listener->backlog) {
2600			cm_node->cm_core->stats_backlog_drops++;
2601			i40iw_passive_open_err(cm_node, false);
2602			break;
2603		}
2604		ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2605		if (ret) {
2606			i40iw_passive_open_err(cm_node, false);
2607			/* drop pkt */
2608			break;
2609		}
2610		cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2611		cm_node->accept_pend = 1;
2612		atomic_inc(&cm_node->listener->pend_accepts_cnt);
2613
2614		cm_node->state = I40IW_CM_STATE_SYN_RCVD;
2615		i40iw_get_addr_info(cm_node, &nfo);
2616		ret = i40iw_manage_qhash(cm_node->iwdev,
2617					 &nfo,
2618					 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2619					 I40IW_QHASH_MANAGE_TYPE_ADD,
2620					 (void *)cm_node,
2621					 false);
2622		cm_node->qhash_set = true;
2623		break;
2624	case I40IW_CM_STATE_CLOSED:
2625		i40iw_cleanup_retrans_entry(cm_node);
2626		atomic_inc(&cm_node->ref_count);
2627		i40iw_send_reset(cm_node);
2628		break;
2629	case I40IW_CM_STATE_OFFLOADED:
2630	case I40IW_CM_STATE_ESTABLISHED:
2631	case I40IW_CM_STATE_FIN_WAIT1:
2632	case I40IW_CM_STATE_FIN_WAIT2:
2633	case I40IW_CM_STATE_MPAREQ_RCVD:
2634	case I40IW_CM_STATE_LAST_ACK:
2635	case I40IW_CM_STATE_CLOSING:
2636	case I40IW_CM_STATE_UNKNOWN:
2637	default:
2638		break;
2639	}
2640}
2641
2642/**
2643 * i40iw_handle_synack_pkt - Process SYN+ACK packet (active side)
2644 * @cm_node: connection's node
2645 * @rbuf: receive buffer
2646 */
2647static void i40iw_handle_synack_pkt(struct i40iw_cm_node *cm_node,
2648				    struct i40iw_puda_buf *rbuf)
2649{
2650	struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2651	int ret;
2652	u32 inc_sequence;
2653	int optionsize;
2654
2655	optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2656	inc_sequence = ntohl(tcph->seq);
2657	switch (cm_node->state) {
2658	case I40IW_CM_STATE_SYN_SENT:
2659		i40iw_cleanup_retrans_entry(cm_node);
2660		/* active open */
2661		if (i40iw_check_syn(cm_node, tcph)) {
2662			i40iw_pr_err("check syn fail\n");
2663			return;
2664		}
2665		cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2666		/* setup options */
2667		ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 0);
2668		if (ret) {
2669			i40iw_debug(cm_node->dev,
2670				    I40IW_DEBUG_CM,
2671				    "cm_node=%p tcp_options failed\n",
2672				    cm_node);
2673			break;
2674		}
2675		i40iw_cleanup_retrans_entry(cm_node);
2676		cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2677		i40iw_send_ack(cm_node);	/* ACK  for the syn_ack */
2678		ret = i40iw_send_mpa_request(cm_node);
2679		if (ret) {
2680			i40iw_debug(cm_node->dev,
2681				    I40IW_DEBUG_CM,
2682				    "cm_node=%p i40iw_send_mpa_request failed\n",
2683				    cm_node);
2684			break;
2685		}
2686		cm_node->state = I40IW_CM_STATE_MPAREQ_SENT;
2687		break;
2688	case I40IW_CM_STATE_MPAREQ_RCVD:
2689		i40iw_passive_open_err(cm_node, true);
2690		break;
2691	case I40IW_CM_STATE_LISTENING:
2692		cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2693		i40iw_cleanup_retrans_entry(cm_node);
2694		cm_node->state = I40IW_CM_STATE_CLOSED;
2695		i40iw_send_reset(cm_node);
2696		break;
2697	case I40IW_CM_STATE_CLOSED:
2698		cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2699		i40iw_cleanup_retrans_entry(cm_node);
2700		atomic_inc(&cm_node->ref_count);
2701		i40iw_send_reset(cm_node);
2702		break;
2703	case I40IW_CM_STATE_ESTABLISHED:
2704	case I40IW_CM_STATE_FIN_WAIT1:
2705	case I40IW_CM_STATE_FIN_WAIT2:
2706	case I40IW_CM_STATE_LAST_ACK:
2707	case I40IW_CM_STATE_OFFLOADED:
2708	case I40IW_CM_STATE_CLOSING:
2709	case I40IW_CM_STATE_UNKNOWN:
2710	case I40IW_CM_STATE_MPAREQ_SENT:
2711	default:
2712		break;
2713	}
2714}
2715
2716/**
2717 * i40iw_handle_ack_pkt - process packet with ACK
2718 * @cm_node: connection's node
2719 * @rbuf: receive buffer
2720 */
2721static int i40iw_handle_ack_pkt(struct i40iw_cm_node *cm_node,
2722				struct i40iw_puda_buf *rbuf)
2723{
2724	struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2725	u32 inc_sequence;
2726	int ret = 0;
2727	int optionsize;
2728	u32 datasize = rbuf->datalen;
2729
2730	optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2731
2732	if (i40iw_check_seq(cm_node, tcph))
2733		return -EINVAL;
2734
2735	inc_sequence = ntohl(tcph->seq);
2736	switch (cm_node->state) {
2737	case I40IW_CM_STATE_SYN_RCVD:
2738		i40iw_cleanup_retrans_entry(cm_node);
2739		ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2740		if (ret)
2741			break;
2742		cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2743		cm_node->state = I40IW_CM_STATE_ESTABLISHED;
2744		if (datasize) {
2745			cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2746			i40iw_handle_rcv_mpa(cm_node, rbuf);
2747		}
2748		break;
2749	case I40IW_CM_STATE_ESTABLISHED:
2750		i40iw_cleanup_retrans_entry(cm_node);
2751		if (datasize) {
2752			cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2753			i40iw_handle_rcv_mpa(cm_node, rbuf);
2754		}
2755		break;
2756	case I40IW_CM_STATE_MPAREQ_SENT:
2757		cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2758		if (datasize) {
2759			cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2760			cm_node->ack_rcvd = false;
2761			i40iw_handle_rcv_mpa(cm_node, rbuf);
2762		} else {
2763			cm_node->ack_rcvd = true;
2764		}
2765		break;
2766	case I40IW_CM_STATE_LISTENING:
2767		i40iw_cleanup_retrans_entry(cm_node);
2768		cm_node->state = I40IW_CM_STATE_CLOSED;
2769		i40iw_send_reset(cm_node);
2770		break;
2771	case I40IW_CM_STATE_CLOSED:
2772		i40iw_cleanup_retrans_entry(cm_node);
2773		atomic_inc(&cm_node->ref_count);
2774		i40iw_send_reset(cm_node);
2775		break;
2776	case I40IW_CM_STATE_LAST_ACK:
2777	case I40IW_CM_STATE_CLOSING:
2778		i40iw_cleanup_retrans_entry(cm_node);
2779		cm_node->state = I40IW_CM_STATE_CLOSED;
2780		if (!cm_node->accept_pend)
2781			cm_node->cm_id->rem_ref(cm_node->cm_id);
2782		i40iw_rem_ref_cm_node(cm_node);
2783		break;
2784	case I40IW_CM_STATE_FIN_WAIT1:
2785		i40iw_cleanup_retrans_entry(cm_node);
2786		cm_node->state = I40IW_CM_STATE_FIN_WAIT2;
2787		break;
2788	case I40IW_CM_STATE_SYN_SENT:
2789	case I40IW_CM_STATE_FIN_WAIT2:
2790	case I40IW_CM_STATE_OFFLOADED:
2791	case I40IW_CM_STATE_MPAREQ_RCVD:
2792	case I40IW_CM_STATE_UNKNOWN:
2793	default:
2794		i40iw_cleanup_retrans_entry(cm_node);
2795		break;
2796	}
2797	return ret;
2798}
2799
2800/**
2801 * i40iw_process_packet - process cm packet
2802 * @cm_node: connection's node
2803 * @rbuf: receive buffer
2804 */
2805static void i40iw_process_packet(struct i40iw_cm_node *cm_node,
2806				 struct i40iw_puda_buf *rbuf)
2807{
2808	enum i40iw_tcpip_pkt_type pkt_type = I40IW_PKT_TYPE_UNKNOWN;
2809	struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2810	u32 fin_set = 0;
2811	int ret;
2812
2813	if (tcph->rst) {
2814		pkt_type = I40IW_PKT_TYPE_RST;
2815	} else if (tcph->syn) {
2816		pkt_type = I40IW_PKT_TYPE_SYN;
2817		if (tcph->ack)
2818			pkt_type = I40IW_PKT_TYPE_SYNACK;
2819	} else if (tcph->ack) {
2820		pkt_type = I40IW_PKT_TYPE_ACK;
2821	}
2822	if (tcph->fin)
2823		fin_set = 1;
2824
2825	switch (pkt_type) {
2826	case I40IW_PKT_TYPE_SYN:
2827		i40iw_handle_syn_pkt(cm_node, rbuf);
2828		break;
2829	case I40IW_PKT_TYPE_SYNACK:
2830		i40iw_handle_synack_pkt(cm_node, rbuf);
2831		break;
2832	case I40IW_PKT_TYPE_ACK:
2833		ret = i40iw_handle_ack_pkt(cm_node, rbuf);
2834		if (fin_set && !ret)
2835			i40iw_handle_fin_pkt(cm_node);
2836		break;
2837	case I40IW_PKT_TYPE_RST:
2838		i40iw_handle_rst_pkt(cm_node, rbuf);
2839		break;
2840	default:
2841		if (fin_set &&
2842		    (!i40iw_check_seq(cm_node, (struct tcphdr *)rbuf->tcph)))
2843			i40iw_handle_fin_pkt(cm_node);
2844		break;
2845	}
2846}
2847
2848/**
2849 * i40iw_make_listen_node - create a listen node with params
2850 * @cm_core: cm's core
2851 * @iwdev: iwarp device structure
2852 * @cm_info: quad info for connection
2853 */
2854static struct i40iw_cm_listener *i40iw_make_listen_node(
2855					struct i40iw_cm_core *cm_core,
2856					struct i40iw_device *iwdev,
2857					struct i40iw_cm_info *cm_info)
2858{
2859	struct i40iw_cm_listener *listener;
2860	unsigned long flags;
2861
2862	/* cannot have multiple matching listeners */
2863	listener = i40iw_find_listener(cm_core, cm_info->loc_addr,
2864				       cm_info->loc_port,
2865				       cm_info->vlan_id,
2866				       I40IW_CM_LISTENER_EITHER_STATE);
2867	if (listener &&
2868	    (listener->listener_state == I40IW_CM_LISTENER_ACTIVE_STATE)) {
2869		atomic_dec(&listener->ref_count);
2870		i40iw_debug(cm_core->dev,
2871			    I40IW_DEBUG_CM,
2872			    "Not creating listener since it already exists\n");
2873		return NULL;
2874	}
2875
2876	if (!listener) {
2877		/* create a CM listen node (1/2 node to compare incoming traffic to) */
2878		listener = kzalloc(sizeof(*listener), GFP_KERNEL);
2879		if (!listener)
2880			return NULL;
2881		cm_core->stats_listen_nodes_created++;
2882		memcpy(listener->loc_addr, cm_info->loc_addr, sizeof(listener->loc_addr));
2883		listener->loc_port = cm_info->loc_port;
2884
2885		INIT_LIST_HEAD(&listener->child_listen_list);
2886
2887		atomic_set(&listener->ref_count, 1);
2888	} else {
2889		listener->reused_node = 1;
2890	}
2891
2892	listener->cm_id = cm_info->cm_id;
2893	listener->ipv4 = cm_info->ipv4;
2894	listener->vlan_id = cm_info->vlan_id;
2895	atomic_set(&listener->pend_accepts_cnt, 0);
2896	listener->cm_core = cm_core;
2897	listener->iwdev = iwdev;
2898
2899	listener->backlog = cm_info->backlog;
2900	listener->listener_state = I40IW_CM_LISTENER_ACTIVE_STATE;
2901
2902	if (!listener->reused_node) {
2903		spin_lock_irqsave(&cm_core->listen_list_lock, flags);
2904		list_add(&listener->list, &cm_core->listen_nodes);
2905		spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
2906	}
2907
2908	return listener;
2909}
2910
2911/**
2912 * i40iw_create_cm_node - make a connection node with params
2913 * @cm_core: cm's core
2914 * @iwdev: iwarp device structure
2915 * @conn_param: upper layer connection parameters
2916 * @cm_info: quad info for connection
2917 */
2918static struct i40iw_cm_node *i40iw_create_cm_node(
2919					struct i40iw_cm_core *cm_core,
2920					struct i40iw_device *iwdev,
2921					struct iw_cm_conn_param *conn_param,
2922					struct i40iw_cm_info *cm_info)
2923{
2924	struct i40iw_cm_node *cm_node;
2925	struct i40iw_cm_listener *loopback_remotelistener;
2926	struct i40iw_cm_node *loopback_remotenode;
2927	struct i40iw_cm_info loopback_cm_info;
2928
2929	u16 private_data_len = conn_param->private_data_len;
2930	const void *private_data = conn_param->private_data;
2931
2932	/* create a CM connection node */
2933	cm_node = i40iw_make_cm_node(cm_core, iwdev, cm_info, NULL);
2934	if (!cm_node)
2935		return ERR_PTR(-ENOMEM);
2936	/* set our node side to client (active) side */
2937	cm_node->tcp_cntxt.client = 1;
2938	cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2939
2940	i40iw_record_ird_ord(cm_node, conn_param->ird, conn_param->ord);
2941
2942	if (!memcmp(cm_info->loc_addr, cm_info->rem_addr, sizeof(cm_info->loc_addr))) {
2943		loopback_remotelistener = i40iw_find_listener(
2944						cm_core,
2945						cm_info->rem_addr,
2946						cm_node->rem_port,
2947						cm_node->vlan_id,
2948						I40IW_CM_LISTENER_ACTIVE_STATE);
2949		if (!loopback_remotelistener) {
2950			i40iw_rem_ref_cm_node(cm_node);
2951			return ERR_PTR(-ECONNREFUSED);
2952		} else {
2953			loopback_cm_info = *cm_info;
2954			loopback_cm_info.loc_port = cm_info->rem_port;
2955			loopback_cm_info.rem_port = cm_info->loc_port;
2956			loopback_cm_info.cm_id = loopback_remotelistener->cm_id;
2957			loopback_cm_info.ipv4 = cm_info->ipv4;
2958			loopback_remotenode = i40iw_make_cm_node(cm_core,
2959								 iwdev,
2960								 &loopback_cm_info,
2961								 loopback_remotelistener);
2962			if (!loopback_remotenode) {
2963				i40iw_rem_ref_cm_node(cm_node);
2964				return ERR_PTR(-ENOMEM);
2965			}
2966			cm_core->stats_loopbacks++;
2967			loopback_remotenode->loopbackpartner = cm_node;
2968			loopback_remotenode->tcp_cntxt.rcv_wscale =
2969				I40IW_CM_DEFAULT_RCV_WND_SCALE;
2970			cm_node->loopbackpartner = loopback_remotenode;
2971			memcpy(loopback_remotenode->pdata_buf, private_data,
2972			       private_data_len);
2973			loopback_remotenode->pdata.size = private_data_len;
2974
2975			if (loopback_remotenode->ord_size > cm_node->ird_size)
2976				loopback_remotenode->ord_size =
2977					cm_node->ird_size;
2978
2979			cm_node->state = I40IW_CM_STATE_OFFLOADED;
2980			cm_node->tcp_cntxt.rcv_nxt =
2981				loopback_remotenode->tcp_cntxt.loc_seq_num;
2982			loopback_remotenode->tcp_cntxt.rcv_nxt =
2983				cm_node->tcp_cntxt.loc_seq_num;
2984			cm_node->tcp_cntxt.max_snd_wnd =
2985				loopback_remotenode->tcp_cntxt.rcv_wnd;
2986			loopback_remotenode->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
2987			cm_node->tcp_cntxt.snd_wnd = loopback_remotenode->tcp_cntxt.rcv_wnd;
2988			loopback_remotenode->tcp_cntxt.snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
2989			cm_node->tcp_cntxt.snd_wscale = loopback_remotenode->tcp_cntxt.rcv_wscale;
2990			loopback_remotenode->tcp_cntxt.snd_wscale = cm_node->tcp_cntxt.rcv_wscale;
2991		}
2992		return cm_node;
2993	}
2994
2995	cm_node->pdata.size = private_data_len;
2996	cm_node->pdata.addr = cm_node->pdata_buf;
2997
2998	memcpy(cm_node->pdata_buf, private_data, private_data_len);
2999
3000	cm_node->state = I40IW_CM_STATE_SYN_SENT;
3001	return cm_node;
3002}
3003
3004/**
3005 * i40iw_cm_reject - reject and teardown a connection
3006 * @cm_node: connection's node
3007 * @pdate: ptr to private data for reject
3008 * @plen: size of private data
3009 */
3010static int i40iw_cm_reject(struct i40iw_cm_node *cm_node, const void *pdata, u8 plen)
3011{
3012	int ret = 0;
3013	int err;
3014	int passive_state;
3015	struct iw_cm_id *cm_id = cm_node->cm_id;
3016	struct i40iw_cm_node *loopback = cm_node->loopbackpartner;
3017
3018	if (cm_node->tcp_cntxt.client)
3019		return ret;
3020	i40iw_cleanup_retrans_entry(cm_node);
3021
3022	if (!loopback) {
3023		passive_state = atomic_add_return(1, &cm_node->passive_state);
3024		if (passive_state == I40IW_SEND_RESET_EVENT) {
3025			cm_node->state = I40IW_CM_STATE_CLOSED;
3026			i40iw_rem_ref_cm_node(cm_node);
3027		} else {
3028			if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3029				i40iw_rem_ref_cm_node(cm_node);
3030			} else {
3031				ret = i40iw_send_mpa_reject(cm_node, pdata, plen);
3032				if (ret) {
3033					cm_node->state = I40IW_CM_STATE_CLOSED;
3034					err = i40iw_send_reset(cm_node);
3035					if (err)
3036						i40iw_pr_err("send reset failed\n");
3037				} else {
3038					cm_id->add_ref(cm_id);
3039				}
3040			}
3041		}
3042	} else {
3043		cm_node->cm_id = NULL;
3044		if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3045			i40iw_rem_ref_cm_node(cm_node);
3046			i40iw_rem_ref_cm_node(loopback);
3047		} else {
3048			ret = i40iw_send_cm_event(loopback,
3049						  loopback->cm_id,
3050						  IW_CM_EVENT_CONNECT_REPLY,
3051						  -ECONNREFUSED);
3052			i40iw_rem_ref_cm_node(cm_node);
3053			loopback->state = I40IW_CM_STATE_CLOSING;
3054
3055			cm_id = loopback->cm_id;
3056			i40iw_rem_ref_cm_node(loopback);
3057			cm_id->rem_ref(cm_id);
3058		}
3059	}
3060
3061	return ret;
3062}
3063
3064/**
3065 * i40iw_cm_close - close of cm connection
3066 * @cm_node: connection's node
3067 */
3068static int i40iw_cm_close(struct i40iw_cm_node *cm_node)
3069{
3070	int ret = 0;
3071
3072	if (!cm_node)
3073		return -EINVAL;
3074
3075	switch (cm_node->state) {
3076	case I40IW_CM_STATE_SYN_RCVD:
3077	case I40IW_CM_STATE_SYN_SENT:
3078	case I40IW_CM_STATE_ONE_SIDE_ESTABLISHED:
3079	case I40IW_CM_STATE_ESTABLISHED:
3080	case I40IW_CM_STATE_ACCEPTING:
3081	case I40IW_CM_STATE_MPAREQ_SENT:
3082	case I40IW_CM_STATE_MPAREQ_RCVD:
3083		i40iw_cleanup_retrans_entry(cm_node);
3084		i40iw_send_reset(cm_node);
3085		break;
3086	case I40IW_CM_STATE_CLOSE_WAIT:
3087		cm_node->state = I40IW_CM_STATE_LAST_ACK;
3088		i40iw_send_fin(cm_node);
3089		break;
3090	case I40IW_CM_STATE_FIN_WAIT1:
3091	case I40IW_CM_STATE_FIN_WAIT2:
3092	case I40IW_CM_STATE_LAST_ACK:
3093	case I40IW_CM_STATE_TIME_WAIT:
3094	case I40IW_CM_STATE_CLOSING:
3095		ret = -1;
3096		break;
3097	case I40IW_CM_STATE_LISTENING:
3098		i40iw_cleanup_retrans_entry(cm_node);
3099		i40iw_send_reset(cm_node);
3100		break;
3101	case I40IW_CM_STATE_MPAREJ_RCVD:
3102	case I40IW_CM_STATE_UNKNOWN:
3103	case I40IW_CM_STATE_INITED:
3104	case I40IW_CM_STATE_CLOSED:
3105	case I40IW_CM_STATE_LISTENER_DESTROYED:
3106		i40iw_rem_ref_cm_node(cm_node);
3107		break;
3108	case I40IW_CM_STATE_OFFLOADED:
3109		if (cm_node->send_entry)
3110			i40iw_pr_err("send_entry\n");
3111		i40iw_rem_ref_cm_node(cm_node);
3112		break;
3113	}
3114	return ret;
3115}
3116
3117/**
3118 * i40iw_receive_ilq - recv an ETHERNET packet, and process it
3119 * through CM
3120 * @vsi: pointer to the vsi structure
3121 * @rbuf: receive buffer
3122 */
3123void i40iw_receive_ilq(struct i40iw_sc_vsi *vsi, struct i40iw_puda_buf *rbuf)
3124{
3125	struct i40iw_cm_node *cm_node;
3126	struct i40iw_cm_listener *listener;
3127	struct iphdr *iph;
3128	struct ipv6hdr *ip6h;
3129	struct tcphdr *tcph;
3130	struct i40iw_cm_info cm_info;
3131	struct i40iw_sc_dev *dev = vsi->dev;
3132	struct i40iw_device *iwdev = (struct i40iw_device *)dev->back_dev;
3133	struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3134	struct vlan_ethhdr *ethh;
3135	u16 vtag;
3136
3137	/* if vlan, then maclen = 18 else 14 */
3138	iph = (struct iphdr *)rbuf->iph;
3139	memset(&cm_info, 0, sizeof(cm_info));
3140
3141	i40iw_debug_buf(dev,
3142			I40IW_DEBUG_ILQ,
3143			"RECEIVE ILQ BUFFER",
3144			rbuf->mem.va,
3145			rbuf->totallen);
3146	ethh = (struct vlan_ethhdr *)rbuf->mem.va;
3147
3148	if (ethh->h_vlan_proto == htons(ETH_P_8021Q)) {
3149		vtag = ntohs(ethh->h_vlan_TCI);
3150		cm_info.user_pri = (vtag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
3151		cm_info.vlan_id = vtag & VLAN_VID_MASK;
3152		i40iw_debug(cm_core->dev,
3153			    I40IW_DEBUG_CM,
3154			    "%s vlan_id=%d\n",
3155			    __func__,
3156			    cm_info.vlan_id);
3157	} else {
3158		cm_info.vlan_id = I40IW_NO_VLAN;
3159	}
3160	tcph = (struct tcphdr *)rbuf->tcph;
3161
3162	if (rbuf->ipv4) {
3163		cm_info.loc_addr[0] = ntohl(iph->daddr);
3164		cm_info.rem_addr[0] = ntohl(iph->saddr);
3165		cm_info.ipv4 = true;
3166		cm_info.tos = iph->tos;
3167	} else {
3168		ip6h = (struct ipv6hdr *)rbuf->iph;
3169		i40iw_copy_ip_ntohl(cm_info.loc_addr,
3170				    ip6h->daddr.in6_u.u6_addr32);
3171		i40iw_copy_ip_ntohl(cm_info.rem_addr,
3172				    ip6h->saddr.in6_u.u6_addr32);
3173		cm_info.ipv4 = false;
3174		cm_info.tos = (ip6h->priority << 4) | (ip6h->flow_lbl[0] >> 4);
3175	}
3176	cm_info.loc_port = ntohs(tcph->dest);
3177	cm_info.rem_port = ntohs(tcph->source);
3178	cm_node = i40iw_find_node(cm_core,
3179				  cm_info.rem_port,
3180				  cm_info.rem_addr,
3181				  cm_info.loc_port,
3182				  cm_info.loc_addr,
3183				  true,
3184				  false);
3185
3186	if (!cm_node) {
3187		/* Only type of packet accepted are for */
3188		/* the PASSIVE open (syn only) */
3189		if (!tcph->syn || tcph->ack)
3190			return;
3191		listener =
3192		    i40iw_find_listener(cm_core,
3193					cm_info.loc_addr,
3194					cm_info.loc_port,
3195					cm_info.vlan_id,
3196					I40IW_CM_LISTENER_ACTIVE_STATE);
3197		if (!listener) {
3198			cm_info.cm_id = NULL;
3199			i40iw_debug(cm_core->dev,
3200				    I40IW_DEBUG_CM,
3201				    "%s no listener found\n",
3202				    __func__);
3203			return;
3204		}
3205		cm_info.cm_id = listener->cm_id;
3206		cm_node = i40iw_make_cm_node(cm_core, iwdev, &cm_info, listener);
3207		if (!cm_node) {
3208			i40iw_debug(cm_core->dev,
3209				    I40IW_DEBUG_CM,
3210				    "%s allocate node failed\n",
3211				    __func__);
3212			atomic_dec(&listener->ref_count);
3213			return;
3214		}
3215		if (!tcph->rst && !tcph->fin) {
3216			cm_node->state = I40IW_CM_STATE_LISTENING;
3217		} else {
3218			i40iw_rem_ref_cm_node(cm_node);
3219			return;
3220		}
3221		atomic_inc(&cm_node->ref_count);
3222	} else if (cm_node->state == I40IW_CM_STATE_OFFLOADED) {
3223		i40iw_rem_ref_cm_node(cm_node);
3224		return;
3225	}
3226	i40iw_process_packet(cm_node, rbuf);
3227	i40iw_rem_ref_cm_node(cm_node);
3228}
3229
3230/**
3231 * i40iw_setup_cm_core - allocate a top level instance of a cm
3232 * core
3233 * @iwdev: iwarp device structure
3234 */
3235int i40iw_setup_cm_core(struct i40iw_device *iwdev)
3236{
3237	struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3238
3239	cm_core->iwdev = iwdev;
3240	cm_core->dev = &iwdev->sc_dev;
3241
3242	INIT_LIST_HEAD(&cm_core->accelerated_list);
3243	INIT_LIST_HEAD(&cm_core->non_accelerated_list);
3244	INIT_LIST_HEAD(&cm_core->listen_nodes);
3245
3246	timer_setup(&cm_core->tcp_timer, i40iw_cm_timer_tick, 0);
3247
3248	spin_lock_init(&cm_core->ht_lock);
3249	spin_lock_init(&cm_core->listen_list_lock);
3250	spin_lock_init(&cm_core->apbvt_lock);
3251
3252	cm_core->event_wq = alloc_ordered_workqueue("iwewq",
3253						    WQ_MEM_RECLAIM);
3254	if (!cm_core->event_wq)
3255		goto error;
3256
3257	cm_core->disconn_wq = alloc_ordered_workqueue("iwdwq",
3258						      WQ_MEM_RECLAIM);
3259	if (!cm_core->disconn_wq)
3260		goto error;
3261
3262	return 0;
3263error:
3264	i40iw_cleanup_cm_core(&iwdev->cm_core);
3265
3266	return -ENOMEM;
3267}
3268
3269/**
3270 * i40iw_cleanup_cm_core - deallocate a top level instance of a
3271 * cm core
3272 * @cm_core: cm's core
3273 */
3274void i40iw_cleanup_cm_core(struct i40iw_cm_core *cm_core)
3275{
3276	unsigned long flags;
3277
3278	if (!cm_core)
3279		return;
3280
3281	spin_lock_irqsave(&cm_core->ht_lock, flags);
3282	if (timer_pending(&cm_core->tcp_timer))
3283		del_timer_sync(&cm_core->tcp_timer);
3284	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3285
3286	if (cm_core->event_wq)
3287		destroy_workqueue(cm_core->event_wq);
3288	if (cm_core->disconn_wq)
3289		destroy_workqueue(cm_core->disconn_wq);
3290}
3291
3292/**
3293 * i40iw_init_tcp_ctx - setup qp context
3294 * @cm_node: connection's node
3295 * @tcp_info: offload info for tcp
3296 * @iwqp: associate qp for the connection
3297 */
3298static void i40iw_init_tcp_ctx(struct i40iw_cm_node *cm_node,
3299			       struct i40iw_tcp_offload_info *tcp_info,
3300			       struct i40iw_qp *iwqp)
3301{
3302	tcp_info->ipv4 = cm_node->ipv4;
3303	tcp_info->drop_ooo_seg = true;
3304	tcp_info->wscale = true;
3305	tcp_info->ignore_tcp_opt = true;
3306	tcp_info->ignore_tcp_uns_opt = true;
3307	tcp_info->no_nagle = false;
3308
3309	tcp_info->ttl = I40IW_DEFAULT_TTL;
3310	tcp_info->rtt_var = cpu_to_le32(I40IW_DEFAULT_RTT_VAR);
3311	tcp_info->ss_thresh = cpu_to_le32(I40IW_DEFAULT_SS_THRESH);
3312	tcp_info->rexmit_thresh = I40IW_DEFAULT_REXMIT_THRESH;
3313
3314	tcp_info->tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3315	tcp_info->snd_wscale = cm_node->tcp_cntxt.snd_wscale;
3316	tcp_info->rcv_wscale = cm_node->tcp_cntxt.rcv_wscale;
3317
3318	tcp_info->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3319	tcp_info->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
3320	tcp_info->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3321	tcp_info->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3322
3323	tcp_info->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3324	tcp_info->cwnd = cpu_to_le32(2 * cm_node->tcp_cntxt.mss);
3325	tcp_info->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3326	tcp_info->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3327	tcp_info->max_snd_window = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
3328	tcp_info->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
3329					cm_node->tcp_cntxt.rcv_wscale);
3330
3331	tcp_info->flow_label = 0;
3332	tcp_info->snd_mss = cpu_to_le32(((u32)cm_node->tcp_cntxt.mss));
3333	if (cm_node->vlan_id <= VLAN_VID_MASK) {
3334		tcp_info->insert_vlan_tag = true;
3335		tcp_info->vlan_tag = cpu_to_le16(((u16)cm_node->user_pri << I40IW_VLAN_PRIO_SHIFT) |
3336						  cm_node->vlan_id);
3337	}
3338	if (cm_node->ipv4) {
3339		tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3340		tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3341
3342		tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[0]);
3343		tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[0]);
3344		tcp_info->arp_idx =
3345			cpu_to_le16((u16)i40iw_arp_table(
3346							 iwqp->iwdev,
3347							 &tcp_info->dest_ip_addr3,
3348							 true,
3349							 NULL,
3350							 I40IW_ARP_RESOLVE));
3351	} else {
3352		tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3353		tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3354		tcp_info->dest_ip_addr0 = cpu_to_le32(cm_node->rem_addr[0]);
3355		tcp_info->dest_ip_addr1 = cpu_to_le32(cm_node->rem_addr[1]);
3356		tcp_info->dest_ip_addr2 = cpu_to_le32(cm_node->rem_addr[2]);
3357		tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[3]);
3358		tcp_info->local_ipaddr0 = cpu_to_le32(cm_node->loc_addr[0]);
3359		tcp_info->local_ipaddr1 = cpu_to_le32(cm_node->loc_addr[1]);
3360		tcp_info->local_ipaddr2 = cpu_to_le32(cm_node->loc_addr[2]);
3361		tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[3]);
3362		tcp_info->arp_idx =
3363			cpu_to_le16((u16)i40iw_arp_table(
3364							 iwqp->iwdev,
3365							 &tcp_info->dest_ip_addr0,
3366							 false,
3367							 NULL,
3368							 I40IW_ARP_RESOLVE));
3369	}
3370}
3371
3372/**
3373 * i40iw_cm_init_tsa_conn - setup qp for RTS
3374 * @iwqp: associate qp for the connection
3375 * @cm_node: connection's node
3376 */
3377static void i40iw_cm_init_tsa_conn(struct i40iw_qp *iwqp,
3378				   struct i40iw_cm_node *cm_node)
3379{
3380	struct i40iw_tcp_offload_info tcp_info;
3381	struct i40iwarp_offload_info *iwarp_info;
3382	struct i40iw_qp_host_ctx_info *ctx_info;
3383	struct i40iw_device *iwdev = iwqp->iwdev;
3384	struct i40iw_sc_dev *dev = &iwqp->iwdev->sc_dev;
3385
3386	memset(&tcp_info, 0x00, sizeof(struct i40iw_tcp_offload_info));
3387	iwarp_info = &iwqp->iwarp_info;
3388	ctx_info = &iwqp->ctx_info;
3389
3390	ctx_info->tcp_info = &tcp_info;
3391	ctx_info->send_cq_num = iwqp->iwscq->sc_cq.cq_uk.cq_id;
3392	ctx_info->rcv_cq_num = iwqp->iwrcq->sc_cq.cq_uk.cq_id;
3393
3394	iwarp_info->ord_size = cm_node->ord_size;
3395	iwarp_info->ird_size = i40iw_derive_hw_ird_setting(cm_node->ird_size);
3396
3397	if (iwarp_info->ord_size == 1)
3398		iwarp_info->ord_size = 2;
3399
3400	iwarp_info->rd_enable = true;
3401	iwarp_info->rdmap_ver = 1;
3402	iwarp_info->ddp_ver = 1;
3403
3404	iwarp_info->pd_id = iwqp->iwpd->sc_pd.pd_id;
3405
3406	ctx_info->tcp_info_valid = true;
3407	ctx_info->iwarp_info_valid = true;
3408	ctx_info->add_to_qoslist = true;
3409	ctx_info->user_pri = cm_node->user_pri;
3410
3411	i40iw_init_tcp_ctx(cm_node, &tcp_info, iwqp);
3412	if (cm_node->snd_mark_en) {
3413		iwarp_info->snd_mark_en = true;
3414		iwarp_info->snd_mark_offset = (tcp_info.snd_nxt &
3415				SNDMARKER_SEQNMASK) + cm_node->lsmm_size;
3416	}
3417
3418	cm_node->state = I40IW_CM_STATE_OFFLOADED;
3419	tcp_info.tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3420	tcp_info.src_mac_addr_idx = iwdev->mac_ip_table_idx;
3421	tcp_info.tos = cm_node->tos;
3422
3423	dev->iw_priv_qp_ops->qp_setctx(&iwqp->sc_qp, (u64 *)(iwqp->host_ctx.va), ctx_info);
3424
3425	/* once tcp_info is set, no need to do it again */
3426	ctx_info->tcp_info_valid = false;
3427	ctx_info->iwarp_info_valid = false;
3428	ctx_info->add_to_qoslist = false;
3429}
3430
3431/**
3432 * i40iw_cm_disconn - when a connection is being closed
3433 * @iwqp: associate qp for the connection
3434 */
3435void i40iw_cm_disconn(struct i40iw_qp *iwqp)
3436{
3437	struct disconn_work *work;
3438	struct i40iw_device *iwdev = iwqp->iwdev;
3439	struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3440	unsigned long flags;
3441
3442	work = kzalloc(sizeof(*work), GFP_ATOMIC);
3443	if (!work)
3444		return;	/* Timer will clean up */
3445
3446	spin_lock_irqsave(&iwdev->qptable_lock, flags);
3447	if (!iwdev->qp_table[iwqp->ibqp.qp_num]) {
3448		spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3449		i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
3450			    "%s qp_id %d is already freed\n",
3451			     __func__, iwqp->ibqp.qp_num);
3452		kfree(work);
3453		return;
3454	}
3455	i40iw_qp_add_ref(&iwqp->ibqp);
3456	spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3457
3458	work->iwqp = iwqp;
3459	INIT_WORK(&work->work, i40iw_disconnect_worker);
3460	queue_work(cm_core->disconn_wq, &work->work);
3461	return;
3462}
3463
3464/**
3465 * i40iw_qp_disconnect - free qp and close cm
3466 * @iwqp: associate qp for the connection
3467 */
3468static void i40iw_qp_disconnect(struct i40iw_qp *iwqp)
3469{
3470	struct i40iw_device *iwdev;
3471	struct i40iw_ib_device *iwibdev;
3472
3473	iwdev = to_iwdev(iwqp->ibqp.device);
3474	if (!iwdev) {
3475		i40iw_pr_err("iwdev == NULL\n");
3476		return;
3477	}
3478
3479	iwibdev = iwdev->iwibdev;
3480
3481	if (iwqp->active_conn) {
3482		/* indicate this connection is NOT active */
3483		iwqp->active_conn = 0;
3484	} else {
3485		/* Need to free the Last Streaming Mode Message */
3486		if (iwqp->ietf_mem.va) {
3487			if (iwqp->lsmm_mr)
3488				iwibdev->ibdev.ops.dereg_mr(iwqp->lsmm_mr,
3489							    NULL);
3490			i40iw_free_dma_mem(iwdev->sc_dev.hw, &iwqp->ietf_mem);
3491		}
3492	}
3493
3494	/* close the CM node down if it is still active */
3495	if (iwqp->cm_node) {
3496		i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "%s Call close API\n", __func__);
3497		i40iw_cm_close(iwqp->cm_node);
3498	}
3499}
3500
/**
 * i40iw_cm_disconn_true - called by worker thread to disconnect qp
 * @iwqp: associate qp for the connection
 *
 * Under iwqp->lock, snapshots the QP's hardware TCP state, IB QP state and
 * last asynchronous event, and from them decides which of three actions
 * are needed: flushing the work queues, sending IW_CM_EVENT_DISCONNECT,
 * and closing the connection (IW_CM_EVENT_CLOSE plus dropping a cm_id
 * reference).  The actions themselves run after the lock is released.
 */
static void i40iw_cm_disconn_true(struct i40iw_qp *iwqp)
{
	struct iw_cm_id *cm_id;
	struct i40iw_device *iwdev;
	struct i40iw_sc_qp *qp = &iwqp->sc_qp;
	u16 last_ae;
	u8 original_hw_tcp_state;
	u8 original_ibqp_state;
	int disconn_status = 0;
	int issue_disconn = 0;
	int issue_close = 0;
	int issue_flush = 0;
	struct ib_event ibevent;
	unsigned long flags;
	int ret;

	if (!iwqp) {
		i40iw_pr_err("iwqp == NULL\n");
		return;
	}

	spin_lock_irqsave(&iwqp->lock, flags);
	/*
	 * Keep a local copy of cm_id: iwqp->cm_id may be cleared below, but
	 * the events sent after the unlock still use this copy.
	 */
	cm_id = iwqp->cm_id;
	/* make sure we haven't already closed this connection */
	if (!cm_id) {
		spin_unlock_irqrestore(&iwqp->lock, flags);
		return;
	}

	iwdev = to_iwdev(iwqp->ibqp.device);

	original_hw_tcp_state = iwqp->hw_tcp_state;
	original_ibqp_state = iwqp->ibqp_state;
	last_ae = iwqp->last_aeq;

	if (qp->term_flags) {
		/* terminate in progress: disconnect, close and flush */
		issue_disconn = 1;
		issue_close = 1;
		iwqp->cm_id = NULL;
		/*
		 * When the term timer expires after cm_timer, we don't want
		 * the terminate handler to issue cm_disconn, which can
		 * re-free a QP even after its refcnt=0.
		 */
		i40iw_terminate_del_timer(qp);
		if (!iwqp->flush_issued) {
			iwqp->flush_issued = 1;
			issue_flush = 1;
		}
	} else if ((original_hw_tcp_state == I40IW_TCP_STATE_CLOSE_WAIT) ||
		   ((original_ibqp_state == IB_QPS_RTS) &&
		    (last_ae == I40IW_AE_LLP_CONNECTION_RESET))) {
		issue_disconn = 1;
		/* a connection reset is reported as -ECONNRESET */
		if (last_ae == I40IW_AE_LLP_CONNECTION_RESET)
			disconn_status = -ECONNRESET;
	}

	/*
	 * Independently of the branch above, any of these conditions also
	 * requests a close (and a flush if none has been issued yet).
	 */
	if (((original_hw_tcp_state == I40IW_TCP_STATE_CLOSED) ||
	     (original_hw_tcp_state == I40IW_TCP_STATE_TIME_WAIT) ||
	     (last_ae == I40IW_AE_RDMAP_ROE_BAD_LLP_CLOSE) ||
	     (last_ae == I40IW_AE_LLP_CONNECTION_RESET) ||
	      iwdev->reset)) {
		issue_close = 1;
		iwqp->cm_id = NULL;
		if (!iwqp->flush_issued) {
			iwqp->flush_issued = 1;
			issue_flush = 1;
		}
	}

	spin_unlock_irqrestore(&iwqp->lock, flags);
	if (issue_flush && !iwqp->destroyed) {
		/* Flush the queues */
		i40iw_flush_wqes(iwdev, iwqp);

		/* on terminate, also raise an IB event if a handler is registered */
		if (qp->term_flags && iwqp->ibqp.event_handler) {
			ibevent.device = iwqp->ibqp.device;
			ibevent.event = (qp->eventtype == TERM_EVENT_QP_FATAL) ?
					IB_EVENT_QP_FATAL : IB_EVENT_QP_ACCESS_ERR;
			ibevent.element.qp = &iwqp->ibqp;
			iwqp->ibqp.event_handler(&ibevent, iwqp->ibqp.qp_context);
		}
	}

	/* cm_id is known non-NULL here (checked under the lock above) */
	if (cm_id && cm_id->event_handler) {
		if (issue_disconn) {
			ret = i40iw_send_cm_event(NULL,
						  cm_id,
						  IW_CM_EVENT_DISCONNECT,
						  disconn_status);

			if (ret)
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "disconnect event failed %s: - cm_id = %p\n",
					    __func__, cm_id);
		}
		if (issue_close) {
			i40iw_qp_disconnect(iwqp);
			cm_id->provider_data = iwqp;
			ret = i40iw_send_cm_event(NULL, cm_id, IW_CM_EVENT_CLOSE, 0);
			if (ret)
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "close event failed %s: - cm_id = %p\n",
					    __func__, cm_id);
			/* drop a cm_id reference after the CLOSE event has been sent */
			cm_id->rem_ref(cm_id);
		}
	}
}
3614
3615/**
3616 * i40iw_disconnect_worker - worker for connection close
3617 * @work: points or disconn structure
3618 */
3619static void i40iw_disconnect_worker(struct work_struct *work)
3620{
3621	struct disconn_work *dwork = container_of(work, struct disconn_work, work);
3622	struct i40iw_qp *iwqp = dwork->iwqp;
3623
3624	kfree(dwork);
3625	i40iw_cm_disconn_true(iwqp);
3626	i40iw_qp_rem_ref(&iwqp->ibqp);
3627}
3628
/**
 * i40iw_accept - registered call for connection to be accepted
 * @cm_id: cm information for passive connection
 * @conn_param: accept parameters
 *
 * Binds the QP named by @conn_param->qpn to the cm_node stored in
 * @cm_id->provider_data, builds the MPA reply frame (with the caller's
 * private data appended) in a DMA buffer, posts it through the
 * qp_send_lsmm op, sets up the QP context, moves the QP to RTS and
 * reports IW_CM_EVENT_ESTABLISHED.
 *
 * Return: 0 on success; -EINVAL if the QP is not found or the listener
 * was destroyed; -ECONNRESET if passive_state reaches
 * I40IW_SEND_RESET_EVENT; -ENOMEM if the DMA buffer or memory region
 * cannot be set up.
 */
int i40iw_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
{
	struct ib_qp *ibqp;
	struct i40iw_qp *iwqp;
	struct i40iw_device *iwdev;
	struct i40iw_sc_dev *dev;
	struct i40iw_cm_core *cm_core;
	struct i40iw_cm_node *cm_node;
	struct ib_qp_attr attr;
	int passive_state;
	struct ib_mr *ibmr;
	struct i40iw_pd *iwpd;
	u16 buf_len = 0;
	struct i40iw_kmem_info accept;
	enum i40iw_status_code status;
	u64 tagged_offset;
	unsigned long flags;

	memset(&attr, 0, sizeof(attr));
	ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
	if (!ibqp)
		return -EINVAL;

	iwqp = to_iwqp(ibqp);
	iwdev = iwqp->iwdev;
	dev = &iwdev->sc_dev;
	cm_core = &iwdev->cm_core;
	cm_node = (struct i40iw_cm_node *)cm_id->provider_data;

	/* refresh the address family and VLAN id from the local address */
	if (((struct sockaddr_in *)&cm_id->local_addr)->sin_family == AF_INET) {
		cm_node->ipv4 = true;
		cm_node->vlan_id = i40iw_get_vlan_ipv4(cm_node->loc_addr);
	} else {
		cm_node->ipv4 = false;
		i40iw_netdev_vlan_ipv6(cm_node->loc_addr, &cm_node->vlan_id);
	}
	i40iw_debug(cm_node->dev,
		    I40IW_DEBUG_CM,
		    "Accept vlan_id=%d\n",
		    cm_node->vlan_id);
	/* listener is gone: drop the node (and its loopback partner) and fail */
	if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
		if (cm_node->loopbackpartner)
			i40iw_rem_ref_cm_node(cm_node->loopbackpartner);
		i40iw_rem_ref_cm_node(cm_node);
		return -EINVAL;
	}

	passive_state = atomic_add_return(1, &cm_node->passive_state);
	if (passive_state == I40IW_SEND_RESET_EVENT) {
		i40iw_rem_ref_cm_node(cm_node);
		return -ECONNRESET;
	}

	cm_node->cm_core->stats_accepts++;
	iwqp->cm_node = (void *)cm_node;
	cm_node->iwqp = iwqp;

	/* room for the MPA header plus the caller's private data */
	buf_len = conn_param->private_data_len + I40IW_MAX_IETF_SIZE;

	status = i40iw_allocate_dma_mem(dev->hw, &iwqp->ietf_mem, buf_len, 1);

	/*
	 * NOTE(review): on this failure iwqp->cm_node and cm_node->iwqp stay
	 * linked and no cm_node reference is dropped here - confirm the
	 * caller's cleanup covers it.
	 */
	if (status)
		return -ENOMEM;
	cm_node->pdata.size = conn_param->private_data_len;
	accept.addr = iwqp->ietf_mem.va;
	accept.size = i40iw_cm_build_mpa_frame(cm_node, &accept, MPA_KEY_REPLY);
	/* private data follows directly after the MPA frame */
	memcpy(accept.addr + accept.size, conn_param->private_data,
	       conn_param->private_data_len);

	/* setup our first outgoing iWarp send WQE (the IETF frame response) */
	if ((cm_node->ipv4 &&
	     !i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
	    (!cm_node->ipv4 &&
	     !i40iw_ipv6_is_loopback(cm_node->loc_addr, cm_node->rem_addr))) {
		/* non-loopback: register the buffer and send the frame from it */
		iwpd = iwqp->iwpd;
		tagged_offset = (uintptr_t)iwqp->ietf_mem.va;
		ibmr = i40iw_reg_phys_mr(&iwpd->ibpd,
					 iwqp->ietf_mem.pa,
					 buf_len,
					 IB_ACCESS_LOCAL_WRITE,
					 &tagged_offset);
		if (IS_ERR(ibmr)) {
			i40iw_free_dma_mem(dev->hw, &iwqp->ietf_mem);
			return -ENOMEM;
		}

		ibmr->pd = &iwpd->ibpd;
		ibmr->device = iwpd->ibpd.device;
		iwqp->lsmm_mr = ibmr;
		if (iwqp->page)
			iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
		dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp,
							iwqp->ietf_mem.va,
							(accept.size + conn_param->private_data_len),
							ibmr->lkey);

	} else {
		/* loopback: the op is called with no buffer, zero size and lkey 0 */
		if (iwqp->page)
			iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
		dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp, NULL, 0, 0);
	}

	/* undo the kmap() done in either branch above */
	if (iwqp->page)
		kunmap(iwqp->page);

	iwqp->cm_id = cm_id;
	cm_node->cm_id = cm_id;

	/* from here on provider_data refers to the QP rather than the cm_node */
	cm_id->provider_data = (void *)iwqp;
	iwqp->active_conn = 0;

	cm_node->lsmm_size = accept.size + conn_param->private_data_len;
	i40iw_cm_init_tsa_conn(iwqp, cm_node);
	cm_id->add_ref(cm_id);
	i40iw_qp_add_ref(&iwqp->ibqp);

	attr.qp_state = IB_QPS_RTS;
	cm_node->qhash_set = false;
	i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);

	/* move the node onto the accelerated list under ht_lock */
	cm_node->accelerated = true;
	spin_lock_irqsave(&cm_core->ht_lock, flags);
	list_move_tail(&cm_node->list, &cm_core->accelerated_list);
	spin_unlock_irqrestore(&cm_core->ht_lock, flags);

	/* a failure to deliver the event is only logged */
	status =
		i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_ESTABLISHED, 0);
	if (status)
		i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - ESTABLISHED\n");

	if (cm_node->loopbackpartner) {
		cm_node->loopbackpartner->pdata.size = conn_param->private_data_len;

		/* copy the accept private data into the loopback partner's buffer */
		memcpy(cm_node->loopbackpartner->pdata_buf,
		       conn_param->private_data,
		       conn_param->private_data_len);
		i40iw_create_event(cm_node->loopbackpartner, I40IW_CM_EVENT_CONNECTED);
	}

	/* this accept is no longer pending on the listener */
	if (cm_node->accept_pend) {
		atomic_dec(&cm_node->listener->pend_accepts_cnt);
		cm_node->accept_pend = 0;
	}
	return 0;
}
3780
3781/**
3782 * i40iw_reject - registered call for connection to be rejected
3783 * @cm_id: cm information for passive connection
3784 * @pdata: private data to be sent
3785 * @pdata_len: private data length
3786 */
3787int i40iw_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
3788{
3789	struct i40iw_device *iwdev;
3790	struct i40iw_cm_node *cm_node;
3791	struct i40iw_cm_node *loopback;
3792
3793	cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3794	loopback = cm_node->loopbackpartner;
3795	cm_node->cm_id = cm_id;
3796	cm_node->pdata.size = pdata_len;
3797
3798	iwdev = to_iwdev(cm_id->device);
3799	if (!iwdev)
3800		return -EINVAL;
3801	cm_node->cm_core->stats_rejects++;
3802
3803	if (pdata_len + sizeof(struct ietf_mpa_v2) > MAX_CM_BUFFER)
3804		return -EINVAL;
3805
3806	if (loopback) {
3807		memcpy(&loopback->pdata_buf, pdata, pdata_len);
3808		loopback->pdata.size = pdata_len;
3809	}
3810
3811	return i40iw_cm_reject(cm_node, pdata, pdata_len);
3812}
3813
3814/**
3815 * i40iw_connect - registered call for connection to be established
3816 * @cm_id: cm information for passive connection
3817 * @conn_param: Information about the connection
3818 */
3819int i40iw_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3820{
3821	struct ib_qp *ibqp;
3822	struct i40iw_qp *iwqp;
3823	struct i40iw_device *iwdev;
3824	struct i40iw_cm_node *cm_node;
3825	struct i40iw_cm_info cm_info;
3826	struct sockaddr_in *laddr;
3827	struct sockaddr_in *raddr;
3828	struct sockaddr_in6 *laddr6;
3829	struct sockaddr_in6 *raddr6;
3830	int ret = 0;
3831
3832	ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3833	if (!ibqp)
3834		return -EINVAL;
3835	iwqp = to_iwqp(ibqp);
3836	if (!iwqp)
3837		return -EINVAL;
3838	iwdev = to_iwdev(iwqp->ibqp.device);
3839	if (!iwdev)
3840		return -EINVAL;
3841
3842	laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3843	raddr = (struct sockaddr_in *)&cm_id->m_remote_addr;
3844	laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3845	raddr6 = (struct sockaddr_in6 *)&cm_id->m_remote_addr;
3846
3847	if (!(laddr->sin_port) || !(raddr->sin_port))
3848		return -EINVAL;
3849
3850	iwqp->active_conn = 1;
3851	iwqp->cm_id = NULL;
3852	cm_id->provider_data = iwqp;
3853
3854	/* set up the connection params for the node */
3855	if (cm_id->remote_addr.ss_family == AF_INET) {
3856		cm_info.ipv4 = true;
3857		memset(cm_info.loc_addr, 0, sizeof(cm_info.loc_addr));
3858		memset(cm_info.rem_addr, 0, sizeof(cm_info.rem_addr));
3859		cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3860		cm_info.rem_addr[0] = ntohl(raddr->sin_addr.s_addr);
3861		cm_info.loc_port = ntohs(laddr->sin_port);
3862		cm_info.rem_port = ntohs(raddr->sin_port);
3863		cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3864	} else {
3865		cm_info.ipv4 = false;
3866		i40iw_copy_ip_ntohl(cm_info.loc_addr,
3867				    laddr6->sin6_addr.in6_u.u6_addr32);
3868		i40iw_copy_ip_ntohl(cm_info.rem_addr,
3869				    raddr6->sin6_addr.in6_u.u6_addr32);
3870		cm_info.loc_port = ntohs(laddr6->sin6_port);
3871		cm_info.rem_port = ntohs(raddr6->sin6_port);
3872		i40iw_netdev_vlan_ipv6(cm_info.loc_addr, &cm_info.vlan_id);
3873	}
3874	cm_info.cm_id = cm_id;
3875	cm_info.tos = cm_id->tos;
3876	cm_info.user_pri = rt_tos2priority(cm_id->tos);
3877	i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "%s TOS:[%d] UP:[%d]\n",
3878		    __func__, cm_id->tos, cm_info.user_pri);
3879	cm_id->add_ref(cm_id);
3880	cm_node = i40iw_create_cm_node(&iwdev->cm_core, iwdev,
3881				       conn_param, &cm_info);
3882
3883	if (IS_ERR(cm_node)) {
3884		ret = PTR_ERR(cm_node);
3885		cm_id->rem_ref(cm_id);
3886		return ret;
3887	}
3888
3889	if ((cm_info.ipv4 && (laddr->sin_addr.s_addr != raddr->sin_addr.s_addr)) ||
3890	    (!cm_info.ipv4 && memcmp(laddr6->sin6_addr.in6_u.u6_addr32,
3891				     raddr6->sin6_addr.in6_u.u6_addr32,
3892				     sizeof(laddr6->sin6_addr.in6_u.u6_addr32)))) {
3893		if (i40iw_manage_qhash(iwdev, &cm_info, I40IW_QHASH_TYPE_TCP_ESTABLISHED,
3894				       I40IW_QHASH_MANAGE_TYPE_ADD, NULL, true)) {
3895			ret = -EINVAL;
3896			goto err;
3897		}
3898		cm_node->qhash_set = true;
3899	}
3900
3901	if (i40iw_manage_apbvt(iwdev, cm_info.loc_port,
3902			       I40IW_MANAGE_APBVT_ADD)) {
3903		ret =  -EINVAL;
3904		goto err;
3905	}
3906
3907	cm_node->apbvt_set = true;
3908	iwqp->cm_node = cm_node;
3909	cm_node->iwqp = iwqp;
3910	iwqp->cm_id = cm_id;
3911	i40iw_qp_add_ref(&iwqp->ibqp);
3912
3913	if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
3914		cm_node->state = I40IW_CM_STATE_SYN_SENT;
3915		ret = i40iw_send_syn(cm_node, 0);
3916		if (ret)
3917			goto err;
3918	}
3919
3920	if (cm_node->loopbackpartner) {
3921		cm_node->loopbackpartner->state = I40IW_CM_STATE_MPAREQ_RCVD;
3922		i40iw_create_event(cm_node->loopbackpartner,
3923				   I40IW_CM_EVENT_MPA_REQ);
3924	}
3925
3926	i40iw_debug(cm_node->dev,
3927		    I40IW_DEBUG_CM,
3928		    "Api - connect(): port=0x%04x, cm_node=%p, cm_id = %p.\n",
3929		    cm_node->rem_port,
3930		    cm_node,
3931		    cm_node->cm_id);
3932
3933	return 0;
3934
3935err:
3936	if (cm_info.ipv4)
3937		i40iw_debug(&iwdev->sc_dev,
3938			    I40IW_DEBUG_CM,
3939			    "Api - connect() FAILED: dest addr=%pI4",
3940			    cm_info.rem_addr);
3941	else
3942		i40iw_debug(&iwdev->sc_dev,
3943			    I40IW_DEBUG_CM,
3944			    "Api - connect() FAILED: dest addr=%pI6",
3945			    cm_info.rem_addr);
3946
3947	i40iw_rem_ref_cm_node(cm_node);
3948	cm_id->rem_ref(cm_id);
3949	iwdev->cm_core.stats_connect_errs++;
3950	return ret;
3951}
3952
3953/**
3954 * i40iw_create_listen - registered call creating listener
3955 * @cm_id: cm information for passive connection
3956 * @backlog: to max accept pending count
3957 */
3958int i40iw_create_listen(struct iw_cm_id *cm_id, int backlog)
3959{
3960	struct i40iw_device *iwdev;
3961	struct i40iw_cm_listener *cm_listen_node;
3962	struct i40iw_cm_info cm_info;
3963	enum i40iw_status_code ret;
3964	struct sockaddr_in *laddr;
3965	struct sockaddr_in6 *laddr6;
3966	bool wildcard = false;
3967
3968	iwdev = to_iwdev(cm_id->device);
3969	if (!iwdev)
3970		return -EINVAL;
3971
3972	laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3973	laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3974	memset(&cm_info, 0, sizeof(cm_info));
3975	if (laddr->sin_family == AF_INET) {
3976		cm_info.ipv4 = true;
3977		cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3978		cm_info.loc_port = ntohs(laddr->sin_port);
3979
3980		if (laddr->sin_addr.s_addr != INADDR_ANY)
3981			cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3982		else
3983			wildcard = true;
3984
3985	} else {
3986		cm_info.ipv4 = false;
3987		i40iw_copy_ip_ntohl(cm_info.loc_addr,
3988				    laddr6->sin6_addr.in6_u.u6_addr32);
3989		cm_info.loc_port = ntohs(laddr6->sin6_port);
3990		if (ipv6_addr_type(&laddr6->sin6_addr) != IPV6_ADDR_ANY)
3991			i40iw_netdev_vlan_ipv6(cm_info.loc_addr,
3992					       &cm_info.vlan_id);
3993		else
3994			wildcard = true;
3995	}
3996	cm_info.backlog = backlog;
3997	cm_info.cm_id = cm_id;
3998
3999	cm_listen_node = i40iw_make_listen_node(&iwdev->cm_core, iwdev, &cm_info);
4000	if (!cm_listen_node) {
4001		i40iw_pr_err("cm_listen_node == NULL\n");
4002		return -ENOMEM;
4003	}
4004
4005	cm_id->provider_data = cm_listen_node;
4006
4007	cm_listen_node->tos = cm_id->tos;
4008	cm_listen_node->user_pri = rt_tos2priority(cm_id->tos);
4009	cm_info.user_pri = cm_listen_node->user_pri;
4010
4011	if (!cm_listen_node->reused_node) {
4012		if (wildcard) {
4013			if (cm_info.ipv4)
4014				ret = i40iw_add_mqh_4(iwdev,
4015						      &cm_info,
4016						      cm_listen_node);
4017			else
4018				ret = i40iw_add_mqh_6(iwdev,
4019						      &cm_info,
4020						      cm_listen_node);
4021			if (ret)
4022				goto error;
4023
4024			ret = i40iw_manage_apbvt(iwdev,
4025						 cm_info.loc_port,
4026						 I40IW_MANAGE_APBVT_ADD);
4027
4028			if (ret)
4029				goto error;
4030		} else {
4031			ret = i40iw_manage_qhash(iwdev,
4032						 &cm_info,
4033						 I40IW_QHASH_TYPE_TCP_SYN,
4034						 I40IW_QHASH_MANAGE_TYPE_ADD,
4035						 NULL,
4036						 true);
4037			if (ret)
4038				goto error;
4039			cm_listen_node->qhash_set = true;
4040			ret = i40iw_manage_apbvt(iwdev,
4041						 cm_info.loc_port,
4042						 I40IW_MANAGE_APBVT_ADD);
4043			if (ret)
4044				goto error;
4045		}
4046	}
4047	cm_id->add_ref(cm_id);
4048	cm_listen_node->cm_core->stats_listen_created++;
4049	return 0;
4050 error:
4051	i40iw_cm_del_listen(&iwdev->cm_core, (void *)cm_listen_node, false);
4052	return -EINVAL;
4053}
4054
4055/**
4056 * i40iw_destroy_listen - registered call to destroy listener
4057 * @cm_id: cm information for passive connection
4058 */
4059int i40iw_destroy_listen(struct iw_cm_id *cm_id)
4060{
4061	struct i40iw_device *iwdev;
4062
4063	iwdev = to_iwdev(cm_id->device);
4064	if (cm_id->provider_data)
4065		i40iw_cm_del_listen(&iwdev->cm_core, cm_id->provider_data, true);
4066	else
4067		i40iw_pr_err("cm_id->provider_data was NULL\n");
4068
4069	cm_id->rem_ref(cm_id);
4070
4071	return 0;
4072}
4073
4074/**
4075 * i40iw_cm_event_connected - handle connected active node
4076 * @event: the info for cm_node of connection
4077 */
4078static void i40iw_cm_event_connected(struct i40iw_cm_event *event)
4079{
4080	struct i40iw_qp *iwqp;
4081	struct i40iw_device *iwdev;
4082	struct i40iw_cm_core *cm_core;
4083	struct i40iw_cm_node *cm_node;
4084	struct i40iw_sc_dev *dev;
4085	struct ib_qp_attr attr;
4086	struct iw_cm_id *cm_id;
4087	unsigned long flags;
4088	int status;
4089	bool read0;
4090
4091	cm_node = event->cm_node;
4092	cm_id = cm_node->cm_id;
4093	iwqp = (struct i40iw_qp *)cm_id->provider_data;
4094	iwdev = to_iwdev(iwqp->ibqp.device);
4095	dev = &iwdev->sc_dev;
4096	cm_core = &iwdev->cm_core;
4097
4098	if (iwqp->destroyed) {
4099		status = -ETIMEDOUT;
4100		goto error;
4101	}
4102	i40iw_cm_init_tsa_conn(iwqp, cm_node);
4103	read0 = (cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO);
4104	if (iwqp->page)
4105		iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
4106	dev->iw_priv_qp_ops->qp_send_rtt(&iwqp->sc_qp, read0);
4107	if (iwqp->page)
4108		kunmap(iwqp->page);
4109
4110	memset(&attr, 0, sizeof(attr));
4111	attr.qp_state = IB_QPS_RTS;
4112	cm_node->qhash_set = false;
4113	i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4114
4115	cm_node->accelerated = true;
4116	spin_lock_irqsave(&cm_core->ht_lock, flags);
4117	list_move_tail(&cm_node->list, &cm_core->accelerated_list);
4118	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4119	status = i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_CONNECT_REPLY,
4120				     0);
4121	if (status)
4122		i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - CONNECT_REPLY\n");
4123
4124	return;
4125
4126error:
4127	iwqp->cm_id = NULL;
4128	cm_id->provider_data = NULL;
4129	i40iw_send_cm_event(event->cm_node,
4130			    cm_id,
4131			    IW_CM_EVENT_CONNECT_REPLY,
4132			    status);
4133	cm_id->rem_ref(cm_id);
4134	i40iw_rem_ref_cm_node(event->cm_node);
4135}
4136
4137/**
4138 * i40iw_cm_event_reset - handle reset
4139 * @event: the info for cm_node of connection
4140 */
4141static void i40iw_cm_event_reset(struct i40iw_cm_event *event)
4142{
4143	struct i40iw_cm_node *cm_node = event->cm_node;
4144	struct iw_cm_id   *cm_id = cm_node->cm_id;
4145	struct i40iw_qp *iwqp;
4146
4147	if (!cm_id)
4148		return;
4149
4150	iwqp = cm_id->provider_data;
4151	if (!iwqp)
4152		return;
4153
4154	i40iw_debug(cm_node->dev,
4155		    I40IW_DEBUG_CM,
4156		    "reset event %p - cm_id = %p\n",
4157		     event->cm_node, cm_id);
4158	iwqp->cm_id = NULL;
4159
4160	i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_DISCONNECT, -ECONNRESET);
4161	i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_CLOSE, 0);
4162}
4163
/**
 * i40iw_cm_event_handler - worker thread callback to send event to cm upper layer
 * @work: pointer of cm event info.
 *
 * Dispatches on the event type, then drops one reference on the event's
 * cm_id and on its cm_node and frees the event. CONNECTED events are only
 * processed for nodes in the OFFLOADED state; MPA_REJECT and ABORTED events
 * are only processed for nodes that are not in that state. All three are
 * ignored when the cm_node has no cm_id.
 */
static void i40iw_cm_event_handler(struct work_struct *work)
{
	struct i40iw_cm_event *event;
	struct i40iw_cm_node *cm_node;

	event = container_of(work, struct i40iw_cm_event, event_work);
	if (!event)
		return;

	cm_node = event->cm_node;
	if (!cm_node || !cm_node->cm_core)
		return;

	switch (event->type) {
	case I40IW_CM_EVENT_CONNECTED:
		if (cm_node->cm_id &&
		    cm_node->state == I40IW_CM_STATE_OFFLOADED)
			i40iw_cm_event_connected(event);
		break;
	case I40IW_CM_EVENT_MPA_REQ:
		i40iw_send_cm_event(cm_node, cm_node->cm_id,
				    IW_CM_EVENT_CONNECT_REQUEST, 0);
		break;
	case I40IW_CM_EVENT_MPA_REJECT:
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_send_cm_event(cm_node, cm_node->cm_id,
					    IW_CM_EVENT_CONNECT_REPLY,
					    -ECONNREFUSED);
		break;
	case I40IW_CM_EVENT_ABORTED:
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_event_connect_error(event);
		break;
	case I40IW_CM_EVENT_RESET:
		i40iw_cm_event_reset(event);
		break;
	default:
		i40iw_pr_err("event type = %d\n", event->type);
		break;
	}

	/* release the references held for this queued event, then free it */
	event->cm_info.cm_id->rem_ref(event->cm_info.cm_id);
	i40iw_rem_ref_cm_node(event->cm_node);
	kfree(event);
}
4220
4221/**
4222 * i40iw_cm_post_event - queue event request for worker thread
4223 * @event: cm node's info for up event call
4224 */
4225static void i40iw_cm_post_event(struct i40iw_cm_event *event)
4226{
4227	atomic_inc(&event->cm_node->ref_count);
4228	event->cm_info.cm_id->add_ref(event->cm_info.cm_id);
4229	INIT_WORK(&event->event_work, i40iw_cm_event_handler);
4230
4231	queue_work(event->cm_node->cm_core->event_wq, &event->event_work);
4232}
4233
4234/**
4235 * i40iw_qhash_ctrl - enable/disable qhash for list
4236 * @iwdev: device pointer
4237 * @parent_listen_node: parent listen node
4238 * @nfo: cm info node
4239 * @ipaddr: Pointer to IPv4 or IPv6 address
4240 * @ipv4: flag indicating IPv4 when true
4241 * @ifup: flag indicating interface up when true
4242 *
4243 * Enables or disables the qhash for the node in the child
4244 * listen list that matches ipaddr. If no matching IP was found
4245 * it will allocate and add a new child listen node to the
4246 * parent listen node. The listen_list_lock is assumed to be
4247 * held when called.
4248 */
4249static void i40iw_qhash_ctrl(struct i40iw_device *iwdev,
4250			     struct i40iw_cm_listener *parent_listen_node,
4251			     struct i40iw_cm_info *nfo,
4252			     u32 *ipaddr, bool ipv4, bool ifup)
4253{
4254	struct list_head *child_listen_list = &parent_listen_node->child_listen_list;
4255	struct i40iw_cm_listener *child_listen_node;
4256	struct list_head *pos, *tpos;
4257	enum i40iw_status_code ret;
4258	bool node_allocated = false;
4259	enum i40iw_quad_hash_manage_type op =
4260		ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4261
4262	list_for_each_safe(pos, tpos, child_listen_list) {
4263		child_listen_node =
4264			list_entry(pos,
4265				   struct i40iw_cm_listener,
4266				   child_listen_list);
4267		if (!memcmp(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16))
4268			goto set_qhash;
4269	}
4270
4271	/* if not found then add a child listener if interface is going up */
4272	if (!ifup)
4273		return;
4274	child_listen_node = kmemdup(parent_listen_node,
4275			sizeof(*child_listen_node), GFP_ATOMIC);
4276	if (!child_listen_node)
4277		return;
4278	node_allocated = true;
4279
4280	memcpy(child_listen_node->loc_addr, ipaddr,  ipv4 ? 4 : 16);
4281
4282set_qhash:
4283	memcpy(nfo->loc_addr,
4284	       child_listen_node->loc_addr,
4285	       sizeof(nfo->loc_addr));
4286	nfo->vlan_id = child_listen_node->vlan_id;
4287	ret = i40iw_manage_qhash(iwdev, nfo,
4288				 I40IW_QHASH_TYPE_TCP_SYN,
4289				 op,
4290				 NULL, false);
4291	if (!ret) {
4292		child_listen_node->qhash_set = ifup;
4293		if (node_allocated)
4294			list_add(&child_listen_node->child_listen_list,
4295				 &parent_listen_node->child_listen_list);
4296	} else if (node_allocated) {
4297		kfree(child_listen_node);
4298	}
4299}
4300
4301/**
4302 * i40iw_cm_teardown_connections - teardown QPs
4303 * @iwdev: device pointer
4304 * @ipaddr: Pointer to IPv4 or IPv6 address
4305 * @ipv4: flag indicating IPv4 when true
4306 * @disconnect_all: flag indicating disconnect all QPs
4307 * teardown QPs where source or destination addr matches ip addr
4308 */
4309void i40iw_cm_teardown_connections(struct i40iw_device *iwdev, u32 *ipaddr,
4310				   struct i40iw_cm_info *nfo,
4311				   bool disconnect_all)
4312{
4313	struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4314	struct list_head *list_core_temp;
4315	struct list_head *list_node;
4316	struct i40iw_cm_node *cm_node;
4317	unsigned long flags;
4318	struct list_head teardown_list;
4319	struct ib_qp_attr attr;
4320
4321	INIT_LIST_HEAD(&teardown_list);
4322	spin_lock_irqsave(&cm_core->ht_lock, flags);
4323	list_for_each_safe(list_node, list_core_temp,
4324			   &cm_core->accelerated_list) {
4325		cm_node = container_of(list_node, struct i40iw_cm_node, list);
4326		if (disconnect_all ||
4327		    (nfo->vlan_id == cm_node->vlan_id &&
4328		    (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4329		     !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4330			atomic_inc(&cm_node->ref_count);
4331			list_add(&cm_node->teardown_entry, &teardown_list);
4332		}
4333	}
4334	list_for_each_safe(list_node, list_core_temp,
4335			   &cm_core->non_accelerated_list) {
4336		cm_node = container_of(list_node, struct i40iw_cm_node, list);
4337		if (disconnect_all ||
4338		    (nfo->vlan_id == cm_node->vlan_id &&
4339		    (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4340		     !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4341			atomic_inc(&cm_node->ref_count);
4342			list_add(&cm_node->teardown_entry, &teardown_list);
4343		}
4344	}
4345	spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4346
4347	list_for_each_safe(list_node, list_core_temp, &teardown_list) {
4348		cm_node = container_of(list_node, struct i40iw_cm_node,
4349				       teardown_entry);
4350		attr.qp_state = IB_QPS_ERR;
4351		i40iw_modify_qp(&cm_node->iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4352		if (iwdev->reset)
4353			i40iw_cm_disconn(cm_node->iwqp);
4354		i40iw_rem_ref_cm_node(cm_node);
4355	}
4356}
4357
4358/**
4359 * i40iw_ifdown_notify - process an ifdown on an interface
4360 * @iwdev: device pointer
4361 * @ipaddr: Pointer to IPv4 or IPv6 address
4362 * @ipv4: flag indicating IPv4 when true
4363 * @ifup: flag indicating interface up when true
4364 */
4365void i40iw_if_notify(struct i40iw_device *iwdev, struct net_device *netdev,
4366		     u32 *ipaddr, bool ipv4, bool ifup)
4367{
4368	struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4369	unsigned long flags;
4370	struct i40iw_cm_listener *listen_node;
4371	static const u32 ip_zero[4] = { 0, 0, 0, 0 };
4372	struct i40iw_cm_info nfo;
4373	u16 vlan_id = rdma_vlan_dev_vlan_id(netdev);
4374	enum i40iw_status_code ret;
4375	enum i40iw_quad_hash_manage_type op =
4376		ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4377
4378	nfo.vlan_id = vlan_id;
4379	nfo.ipv4 = ipv4;
4380
4381	/* Disable or enable qhash for listeners */
4382	spin_lock_irqsave(&cm_core->listen_list_lock, flags);
4383	list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
4384		if (vlan_id == listen_node->vlan_id &&
4385		    (!memcmp(listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16) ||
4386		    !memcmp(listen_node->loc_addr, ip_zero, ipv4 ? 4 : 16))) {
4387			memcpy(nfo.loc_addr, listen_node->loc_addr,
4388			       sizeof(nfo.loc_addr));
4389			nfo.loc_port = listen_node->loc_port;
4390			nfo.user_pri = listen_node->user_pri;
4391			if (!list_empty(&listen_node->child_listen_list)) {
4392				i40iw_qhash_ctrl(iwdev,
4393						 listen_node,
4394						 &nfo,
4395						 ipaddr, ipv4, ifup);
4396			} else if (memcmp(listen_node->loc_addr, ip_zero,
4397					  ipv4 ? 4 : 16)) {
4398				ret = i40iw_manage_qhash(iwdev,
4399							 &nfo,
4400							 I40IW_QHASH_TYPE_TCP_SYN,
4401							 op,
4402							 NULL,
4403							 false);
4404				if (!ret)
4405					listen_node->qhash_set = ifup;
4406			}
4407		}
4408	}
4409	spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
4410
4411	/* teardown connected qp's on ifdown */
4412	if (!ifup)
4413		i40iw_cm_teardown_connections(iwdev, ipaddr, &nfo, false);
4414}
4415