]> git.ipfire.org Git - thirdparty/linux.git/blob - drivers/infiniband/hw/i40iw/i40iw_cm.c
io_uring: reset -EBUSY error when io sq thread is waken up
[thirdparty/linux.git] / drivers / infiniband / hw / i40iw / i40iw_cm.c
1 /*******************************************************************************
2 *
3 * Copyright (c) 2015-2016 Intel Corporation. All rights reserved.
4 *
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenFabrics.org BSD license below:
10 *
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
14 *
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
18 *
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
23 *
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
32 *
33 *******************************************************************************/
34
35 #include <linux/atomic.h>
36 #include <linux/ip.h>
37 #include <linux/tcp.h>
38 #include <linux/init.h>
39 #include <linux/if_arp.h>
40 #include <linux/if_vlan.h>
41 #include <linux/notifier.h>
42 #include <linux/net.h>
43 #include <linux/types.h>
44 #include <linux/timer.h>
45 #include <linux/time.h>
46 #include <linux/delay.h>
47 #include <linux/etherdevice.h>
48 #include <linux/netdevice.h>
49 #include <linux/random.h>
50 #include <linux/list.h>
51 #include <linux/threads.h>
52 #include <linux/highmem.h>
53 #include <net/arp.h>
54 #include <net/ndisc.h>
55 #include <net/neighbour.h>
56 #include <net/route.h>
57 #include <net/addrconf.h>
58 #include <net/ip6_route.h>
59 #include <net/ip_fib.h>
60 #include <net/secure_seq.h>
61 #include <net/tcp.h>
62 #include <asm/checksum.h>
63
64 #include "i40iw.h"
65
66 static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *);
67 static void i40iw_cm_post_event(struct i40iw_cm_event *event);
68 static void i40iw_disconnect_worker(struct work_struct *work);
69
70 /**
71 * i40iw_free_sqbuf - put back puda buffer if refcount = 0
72 * @vsi: pointer to vsi structure
73 * @buf: puda buffer to free
74 */
75 void i40iw_free_sqbuf(struct i40iw_sc_vsi *vsi, void *bufp)
76 {
77 struct i40iw_puda_buf *buf = (struct i40iw_puda_buf *)bufp;
78 struct i40iw_puda_rsrc *ilq = vsi->ilq;
79
80 if (!atomic_dec_return(&buf->refcount))
81 i40iw_puda_ret_bufpool(ilq, buf);
82 }
83
84 /**
85 * i40iw_derive_hw_ird_setting - Calculate IRD
86 *
87 * @cm_ird: IRD of connection's node
88 *
89 * The ird from the connection is rounded to a supported HW
90 * setting (2,8,32,64) and then encoded for ird_size field of
91 * qp_ctx
92 */
93 static u8 i40iw_derive_hw_ird_setting(u16 cm_ird)
94 {
95 u8 encoded_ird_size;
96
97 /* ird_size field is encoded in qp_ctx */
98 switch (cm_ird ? roundup_pow_of_two(cm_ird) : 0) {
99 case I40IW_HW_IRD_SETTING_64:
100 encoded_ird_size = 3;
101 break;
102 case I40IW_HW_IRD_SETTING_32:
103 case I40IW_HW_IRD_SETTING_16:
104 encoded_ird_size = 2;
105 break;
106 case I40IW_HW_IRD_SETTING_8:
107 case I40IW_HW_IRD_SETTING_4:
108 encoded_ird_size = 1;
109 break;
110 case I40IW_HW_IRD_SETTING_2:
111 default:
112 encoded_ird_size = 0;
113 break;
114 }
115 return encoded_ird_size;
116 }
117
118 /**
119 * i40iw_record_ird_ord - Record IRD/ORD passed in
120 * @cm_node: connection's node
121 * @conn_ird: connection IRD
122 * @conn_ord: connection ORD
123 */
124 static void i40iw_record_ird_ord(struct i40iw_cm_node *cm_node, u32 conn_ird,
125 u32 conn_ord)
126 {
127 if (conn_ird > I40IW_MAX_IRD_SIZE)
128 conn_ird = I40IW_MAX_IRD_SIZE;
129
130 if (conn_ord > I40IW_MAX_ORD_SIZE)
131 conn_ord = I40IW_MAX_ORD_SIZE;
132 else if (!conn_ord && cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO)
133 conn_ord = 1;
134
135 cm_node->ird_size = conn_ird;
136 cm_node->ord_size = conn_ord;
137 }
138
139 /**
140 * i40iw_copy_ip_ntohl - change network to host ip
141 * @dst: host ip
142 * @src: big endian
143 */
144 void i40iw_copy_ip_ntohl(u32 *dst, __be32 *src)
145 {
146 *dst++ = ntohl(*src++);
147 *dst++ = ntohl(*src++);
148 *dst++ = ntohl(*src++);
149 *dst = ntohl(*src);
150 }
151
152 /**
153 * i40iw_copy_ip_htonl - change host addr to network ip
154 * @dst: host ip
155 * @src: little endian
156 */
157 static inline void i40iw_copy_ip_htonl(__be32 *dst, u32 *src)
158 {
159 *dst++ = htonl(*src++);
160 *dst++ = htonl(*src++);
161 *dst++ = htonl(*src++);
162 *dst = htonl(*src);
163 }
164
165 /**
166 * i40iw_fill_sockaddr4 - get addr info for passive connection
167 * @cm_node: connection's node
168 * @event: upper layer's cm event
169 */
170 static inline void i40iw_fill_sockaddr4(struct i40iw_cm_node *cm_node,
171 struct iw_cm_event *event)
172 {
173 struct sockaddr_in *laddr = (struct sockaddr_in *)&event->local_addr;
174 struct sockaddr_in *raddr = (struct sockaddr_in *)&event->remote_addr;
175
176 laddr->sin_family = AF_INET;
177 raddr->sin_family = AF_INET;
178
179 laddr->sin_port = htons(cm_node->loc_port);
180 raddr->sin_port = htons(cm_node->rem_port);
181
182 laddr->sin_addr.s_addr = htonl(cm_node->loc_addr[0]);
183 raddr->sin_addr.s_addr = htonl(cm_node->rem_addr[0]);
184 }
185
186 /**
187 * i40iw_fill_sockaddr6 - get ipv6 addr info for passive side
188 * @cm_node: connection's node
189 * @event: upper layer's cm event
190 */
191 static inline void i40iw_fill_sockaddr6(struct i40iw_cm_node *cm_node,
192 struct iw_cm_event *event)
193 {
194 struct sockaddr_in6 *laddr6 = (struct sockaddr_in6 *)&event->local_addr;
195 struct sockaddr_in6 *raddr6 = (struct sockaddr_in6 *)&event->remote_addr;
196
197 laddr6->sin6_family = AF_INET6;
198 raddr6->sin6_family = AF_INET6;
199
200 laddr6->sin6_port = htons(cm_node->loc_port);
201 raddr6->sin6_port = htons(cm_node->rem_port);
202
203 i40iw_copy_ip_htonl(laddr6->sin6_addr.in6_u.u6_addr32,
204 cm_node->loc_addr);
205 i40iw_copy_ip_htonl(raddr6->sin6_addr.in6_u.u6_addr32,
206 cm_node->rem_addr);
207 }
208
209 /**
210 * i40iw_get_addr_info
211 * @cm_node: contains ip/tcp info
212 * @cm_info: to get a copy of the cm_node ip/tcp info
213 */
214 static void i40iw_get_addr_info(struct i40iw_cm_node *cm_node,
215 struct i40iw_cm_info *cm_info)
216 {
217 cm_info->ipv4 = cm_node->ipv4;
218 cm_info->vlan_id = cm_node->vlan_id;
219 memcpy(cm_info->loc_addr, cm_node->loc_addr, sizeof(cm_info->loc_addr));
220 memcpy(cm_info->rem_addr, cm_node->rem_addr, sizeof(cm_info->rem_addr));
221 cm_info->loc_port = cm_node->loc_port;
222 cm_info->rem_port = cm_node->rem_port;
223 cm_info->user_pri = cm_node->user_pri;
224 }
225
226 /**
227 * i40iw_get_cmevent_info - for cm event upcall
228 * @cm_node: connection's node
229 * @cm_id: upper layers cm struct for the event
230 * @event: upper layer's cm event
231 */
232 static inline void i40iw_get_cmevent_info(struct i40iw_cm_node *cm_node,
233 struct iw_cm_id *cm_id,
234 struct iw_cm_event *event)
235 {
236 memcpy(&event->local_addr, &cm_id->m_local_addr,
237 sizeof(event->local_addr));
238 memcpy(&event->remote_addr, &cm_id->m_remote_addr,
239 sizeof(event->remote_addr));
240 if (cm_node) {
241 event->private_data = (void *)cm_node->pdata_buf;
242 event->private_data_len = (u8)cm_node->pdata.size;
243 event->ird = cm_node->ird_size;
244 event->ord = cm_node->ord_size;
245 }
246 }
247
248 /**
249 * i40iw_send_cm_event - upcall cm's event handler
250 * @cm_node: connection's node
251 * @cm_id: upper layer's cm info struct
252 * @type: Event type to indicate
253 * @status: status for the event type
254 */
255 static int i40iw_send_cm_event(struct i40iw_cm_node *cm_node,
256 struct iw_cm_id *cm_id,
257 enum iw_cm_event_type type,
258 int status)
259 {
260 struct iw_cm_event event;
261
262 memset(&event, 0, sizeof(event));
263 event.event = type;
264 event.status = status;
265 switch (type) {
266 case IW_CM_EVENT_CONNECT_REQUEST:
267 if (cm_node->ipv4)
268 i40iw_fill_sockaddr4(cm_node, &event);
269 else
270 i40iw_fill_sockaddr6(cm_node, &event);
271 event.provider_data = (void *)cm_node;
272 event.private_data = (void *)cm_node->pdata_buf;
273 event.private_data_len = (u8)cm_node->pdata.size;
274 event.ird = cm_node->ird_size;
275 break;
276 case IW_CM_EVENT_CONNECT_REPLY:
277 i40iw_get_cmevent_info(cm_node, cm_id, &event);
278 break;
279 case IW_CM_EVENT_ESTABLISHED:
280 event.ird = cm_node->ird_size;
281 event.ord = cm_node->ord_size;
282 break;
283 case IW_CM_EVENT_DISCONNECT:
284 break;
285 case IW_CM_EVENT_CLOSE:
286 break;
287 default:
288 i40iw_pr_err("event type received type = %d\n", type);
289 return -1;
290 }
291 return cm_id->event_handler(cm_id, &event);
292 }
293
294 /**
295 * i40iw_create_event - create cm event
296 * @cm_node: connection's node
297 * @type: Event type to generate
298 */
299 static struct i40iw_cm_event *i40iw_create_event(struct i40iw_cm_node *cm_node,
300 enum i40iw_cm_event_type type)
301 {
302 struct i40iw_cm_event *event;
303
304 if (!cm_node->cm_id)
305 return NULL;
306
307 event = kzalloc(sizeof(*event), GFP_ATOMIC);
308
309 if (!event)
310 return NULL;
311
312 event->type = type;
313 event->cm_node = cm_node;
314 memcpy(event->cm_info.rem_addr, cm_node->rem_addr, sizeof(event->cm_info.rem_addr));
315 memcpy(event->cm_info.loc_addr, cm_node->loc_addr, sizeof(event->cm_info.loc_addr));
316 event->cm_info.rem_port = cm_node->rem_port;
317 event->cm_info.loc_port = cm_node->loc_port;
318 event->cm_info.cm_id = cm_node->cm_id;
319
320 i40iw_debug(cm_node->dev,
321 I40IW_DEBUG_CM,
322 "node=%p event=%p type=%u dst=%pI4 src=%pI4\n",
323 cm_node,
324 event,
325 type,
326 event->cm_info.loc_addr,
327 event->cm_info.rem_addr);
328
329 i40iw_cm_post_event(event);
330 return event;
331 }
332
333 /**
334 * i40iw_free_retrans_entry - free send entry
335 * @cm_node: connection's node
336 */
337 static void i40iw_free_retrans_entry(struct i40iw_cm_node *cm_node)
338 {
339 struct i40iw_device *iwdev = cm_node->iwdev;
340 struct i40iw_timer_entry *send_entry;
341
342 send_entry = cm_node->send_entry;
343 if (send_entry) {
344 cm_node->send_entry = NULL;
345 i40iw_free_sqbuf(&iwdev->vsi, (void *)send_entry->sqbuf);
346 kfree(send_entry);
347 atomic_dec(&cm_node->ref_count);
348 }
349 }
350
351 /**
352 * i40iw_cleanup_retrans_entry - free send entry with lock
353 * @cm_node: connection's node
354 */
355 static void i40iw_cleanup_retrans_entry(struct i40iw_cm_node *cm_node)
356 {
357 unsigned long flags;
358
359 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
360 i40iw_free_retrans_entry(cm_node);
361 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
362 }
363
364 /**
365 * i40iw_form_cm_frame - get a free packet and build frame
366 * @cm_node: connection's node ionfo to use in frame
367 * @options: pointer to options info
368 * @hdr: pointer mpa header
369 * @pdata: pointer to private data
370 * @flags: indicates FIN or ACK
371 */
372 static struct i40iw_puda_buf *i40iw_form_cm_frame(struct i40iw_cm_node *cm_node,
373 struct i40iw_kmem_info *options,
374 struct i40iw_kmem_info *hdr,
375 struct i40iw_kmem_info *pdata,
376 u8 flags)
377 {
378 struct i40iw_puda_buf *sqbuf;
379 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
380 u8 *buf;
381
382 struct tcphdr *tcph;
383 struct iphdr *iph;
384 struct ipv6hdr *ip6h;
385 struct ethhdr *ethh;
386 u16 packetsize;
387 u16 eth_hlen = ETH_HLEN;
388 u32 opts_len = 0;
389 u32 pd_len = 0;
390 u32 hdr_len = 0;
391 u16 vtag;
392
393 sqbuf = i40iw_puda_get_bufpool(vsi->ilq);
394 if (!sqbuf)
395 return NULL;
396 buf = sqbuf->mem.va;
397
398 if (options)
399 opts_len = (u32)options->size;
400
401 if (hdr)
402 hdr_len = hdr->size;
403
404 if (pdata)
405 pd_len = pdata->size;
406
407 if (cm_node->vlan_id <= VLAN_VID_MASK)
408 eth_hlen += 4;
409
410 if (cm_node->ipv4)
411 packetsize = sizeof(*iph) + sizeof(*tcph);
412 else
413 packetsize = sizeof(*ip6h) + sizeof(*tcph);
414 packetsize += opts_len + hdr_len + pd_len;
415
416 memset(buf, 0x00, eth_hlen + packetsize);
417
418 sqbuf->totallen = packetsize + eth_hlen;
419 sqbuf->maclen = eth_hlen;
420 sqbuf->tcphlen = sizeof(*tcph) + opts_len;
421 sqbuf->scratch = (void *)cm_node;
422
423 ethh = (struct ethhdr *)buf;
424 buf += eth_hlen;
425
426 if (cm_node->ipv4) {
427 sqbuf->ipv4 = true;
428
429 iph = (struct iphdr *)buf;
430 buf += sizeof(*iph);
431 tcph = (struct tcphdr *)buf;
432 buf += sizeof(*tcph);
433
434 ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
435 ether_addr_copy(ethh->h_source, cm_node->loc_mac);
436 if (cm_node->vlan_id <= VLAN_VID_MASK) {
437 ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
438 vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
439 ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
440
441 ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IP);
442 } else {
443 ethh->h_proto = htons(ETH_P_IP);
444 }
445
446 iph->version = IPVERSION;
447 iph->ihl = 5; /* 5 * 4Byte words, IP headr len */
448 iph->tos = cm_node->tos;
449 iph->tot_len = htons(packetsize);
450 iph->id = htons(++cm_node->tcp_cntxt.loc_id);
451
452 iph->frag_off = htons(0x4000);
453 iph->ttl = 0x40;
454 iph->protocol = IPPROTO_TCP;
455 iph->saddr = htonl(cm_node->loc_addr[0]);
456 iph->daddr = htonl(cm_node->rem_addr[0]);
457 } else {
458 sqbuf->ipv4 = false;
459 ip6h = (struct ipv6hdr *)buf;
460 buf += sizeof(*ip6h);
461 tcph = (struct tcphdr *)buf;
462 buf += sizeof(*tcph);
463
464 ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
465 ether_addr_copy(ethh->h_source, cm_node->loc_mac);
466 if (cm_node->vlan_id <= VLAN_VID_MASK) {
467 ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
468 vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
469 ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
470 ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IPV6);
471 } else {
472 ethh->h_proto = htons(ETH_P_IPV6);
473 }
474 ip6h->version = 6;
475 ip6h->priority = cm_node->tos >> 4;
476 ip6h->flow_lbl[0] = cm_node->tos << 4;
477 ip6h->flow_lbl[1] = 0;
478 ip6h->flow_lbl[2] = 0;
479 ip6h->payload_len = htons(packetsize - sizeof(*ip6h));
480 ip6h->nexthdr = 6;
481 ip6h->hop_limit = 128;
482 i40iw_copy_ip_htonl(ip6h->saddr.in6_u.u6_addr32,
483 cm_node->loc_addr);
484 i40iw_copy_ip_htonl(ip6h->daddr.in6_u.u6_addr32,
485 cm_node->rem_addr);
486 }
487
488 tcph->source = htons(cm_node->loc_port);
489 tcph->dest = htons(cm_node->rem_port);
490
491 tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
492
493 if (flags & SET_ACK) {
494 cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
495 tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
496 tcph->ack = 1;
497 } else {
498 tcph->ack_seq = 0;
499 }
500
501 if (flags & SET_SYN) {
502 cm_node->tcp_cntxt.loc_seq_num++;
503 tcph->syn = 1;
504 } else {
505 cm_node->tcp_cntxt.loc_seq_num += hdr_len + pd_len;
506 }
507
508 if (flags & SET_FIN) {
509 cm_node->tcp_cntxt.loc_seq_num++;
510 tcph->fin = 1;
511 }
512
513 if (flags & SET_RST)
514 tcph->rst = 1;
515
516 tcph->doff = (u16)((sizeof(*tcph) + opts_len + 3) >> 2);
517 sqbuf->tcphlen = tcph->doff << 2;
518 tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
519 tcph->urg_ptr = 0;
520
521 if (opts_len) {
522 memcpy(buf, options->addr, opts_len);
523 buf += opts_len;
524 }
525
526 if (hdr_len) {
527 memcpy(buf, hdr->addr, hdr_len);
528 buf += hdr_len;
529 }
530
531 if (pdata && pdata->addr)
532 memcpy(buf, pdata->addr, pdata->size);
533
534 atomic_set(&sqbuf->refcount, 1);
535
536 return sqbuf;
537 }
538
539 /**
540 * i40iw_send_reset - Send RST packet
541 * @cm_node: connection's node
542 */
543 int i40iw_send_reset(struct i40iw_cm_node *cm_node)
544 {
545 struct i40iw_puda_buf *sqbuf;
546 int flags = SET_RST | SET_ACK;
547
548 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, flags);
549 if (!sqbuf) {
550 i40iw_pr_err("no sqbuf\n");
551 return -1;
552 }
553
554 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 0, 1);
555 }
556
557 /**
558 * i40iw_active_open_err - send event for active side cm error
559 * @cm_node: connection's node
560 * @reset: Flag to send reset or not
561 */
562 static void i40iw_active_open_err(struct i40iw_cm_node *cm_node, bool reset)
563 {
564 i40iw_cleanup_retrans_entry(cm_node);
565 cm_node->cm_core->stats_connect_errs++;
566 if (reset) {
567 i40iw_debug(cm_node->dev,
568 I40IW_DEBUG_CM,
569 "%s cm_node=%p state=%d\n",
570 __func__,
571 cm_node,
572 cm_node->state);
573 atomic_inc(&cm_node->ref_count);
574 i40iw_send_reset(cm_node);
575 }
576
577 cm_node->state = I40IW_CM_STATE_CLOSED;
578 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
579 }
580
581 /**
582 * i40iw_passive_open_err - handle passive side cm error
583 * @cm_node: connection's node
584 * @reset: send reset or just free cm_node
585 */
586 static void i40iw_passive_open_err(struct i40iw_cm_node *cm_node, bool reset)
587 {
588 i40iw_cleanup_retrans_entry(cm_node);
589 cm_node->cm_core->stats_passive_errs++;
590 cm_node->state = I40IW_CM_STATE_CLOSED;
591 i40iw_debug(cm_node->dev,
592 I40IW_DEBUG_CM,
593 "%s cm_node=%p state =%d\n",
594 __func__,
595 cm_node,
596 cm_node->state);
597 if (reset)
598 i40iw_send_reset(cm_node);
599 else
600 i40iw_rem_ref_cm_node(cm_node);
601 }
602
603 /**
604 * i40iw_event_connect_error - to create connect error event
605 * @event: cm information for connect event
606 */
607 static void i40iw_event_connect_error(struct i40iw_cm_event *event)
608 {
609 struct i40iw_qp *iwqp;
610 struct iw_cm_id *cm_id;
611
612 cm_id = event->cm_node->cm_id;
613 if (!cm_id)
614 return;
615
616 iwqp = cm_id->provider_data;
617
618 if (!iwqp || !iwqp->iwdev)
619 return;
620
621 iwqp->cm_id = NULL;
622 cm_id->provider_data = NULL;
623 i40iw_send_cm_event(event->cm_node, cm_id,
624 IW_CM_EVENT_CONNECT_REPLY,
625 -ECONNRESET);
626 cm_id->rem_ref(cm_id);
627 i40iw_rem_ref_cm_node(event->cm_node);
628 }
629
630 /**
631 * i40iw_process_options
632 * @cm_node: connection's node
633 * @optionsloc: point to start of options
634 * @optionsize: size of all options
635 * @syn_packet: flag if syn packet
636 */
637 static int i40iw_process_options(struct i40iw_cm_node *cm_node,
638 u8 *optionsloc,
639 u32 optionsize,
640 u32 syn_packet)
641 {
642 u32 tmp;
643 u32 offset = 0;
644 union all_known_options *all_options;
645 char got_mss_option = 0;
646
647 while (offset < optionsize) {
648 all_options = (union all_known_options *)(optionsloc + offset);
649 switch (all_options->as_base.optionnum) {
650 case OPTION_NUMBER_END:
651 offset = optionsize;
652 break;
653 case OPTION_NUMBER_NONE:
654 offset += 1;
655 continue;
656 case OPTION_NUMBER_MSS:
657 i40iw_debug(cm_node->dev,
658 I40IW_DEBUG_CM,
659 "%s: MSS Length: %d Offset: %d Size: %d\n",
660 __func__,
661 all_options->as_mss.length,
662 offset,
663 optionsize);
664 got_mss_option = 1;
665 if (all_options->as_mss.length != 4)
666 return -1;
667 tmp = ntohs(all_options->as_mss.mss);
668 if (tmp > 0 && tmp < cm_node->tcp_cntxt.mss)
669 cm_node->tcp_cntxt.mss = tmp;
670 break;
671 case OPTION_NUMBER_WINDOW_SCALE:
672 cm_node->tcp_cntxt.snd_wscale =
673 all_options->as_windowscale.shiftcount;
674 break;
675 default:
676 i40iw_debug(cm_node->dev,
677 I40IW_DEBUG_CM,
678 "TCP Option not understood: %x\n",
679 all_options->as_base.optionnum);
680 break;
681 }
682 offset += all_options->as_base.length;
683 }
684 if (!got_mss_option && syn_packet)
685 cm_node->tcp_cntxt.mss = I40IW_CM_DEFAULT_MSS;
686 return 0;
687 }
688
689 /**
690 * i40iw_handle_tcp_options -
691 * @cm_node: connection's node
692 * @tcph: pointer tcp header
693 * @optionsize: size of options rcvd
694 * @passive: active or passive flag
695 */
696 static int i40iw_handle_tcp_options(struct i40iw_cm_node *cm_node,
697 struct tcphdr *tcph,
698 int optionsize,
699 int passive)
700 {
701 u8 *optionsloc = (u8 *)&tcph[1];
702
703 if (optionsize) {
704 if (i40iw_process_options(cm_node,
705 optionsloc,
706 optionsize,
707 (u32)tcph->syn)) {
708 i40iw_debug(cm_node->dev,
709 I40IW_DEBUG_CM,
710 "%s: Node %p, Sending RESET\n",
711 __func__,
712 cm_node);
713 if (passive)
714 i40iw_passive_open_err(cm_node, true);
715 else
716 i40iw_active_open_err(cm_node, true);
717 return -1;
718 }
719 }
720
721 cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
722 cm_node->tcp_cntxt.snd_wscale;
723
724 if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
725 cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
726 return 0;
727 }
728
729 /**
730 * i40iw_build_mpa_v1 - build a MPA V1 frame
731 * @cm_node: connection's node
732 * @mpa_key: to do read0 or write0
733 */
734 static void i40iw_build_mpa_v1(struct i40iw_cm_node *cm_node,
735 void *start_addr,
736 u8 mpa_key)
737 {
738 struct ietf_mpa_v1 *mpa_frame = (struct ietf_mpa_v1 *)start_addr;
739
740 switch (mpa_key) {
741 case MPA_KEY_REQUEST:
742 memcpy(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE);
743 break;
744 case MPA_KEY_REPLY:
745 memcpy(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
746 break;
747 default:
748 break;
749 }
750 mpa_frame->flags = IETF_MPA_FLAGS_CRC;
751 mpa_frame->rev = cm_node->mpa_frame_rev;
752 mpa_frame->priv_data_len = htons(cm_node->pdata.size);
753 }
754
755 /**
756 * i40iw_build_mpa_v2 - build a MPA V2 frame
757 * @cm_node: connection's node
758 * @start_addr: buffer start address
759 * @mpa_key: to do read0 or write0
760 */
761 static void i40iw_build_mpa_v2(struct i40iw_cm_node *cm_node,
762 void *start_addr,
763 u8 mpa_key)
764 {
765 struct ietf_mpa_v2 *mpa_frame = (struct ietf_mpa_v2 *)start_addr;
766 struct ietf_rtr_msg *rtr_msg = &mpa_frame->rtr_msg;
767 u16 ctrl_ird, ctrl_ord;
768
769 /* initialize the upper 5 bytes of the frame */
770 i40iw_build_mpa_v1(cm_node, start_addr, mpa_key);
771 mpa_frame->flags |= IETF_MPA_V2_FLAG;
772 mpa_frame->priv_data_len += htons(IETF_RTR_MSG_SIZE);
773
774 /* initialize RTR msg */
775 if (cm_node->mpav2_ird_ord == IETF_NO_IRD_ORD) {
776 ctrl_ird = IETF_NO_IRD_ORD;
777 ctrl_ord = IETF_NO_IRD_ORD;
778 } else {
779 ctrl_ird = (cm_node->ird_size > IETF_NO_IRD_ORD) ?
780 IETF_NO_IRD_ORD : cm_node->ird_size;
781 ctrl_ord = (cm_node->ord_size > IETF_NO_IRD_ORD) ?
782 IETF_NO_IRD_ORD : cm_node->ord_size;
783 }
784
785 ctrl_ird |= IETF_PEER_TO_PEER;
786
787 switch (mpa_key) {
788 case MPA_KEY_REQUEST:
789 ctrl_ord |= IETF_RDMA0_WRITE;
790 ctrl_ord |= IETF_RDMA0_READ;
791 break;
792 case MPA_KEY_REPLY:
793 switch (cm_node->send_rdma0_op) {
794 case SEND_RDMA_WRITE_ZERO:
795 ctrl_ord |= IETF_RDMA0_WRITE;
796 break;
797 case SEND_RDMA_READ_ZERO:
798 ctrl_ord |= IETF_RDMA0_READ;
799 break;
800 }
801 break;
802 default:
803 break;
804 }
805 rtr_msg->ctrl_ird = htons(ctrl_ird);
806 rtr_msg->ctrl_ord = htons(ctrl_ord);
807 }
808
809 /**
810 * i40iw_cm_build_mpa_frame - build mpa frame for mpa version 1 or version 2
811 * @cm_node: connection's node
812 * @mpa: mpa: data buffer
813 * @mpa_key: to do read0 or write0
814 */
815 static int i40iw_cm_build_mpa_frame(struct i40iw_cm_node *cm_node,
816 struct i40iw_kmem_info *mpa,
817 u8 mpa_key)
818 {
819 int hdr_len = 0;
820
821 switch (cm_node->mpa_frame_rev) {
822 case IETF_MPA_V1:
823 hdr_len = sizeof(struct ietf_mpa_v1);
824 i40iw_build_mpa_v1(cm_node, mpa->addr, mpa_key);
825 break;
826 case IETF_MPA_V2:
827 hdr_len = sizeof(struct ietf_mpa_v2);
828 i40iw_build_mpa_v2(cm_node, mpa->addr, mpa_key);
829 break;
830 default:
831 break;
832 }
833
834 return hdr_len;
835 }
836
837 /**
838 * i40iw_send_mpa_request - active node send mpa request to passive node
839 * @cm_node: connection's node
840 */
841 static int i40iw_send_mpa_request(struct i40iw_cm_node *cm_node)
842 {
843 struct i40iw_puda_buf *sqbuf;
844
845 if (!cm_node) {
846 i40iw_pr_err("cm_node == NULL\n");
847 return -1;
848 }
849
850 cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
851 cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
852 &cm_node->mpa_hdr,
853 MPA_KEY_REQUEST);
854 if (!cm_node->mpa_hdr.size) {
855 i40iw_pr_err("mpa size = %d\n", cm_node->mpa_hdr.size);
856 return -1;
857 }
858
859 sqbuf = i40iw_form_cm_frame(cm_node,
860 NULL,
861 &cm_node->mpa_hdr,
862 &cm_node->pdata,
863 SET_ACK);
864 if (!sqbuf) {
865 i40iw_pr_err("sq_buf == NULL\n");
866 return -1;
867 }
868 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
869 }
870
871 /**
872 * i40iw_send_mpa_reject -
873 * @cm_node: connection's node
874 * @pdata: reject data for connection
875 * @plen: length of reject data
876 */
877 static int i40iw_send_mpa_reject(struct i40iw_cm_node *cm_node,
878 const void *pdata,
879 u8 plen)
880 {
881 struct i40iw_puda_buf *sqbuf;
882 struct i40iw_kmem_info priv_info;
883
884 cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
885 cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
886 &cm_node->mpa_hdr,
887 MPA_KEY_REPLY);
888
889 cm_node->mpa_frame.flags |= IETF_MPA_FLAGS_REJECT;
890 priv_info.addr = (void *)pdata;
891 priv_info.size = plen;
892
893 sqbuf = i40iw_form_cm_frame(cm_node,
894 NULL,
895 &cm_node->mpa_hdr,
896 &priv_info,
897 SET_ACK | SET_FIN);
898 if (!sqbuf) {
899 i40iw_pr_err("no sqbuf\n");
900 return -ENOMEM;
901 }
902 cm_node->state = I40IW_CM_STATE_FIN_WAIT1;
903 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
904 }
905
906 /**
907 * recv_mpa - process an IETF MPA frame
908 * @cm_node: connection's node
909 * @buffer: Data pointer
910 * @type: to return accept or reject
911 * @len: Len of mpa buffer
912 */
913 static int i40iw_parse_mpa(struct i40iw_cm_node *cm_node, u8 *buffer, u32 *type, u32 len)
914 {
915 struct ietf_mpa_v1 *mpa_frame;
916 struct ietf_mpa_v2 *mpa_v2_frame;
917 struct ietf_rtr_msg *rtr_msg;
918 int mpa_hdr_len;
919 int priv_data_len;
920
921 *type = I40IW_MPA_REQUEST_ACCEPT;
922
923 if (len < sizeof(struct ietf_mpa_v1)) {
924 i40iw_pr_err("ietf buffer small (%x)\n", len);
925 return -1;
926 }
927
928 mpa_frame = (struct ietf_mpa_v1 *)buffer;
929 mpa_hdr_len = sizeof(struct ietf_mpa_v1);
930 priv_data_len = ntohs(mpa_frame->priv_data_len);
931
932 if (priv_data_len > IETF_MAX_PRIV_DATA_LEN) {
933 i40iw_pr_err("large pri_data %d\n", priv_data_len);
934 return -1;
935 }
936 if (mpa_frame->rev != IETF_MPA_V1 && mpa_frame->rev != IETF_MPA_V2) {
937 i40iw_pr_err("unsupported mpa rev = %d\n", mpa_frame->rev);
938 return -1;
939 }
940 if (mpa_frame->rev > cm_node->mpa_frame_rev) {
941 i40iw_pr_err("rev %d\n", mpa_frame->rev);
942 return -1;
943 }
944 cm_node->mpa_frame_rev = mpa_frame->rev;
945
946 if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
947 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE)) {
948 i40iw_pr_err("Unexpected MPA Key received\n");
949 return -1;
950 }
951 } else {
952 if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE)) {
953 i40iw_pr_err("Unexpected MPA Key received\n");
954 return -1;
955 }
956 }
957
958 if (priv_data_len + mpa_hdr_len > len) {
959 i40iw_pr_err("ietf buffer len(%x + %x != %x)\n",
960 priv_data_len, mpa_hdr_len, len);
961 return -1;
962 }
963 if (len > MAX_CM_BUFFER) {
964 i40iw_pr_err("ietf buffer large len = %d\n", len);
965 return -1;
966 }
967
968 switch (mpa_frame->rev) {
969 case IETF_MPA_V2:{
970 u16 ird_size;
971 u16 ord_size;
972 u16 ctrl_ord;
973 u16 ctrl_ird;
974
975 mpa_v2_frame = (struct ietf_mpa_v2 *)buffer;
976 mpa_hdr_len += IETF_RTR_MSG_SIZE;
977 rtr_msg = &mpa_v2_frame->rtr_msg;
978
979 /* parse rtr message */
980 ctrl_ord = ntohs(rtr_msg->ctrl_ord);
981 ctrl_ird = ntohs(rtr_msg->ctrl_ird);
982 ird_size = ctrl_ird & IETF_NO_IRD_ORD;
983 ord_size = ctrl_ord & IETF_NO_IRD_ORD;
984
985 if (!(ctrl_ird & IETF_PEER_TO_PEER))
986 return -1;
987
988 if (ird_size == IETF_NO_IRD_ORD || ord_size == IETF_NO_IRD_ORD) {
989 cm_node->mpav2_ird_ord = IETF_NO_IRD_ORD;
990 goto negotiate_done;
991 }
992
993 if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
994 /* responder */
995 if (!ord_size && (ctrl_ord & IETF_RDMA0_READ))
996 cm_node->ird_size = 1;
997 if (cm_node->ord_size > ird_size)
998 cm_node->ord_size = ird_size;
999 } else {
1000 /* initiator */
1001 if (!ird_size && (ctrl_ord & IETF_RDMA0_READ))
1002 return -1;
1003 if (cm_node->ord_size > ird_size)
1004 cm_node->ord_size = ird_size;
1005
1006 if (cm_node->ird_size < ord_size)
1007 /* no resources available */
1008 return -1;
1009 }
1010
1011 negotiate_done:
1012 if (ctrl_ord & IETF_RDMA0_READ)
1013 cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
1014 else if (ctrl_ord & IETF_RDMA0_WRITE)
1015 cm_node->send_rdma0_op = SEND_RDMA_WRITE_ZERO;
1016 else /* Not supported RDMA0 operation */
1017 return -1;
1018 i40iw_debug(cm_node->dev, I40IW_DEBUG_CM,
1019 "MPAV2: Negotiated ORD: %d, IRD: %d\n",
1020 cm_node->ord_size, cm_node->ird_size);
1021 break;
1022 }
1023 break;
1024 case IETF_MPA_V1:
1025 default:
1026 break;
1027 }
1028
1029 memcpy(cm_node->pdata_buf, buffer + mpa_hdr_len, priv_data_len);
1030 cm_node->pdata.size = priv_data_len;
1031
1032 if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
1033 *type = I40IW_MPA_REQUEST_REJECT;
1034
1035 if (mpa_frame->flags & IETF_MPA_FLAGS_MARKERS)
1036 cm_node->snd_mark_en = true;
1037
1038 return 0;
1039 }
1040
1041 /**
1042 * i40iw_schedule_cm_timer
1043 * @@cm_node: connection's node
1044 * @sqbuf: buffer to send
1045 * @type: if it is send or close
1046 * @send_retrans: if rexmits to be done
1047 * @close_when_complete: is cm_node to be removed
1048 *
1049 * note - cm_node needs to be protected before calling this. Encase in:
1050 * i40iw_rem_ref_cm_node(cm_core, cm_node);
1051 * i40iw_schedule_cm_timer(...)
1052 * atomic_inc(&cm_node->ref_count);
1053 */
1054 int i40iw_schedule_cm_timer(struct i40iw_cm_node *cm_node,
1055 struct i40iw_puda_buf *sqbuf,
1056 enum i40iw_timer_type type,
1057 int send_retrans,
1058 int close_when_complete)
1059 {
1060 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1061 struct i40iw_cm_core *cm_core = cm_node->cm_core;
1062 struct i40iw_timer_entry *new_send;
1063 int ret = 0;
1064 u32 was_timer_set;
1065 unsigned long flags;
1066
1067 new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
1068 if (!new_send) {
1069 if (type != I40IW_TIMER_TYPE_CLOSE)
1070 i40iw_free_sqbuf(vsi, (void *)sqbuf);
1071 return -ENOMEM;
1072 }
1073 new_send->retrycount = I40IW_DEFAULT_RETRYS;
1074 new_send->retranscount = I40IW_DEFAULT_RETRANS;
1075 new_send->sqbuf = sqbuf;
1076 new_send->timetosend = jiffies;
1077 new_send->type = type;
1078 new_send->send_retrans = send_retrans;
1079 new_send->close_when_complete = close_when_complete;
1080
1081 if (type == I40IW_TIMER_TYPE_CLOSE) {
1082 new_send->timetosend += (HZ / 10);
1083 if (cm_node->close_entry) {
1084 kfree(new_send);
1085 i40iw_pr_err("already close entry\n");
1086 return -EINVAL;
1087 }
1088 cm_node->close_entry = new_send;
1089 }
1090
1091 if (type == I40IW_TIMER_TYPE_SEND) {
1092 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1093 cm_node->send_entry = new_send;
1094 atomic_inc(&cm_node->ref_count);
1095 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1096 new_send->timetosend = jiffies + I40IW_RETRY_TIMEOUT;
1097
1098 atomic_inc(&sqbuf->refcount);
1099 i40iw_puda_send_buf(vsi->ilq, sqbuf);
1100 if (!send_retrans) {
1101 i40iw_cleanup_retrans_entry(cm_node);
1102 if (close_when_complete)
1103 i40iw_rem_ref_cm_node(cm_node);
1104 return ret;
1105 }
1106 }
1107
1108 spin_lock_irqsave(&cm_core->ht_lock, flags);
1109 was_timer_set = timer_pending(&cm_core->tcp_timer);
1110
1111 if (!was_timer_set) {
1112 cm_core->tcp_timer.expires = new_send->timetosend;
1113 add_timer(&cm_core->tcp_timer);
1114 }
1115 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1116
1117 return ret;
1118 }
1119
1120 /**
1121 * i40iw_retrans_expired - Could not rexmit the packet
1122 * @cm_node: connection's node
1123 */
1124 static void i40iw_retrans_expired(struct i40iw_cm_node *cm_node)
1125 {
1126 struct iw_cm_id *cm_id = cm_node->cm_id;
1127 enum i40iw_cm_node_state state = cm_node->state;
1128
1129 cm_node->state = I40IW_CM_STATE_CLOSED;
1130 switch (state) {
1131 case I40IW_CM_STATE_SYN_RCVD:
1132 case I40IW_CM_STATE_CLOSING:
1133 i40iw_rem_ref_cm_node(cm_node);
1134 break;
1135 case I40IW_CM_STATE_FIN_WAIT1:
1136 case I40IW_CM_STATE_LAST_ACK:
1137 if (cm_node->cm_id)
1138 cm_id->rem_ref(cm_id);
1139 i40iw_send_reset(cm_node);
1140 break;
1141 default:
1142 atomic_inc(&cm_node->ref_count);
1143 i40iw_send_reset(cm_node);
1144 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
1145 break;
1146 }
1147 }
1148
1149 /**
1150 * i40iw_handle_close_entry - for handling retry/timeouts
1151 * @cm_node: connection's node
1152 * @rem_node: flag for remove cm_node
1153 */
1154 static void i40iw_handle_close_entry(struct i40iw_cm_node *cm_node, u32 rem_node)
1155 {
1156 struct i40iw_timer_entry *close_entry = cm_node->close_entry;
1157 struct iw_cm_id *cm_id = cm_node->cm_id;
1158 struct i40iw_qp *iwqp;
1159 unsigned long flags;
1160
1161 if (!close_entry)
1162 return;
1163 iwqp = (struct i40iw_qp *)close_entry->sqbuf;
1164 if (iwqp) {
1165 spin_lock_irqsave(&iwqp->lock, flags);
1166 if (iwqp->cm_id) {
1167 iwqp->hw_tcp_state = I40IW_TCP_STATE_CLOSED;
1168 iwqp->hw_iwarp_state = I40IW_QP_STATE_ERROR;
1169 iwqp->last_aeq = I40IW_AE_RESET_SENT;
1170 iwqp->ibqp_state = IB_QPS_ERR;
1171 spin_unlock_irqrestore(&iwqp->lock, flags);
1172 i40iw_cm_disconn(iwqp);
1173 } else {
1174 spin_unlock_irqrestore(&iwqp->lock, flags);
1175 }
1176 } else if (rem_node) {
1177 /* TIME_WAIT state */
1178 i40iw_rem_ref_cm_node(cm_node);
1179 }
1180 if (cm_id)
1181 cm_id->rem_ref(cm_id);
1182 kfree(close_entry);
1183 cm_node->close_entry = NULL;
1184 }
1185
1186 /**
1187 * i40iw_build_timer_list - Add cm_nodes to timer list
1188 * @timer_list: ptr to timer list
1189 * @hte: ptr to accelerated or non-accelerated list
1190 */
1191 static void i40iw_build_timer_list(struct list_head *timer_list,
1192 struct list_head *hte)
1193 {
1194 struct i40iw_cm_node *cm_node;
1195 struct list_head *list_core_temp, *list_node;
1196
1197 list_for_each_safe(list_node, list_core_temp, hte) {
1198 cm_node = container_of(list_node, struct i40iw_cm_node, list);
1199 if (cm_node->close_entry || cm_node->send_entry) {
1200 atomic_inc(&cm_node->ref_count);
1201 list_add(&cm_node->timer_entry, timer_list);
1202 }
1203 }
1204 }
1205
1206 /**
1207 * i40iw_cm_timer_tick - system's timer expired callback
1208 * @pass: Pointing to cm_core
1209 */
1210 static void i40iw_cm_timer_tick(struct timer_list *t)
1211 {
1212 unsigned long nexttimeout = jiffies + I40IW_LONG_TIME;
1213 struct i40iw_cm_node *cm_node;
1214 struct i40iw_timer_entry *send_entry, *close_entry;
1215 struct list_head *list_core_temp;
1216 struct i40iw_sc_vsi *vsi;
1217 struct list_head *list_node;
1218 struct i40iw_cm_core *cm_core = from_timer(cm_core, t, tcp_timer);
1219 u32 settimer = 0;
1220 unsigned long timetosend;
1221 unsigned long flags;
1222
1223 struct list_head timer_list;
1224
1225 INIT_LIST_HEAD(&timer_list);
1226
1227 spin_lock_irqsave(&cm_core->ht_lock, flags);
1228 i40iw_build_timer_list(&timer_list, &cm_core->non_accelerated_list);
1229 i40iw_build_timer_list(&timer_list, &cm_core->accelerated_list);
1230 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1231
1232 list_for_each_safe(list_node, list_core_temp, &timer_list) {
1233 cm_node = container_of(list_node,
1234 struct i40iw_cm_node,
1235 timer_entry);
1236 close_entry = cm_node->close_entry;
1237
1238 if (close_entry) {
1239 if (time_after(close_entry->timetosend, jiffies)) {
1240 if (nexttimeout > close_entry->timetosend ||
1241 !settimer) {
1242 nexttimeout = close_entry->timetosend;
1243 settimer = 1;
1244 }
1245 } else {
1246 i40iw_handle_close_entry(cm_node, 1);
1247 }
1248 }
1249
1250 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1251
1252 send_entry = cm_node->send_entry;
1253 if (!send_entry)
1254 goto done;
1255 if (time_after(send_entry->timetosend, jiffies)) {
1256 if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
1257 if ((nexttimeout > send_entry->timetosend) ||
1258 !settimer) {
1259 nexttimeout = send_entry->timetosend;
1260 settimer = 1;
1261 }
1262 } else {
1263 i40iw_free_retrans_entry(cm_node);
1264 }
1265 goto done;
1266 }
1267
1268 if ((cm_node->state == I40IW_CM_STATE_OFFLOADED) ||
1269 (cm_node->state == I40IW_CM_STATE_CLOSED)) {
1270 i40iw_free_retrans_entry(cm_node);
1271 goto done;
1272 }
1273
1274 if (!send_entry->retranscount || !send_entry->retrycount) {
1275 i40iw_free_retrans_entry(cm_node);
1276
1277 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1278 i40iw_retrans_expired(cm_node);
1279 cm_node->state = I40IW_CM_STATE_CLOSED;
1280 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1281 goto done;
1282 }
1283 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1284
1285 vsi = &cm_node->iwdev->vsi;
1286
1287 if (!cm_node->ack_rcvd) {
1288 atomic_inc(&send_entry->sqbuf->refcount);
1289 i40iw_puda_send_buf(vsi->ilq, send_entry->sqbuf);
1290 cm_node->cm_core->stats_pkt_retrans++;
1291 }
1292 spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1293 if (send_entry->send_retrans) {
1294 send_entry->retranscount--;
1295 timetosend = (I40IW_RETRY_TIMEOUT <<
1296 (I40IW_DEFAULT_RETRANS -
1297 send_entry->retranscount));
1298
1299 send_entry->timetosend = jiffies +
1300 min(timetosend, I40IW_MAX_TIMEOUT);
1301 if (nexttimeout > send_entry->timetosend || !settimer) {
1302 nexttimeout = send_entry->timetosend;
1303 settimer = 1;
1304 }
1305 } else {
1306 int close_when_complete;
1307
1308 close_when_complete = send_entry->close_when_complete;
1309 i40iw_debug(cm_node->dev,
1310 I40IW_DEBUG_CM,
1311 "cm_node=%p state=%d\n",
1312 cm_node,
1313 cm_node->state);
1314 i40iw_free_retrans_entry(cm_node);
1315 if (close_when_complete)
1316 i40iw_rem_ref_cm_node(cm_node);
1317 }
1318 done:
1319 spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1320 i40iw_rem_ref_cm_node(cm_node);
1321 }
1322
1323 if (settimer) {
1324 spin_lock_irqsave(&cm_core->ht_lock, flags);
1325 if (!timer_pending(&cm_core->tcp_timer)) {
1326 cm_core->tcp_timer.expires = nexttimeout;
1327 add_timer(&cm_core->tcp_timer);
1328 }
1329 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1330 }
1331 }
1332
1333 /**
1334 * i40iw_send_syn - send SYN packet
1335 * @cm_node: connection's node
1336 * @sendack: flag to set ACK bit or not
1337 */
1338 int i40iw_send_syn(struct i40iw_cm_node *cm_node, u32 sendack)
1339 {
1340 struct i40iw_puda_buf *sqbuf;
1341 int flags = SET_SYN;
1342 char optionsbuffer[sizeof(struct option_mss) +
1343 sizeof(struct option_windowscale) +
1344 sizeof(struct option_base) + TCP_OPTIONS_PADDING];
1345 struct i40iw_kmem_info opts;
1346
1347 int optionssize = 0;
1348 /* Sending MSS option */
1349 union all_known_options *options;
1350
1351 opts.addr = optionsbuffer;
1352 if (!cm_node) {
1353 i40iw_pr_err("no cm_node\n");
1354 return -EINVAL;
1355 }
1356
1357 options = (union all_known_options *)&optionsbuffer[optionssize];
1358 options->as_mss.optionnum = OPTION_NUMBER_MSS;
1359 options->as_mss.length = sizeof(struct option_mss);
1360 options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
1361 optionssize += sizeof(struct option_mss);
1362
1363 options = (union all_known_options *)&optionsbuffer[optionssize];
1364 options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
1365 options->as_windowscale.length = sizeof(struct option_windowscale);
1366 options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
1367 optionssize += sizeof(struct option_windowscale);
1368 options = (union all_known_options *)&optionsbuffer[optionssize];
1369 options->as_end = OPTION_NUMBER_END;
1370 optionssize += 1;
1371
1372 if (sendack)
1373 flags |= SET_ACK;
1374
1375 opts.size = optionssize;
1376
1377 sqbuf = i40iw_form_cm_frame(cm_node, &opts, NULL, NULL, flags);
1378 if (!sqbuf) {
1379 i40iw_pr_err("no sqbuf\n");
1380 return -1;
1381 }
1382 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1383 }
1384
1385 /**
1386 * i40iw_send_ack - Send ACK packet
1387 * @cm_node: connection's node
1388 */
1389 static void i40iw_send_ack(struct i40iw_cm_node *cm_node)
1390 {
1391 struct i40iw_puda_buf *sqbuf;
1392 struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1393
1394 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK);
1395 if (sqbuf)
1396 i40iw_puda_send_buf(vsi->ilq, sqbuf);
1397 else
1398 i40iw_pr_err("no sqbuf\n");
1399 }
1400
1401 /**
1402 * i40iw_send_fin - Send FIN pkt
1403 * @cm_node: connection's node
1404 */
1405 static int i40iw_send_fin(struct i40iw_cm_node *cm_node)
1406 {
1407 struct i40iw_puda_buf *sqbuf;
1408
1409 sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK | SET_FIN);
1410 if (!sqbuf) {
1411 i40iw_pr_err("no sqbuf\n");
1412 return -1;
1413 }
1414 return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1415 }
1416
1417 /**
1418 * i40iw_find_node - find a cm node that matches the reference cm node
1419 * @cm_core: cm's core
1420 * @rem_port: remote tcp port num
1421 * @rem_addr: remote ip addr
1422 * @loc_port: local tcp port num
1423 * @loc_addr: loc ip addr
1424 * @add_refcnt: flag to increment refcount of cm_node
1425 * @accelerated_list: flag for accelerated vs non-accelerated list to search
1426 */
1427 struct i40iw_cm_node *i40iw_find_node(struct i40iw_cm_core *cm_core,
1428 u16 rem_port,
1429 u32 *rem_addr,
1430 u16 loc_port,
1431 u32 *loc_addr,
1432 bool add_refcnt,
1433 bool accelerated_list)
1434 {
1435 struct list_head *hte;
1436 struct i40iw_cm_node *cm_node;
1437 unsigned long flags;
1438
1439 hte = accelerated_list ?
1440 &cm_core->accelerated_list : &cm_core->non_accelerated_list;
1441
1442 /* walk list and find cm_node associated with this session ID */
1443 spin_lock_irqsave(&cm_core->ht_lock, flags);
1444 list_for_each_entry(cm_node, hte, list) {
1445 if (!memcmp(cm_node->loc_addr, loc_addr, sizeof(cm_node->loc_addr)) &&
1446 (cm_node->loc_port == loc_port) &&
1447 !memcmp(cm_node->rem_addr, rem_addr, sizeof(cm_node->rem_addr)) &&
1448 (cm_node->rem_port == rem_port)) {
1449 if (add_refcnt)
1450 atomic_inc(&cm_node->ref_count);
1451 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1452 return cm_node;
1453 }
1454 }
1455 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1456
1457 /* no owner node */
1458 return NULL;
1459 }
1460
1461 /**
1462 * i40iw_find_listener - find a cm node listening on this addr-port pair
1463 * @cm_core: cm's core
1464 * @dst_port: listener tcp port num
1465 * @dst_addr: listener ip addr
1466 * @listener_state: state to match with listen node's
1467 */
1468 static struct i40iw_cm_listener *i40iw_find_listener(
1469 struct i40iw_cm_core *cm_core,
1470 u32 *dst_addr,
1471 u16 dst_port,
1472 u16 vlan_id,
1473 enum i40iw_cm_listener_state
1474 listener_state)
1475 {
1476 struct i40iw_cm_listener *listen_node;
1477 static const u32 ip_zero[4] = { 0, 0, 0, 0 };
1478 u32 listen_addr[4];
1479 u16 listen_port;
1480 unsigned long flags;
1481
1482 /* walk list and find cm_node associated with this session ID */
1483 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1484 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1485 memcpy(listen_addr, listen_node->loc_addr, sizeof(listen_addr));
1486 listen_port = listen_node->loc_port;
1487 /* compare node pair, return node handle if a match */
1488 if ((!memcmp(listen_addr, dst_addr, sizeof(listen_addr)) ||
1489 !memcmp(listen_addr, ip_zero, sizeof(listen_addr))) &&
1490 (listen_port == dst_port) &&
1491 (listener_state & listen_node->listener_state)) {
1492 atomic_inc(&listen_node->ref_count);
1493 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1494 return listen_node;
1495 }
1496 }
1497 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1498 return NULL;
1499 }
1500
1501 /**
1502 * i40iw_add_hte_node - add a cm node to the hash table
1503 * @cm_core: cm's core
1504 * @cm_node: connection's node
1505 */
1506 static void i40iw_add_hte_node(struct i40iw_cm_core *cm_core,
1507 struct i40iw_cm_node *cm_node)
1508 {
1509 unsigned long flags;
1510
1511 if (!cm_node || !cm_core) {
1512 i40iw_pr_err("cm_node or cm_core == NULL\n");
1513 return;
1514 }
1515
1516 spin_lock_irqsave(&cm_core->ht_lock, flags);
1517 list_add_tail(&cm_node->list, &cm_core->non_accelerated_list);
1518 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1519 }
1520
1521 /**
1522 * i40iw_find_port - find port that matches reference port
1523 * @hte: ptr to accelerated or non-accelerated list
1524 * @accelerated_list: flag for accelerated vs non-accelerated list
1525 */
1526 static bool i40iw_find_port(struct list_head *hte, u16 port)
1527 {
1528 struct i40iw_cm_node *cm_node;
1529
1530 list_for_each_entry(cm_node, hte, list) {
1531 if (cm_node->loc_port == port)
1532 return true;
1533 }
1534 return false;
1535 }
1536
1537 /**
1538 * i40iw_port_in_use - determine if port is in use
1539 * @cm_core: cm's core
1540 * @port: port number
1541 */
1542 bool i40iw_port_in_use(struct i40iw_cm_core *cm_core, u16 port)
1543 {
1544 struct i40iw_cm_listener *listen_node;
1545 unsigned long flags;
1546
1547 spin_lock_irqsave(&cm_core->ht_lock, flags);
1548 if (i40iw_find_port(&cm_core->accelerated_list, port) ||
1549 i40iw_find_port(&cm_core->non_accelerated_list, port)) {
1550 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1551 return true;
1552 }
1553 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1554
1555 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1556 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1557 if (listen_node->loc_port == port) {
1558 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1559 return true;
1560 }
1561 }
1562 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1563
1564 return false;
1565 }
1566
1567 /**
1568 * i40iw_del_multiple_qhash - Remove qhash and child listens
1569 * @iwdev: iWarp device
1570 * @cm_info: CM info for parent listen node
1571 * @cm_parent_listen_node: The parent listen node
1572 */
1573 static enum i40iw_status_code i40iw_del_multiple_qhash(
1574 struct i40iw_device *iwdev,
1575 struct i40iw_cm_info *cm_info,
1576 struct i40iw_cm_listener *cm_parent_listen_node)
1577 {
1578 struct i40iw_cm_listener *child_listen_node;
1579 enum i40iw_status_code ret = I40IW_ERR_CONFIG;
1580 struct list_head *pos, *tpos;
1581 unsigned long flags;
1582
1583 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1584 list_for_each_safe(pos, tpos, &cm_parent_listen_node->child_listen_list) {
1585 child_listen_node = list_entry(pos, struct i40iw_cm_listener, child_listen_list);
1586 if (child_listen_node->ipv4)
1587 i40iw_debug(&iwdev->sc_dev,
1588 I40IW_DEBUG_CM,
1589 "removing child listen for IP=%pI4, port=%d, vlan=%d\n",
1590 child_listen_node->loc_addr,
1591 child_listen_node->loc_port,
1592 child_listen_node->vlan_id);
1593 else
1594 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
1595 "removing child listen for IP=%pI6, port=%d, vlan=%d\n",
1596 child_listen_node->loc_addr,
1597 child_listen_node->loc_port,
1598 child_listen_node->vlan_id);
1599 list_del(pos);
1600 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1601 sizeof(cm_info->loc_addr));
1602 cm_info->vlan_id = child_listen_node->vlan_id;
1603 if (child_listen_node->qhash_set) {
1604 ret = i40iw_manage_qhash(iwdev, cm_info,
1605 I40IW_QHASH_TYPE_TCP_SYN,
1606 I40IW_QHASH_MANAGE_TYPE_DELETE,
1607 NULL, false);
1608 child_listen_node->qhash_set = false;
1609 } else {
1610 ret = I40IW_SUCCESS;
1611 }
1612 i40iw_debug(&iwdev->sc_dev,
1613 I40IW_DEBUG_CM,
1614 "freed pointer = %p\n",
1615 child_listen_node);
1616 kfree(child_listen_node);
1617 cm_parent_listen_node->cm_core->stats_listen_nodes_destroyed++;
1618 }
1619 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1620
1621 return ret;
1622 }
1623
1624 /**
1625 * i40iw_netdev_vlan_ipv6 - Gets the netdev and vlan
1626 * @addr: local IPv6 address
1627 * @vlan_id: vlan id for the given IPv6 address
1628 *
1629 * Returns the net_device of the IPv6 address and also sets the
1630 * vlan id for that address.
1631 */
1632 static struct net_device *i40iw_netdev_vlan_ipv6(u32 *addr, u16 *vlan_id)
1633 {
1634 struct net_device *ip_dev = NULL;
1635 struct in6_addr laddr6;
1636
1637 if (!IS_ENABLED(CONFIG_IPV6))
1638 return NULL;
1639 i40iw_copy_ip_htonl(laddr6.in6_u.u6_addr32, addr);
1640 if (vlan_id)
1641 *vlan_id = I40IW_NO_VLAN;
1642 rcu_read_lock();
1643 for_each_netdev_rcu(&init_net, ip_dev) {
1644 if (ipv6_chk_addr(&init_net, &laddr6, ip_dev, 1)) {
1645 if (vlan_id)
1646 *vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1647 break;
1648 }
1649 }
1650 rcu_read_unlock();
1651 return ip_dev;
1652 }
1653
1654 /**
1655 * i40iw_get_vlan_ipv4 - Returns the vlan_id for IPv4 address
1656 * @addr: local IPv4 address
1657 */
1658 static u16 i40iw_get_vlan_ipv4(u32 *addr)
1659 {
1660 struct net_device *netdev;
1661 u16 vlan_id = I40IW_NO_VLAN;
1662
1663 netdev = ip_dev_find(&init_net, htonl(addr[0]));
1664 if (netdev) {
1665 vlan_id = rdma_vlan_dev_vlan_id(netdev);
1666 dev_put(netdev);
1667 }
1668 return vlan_id;
1669 }
1670
1671 /**
1672 * i40iw_add_mqh_6 - Adds multiple qhashes for IPv6
1673 * @iwdev: iWarp device
1674 * @cm_info: CM info for parent listen node
1675 * @cm_parent_listen_node: The parent listen node
1676 *
1677 * Adds a qhash and a child listen node for every IPv6 address
1678 * on the adapter and adds the associated qhash filter
1679 */
1680 static enum i40iw_status_code i40iw_add_mqh_6(struct i40iw_device *iwdev,
1681 struct i40iw_cm_info *cm_info,
1682 struct i40iw_cm_listener *cm_parent_listen_node)
1683 {
1684 struct net_device *ip_dev;
1685 struct inet6_dev *idev;
1686 struct inet6_ifaddr *ifp, *tmp;
1687 enum i40iw_status_code ret = 0;
1688 struct i40iw_cm_listener *child_listen_node;
1689 unsigned long flags;
1690
1691 rtnl_lock();
1692 for_each_netdev(&init_net, ip_dev) {
1693 if ((((rdma_vlan_dev_vlan_id(ip_dev) < I40IW_NO_VLAN) &&
1694 (rdma_vlan_dev_real_dev(ip_dev) == iwdev->netdev)) ||
1695 (ip_dev == iwdev->netdev)) && (ip_dev->flags & IFF_UP)) {
1696 idev = __in6_dev_get(ip_dev);
1697 if (!idev) {
1698 i40iw_pr_err("idev == NULL\n");
1699 break;
1700 }
1701 list_for_each_entry_safe(ifp, tmp, &idev->addr_list, if_list) {
1702 i40iw_debug(&iwdev->sc_dev,
1703 I40IW_DEBUG_CM,
1704 "IP=%pI6, vlan_id=%d, MAC=%pM\n",
1705 &ifp->addr,
1706 rdma_vlan_dev_vlan_id(ip_dev),
1707 ip_dev->dev_addr);
1708 child_listen_node =
1709 kzalloc(sizeof(*child_listen_node), GFP_ATOMIC);
1710 i40iw_debug(&iwdev->sc_dev,
1711 I40IW_DEBUG_CM,
1712 "Allocating child listener %p\n",
1713 child_listen_node);
1714 if (!child_listen_node) {
1715 ret = I40IW_ERR_NO_MEMORY;
1716 goto exit;
1717 }
1718 cm_info->vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1719 cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1720
1721 memcpy(child_listen_node, cm_parent_listen_node,
1722 sizeof(*child_listen_node));
1723
1724 i40iw_copy_ip_ntohl(child_listen_node->loc_addr,
1725 ifp->addr.in6_u.u6_addr32);
1726 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1727 sizeof(cm_info->loc_addr));
1728
1729 ret = i40iw_manage_qhash(iwdev, cm_info,
1730 I40IW_QHASH_TYPE_TCP_SYN,
1731 I40IW_QHASH_MANAGE_TYPE_ADD,
1732 NULL, true);
1733 if (!ret) {
1734 child_listen_node->qhash_set = true;
1735 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1736 list_add(&child_listen_node->child_listen_list,
1737 &cm_parent_listen_node->child_listen_list);
1738 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1739 cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1740 } else {
1741 kfree(child_listen_node);
1742 }
1743 }
1744 }
1745 }
1746 exit:
1747 rtnl_unlock();
1748 return ret;
1749 }
1750
1751 /**
1752 * i40iw_add_mqh_4 - Adds multiple qhashes for IPv4
1753 * @iwdev: iWarp device
1754 * @cm_info: CM info for parent listen node
1755 * @cm_parent_listen_node: The parent listen node
1756 *
1757 * Adds a qhash and a child listen node for every IPv4 address
1758 * on the adapter and adds the associated qhash filter
1759 */
1760 static enum i40iw_status_code i40iw_add_mqh_4(
1761 struct i40iw_device *iwdev,
1762 struct i40iw_cm_info *cm_info,
1763 struct i40iw_cm_listener *cm_parent_listen_node)
1764 {
1765 struct net_device *dev;
1766 struct in_device *idev;
1767 struct i40iw_cm_listener *child_listen_node;
1768 enum i40iw_status_code ret = 0;
1769 unsigned long flags;
1770
1771 rtnl_lock();
1772 for_each_netdev(&init_net, dev) {
1773 if ((((rdma_vlan_dev_vlan_id(dev) < I40IW_NO_VLAN) &&
1774 (rdma_vlan_dev_real_dev(dev) == iwdev->netdev)) ||
1775 (dev == iwdev->netdev)) && (dev->flags & IFF_UP)) {
1776 const struct in_ifaddr *ifa;
1777
1778 idev = in_dev_get(dev);
1779
1780 in_dev_for_each_ifa_rtnl(ifa, idev) {
1781 i40iw_debug(&iwdev->sc_dev,
1782 I40IW_DEBUG_CM,
1783 "Allocating child CM Listener forIP=%pI4, vlan_id=%d, MAC=%pM\n",
1784 &ifa->ifa_address,
1785 rdma_vlan_dev_vlan_id(dev),
1786 dev->dev_addr);
1787 child_listen_node = kzalloc(sizeof(*child_listen_node), GFP_KERNEL);
1788 cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1789 i40iw_debug(&iwdev->sc_dev,
1790 I40IW_DEBUG_CM,
1791 "Allocating child listener %p\n",
1792 child_listen_node);
1793 if (!child_listen_node) {
1794 in_dev_put(idev);
1795 ret = I40IW_ERR_NO_MEMORY;
1796 goto exit;
1797 }
1798 cm_info->vlan_id = rdma_vlan_dev_vlan_id(dev);
1799 cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1800 memcpy(child_listen_node,
1801 cm_parent_listen_node,
1802 sizeof(*child_listen_node));
1803
1804 child_listen_node->loc_addr[0] = ntohl(ifa->ifa_address);
1805 memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1806 sizeof(cm_info->loc_addr));
1807
1808 ret = i40iw_manage_qhash(iwdev,
1809 cm_info,
1810 I40IW_QHASH_TYPE_TCP_SYN,
1811 I40IW_QHASH_MANAGE_TYPE_ADD,
1812 NULL,
1813 true);
1814 if (!ret) {
1815 child_listen_node->qhash_set = true;
1816 spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1817 list_add(&child_listen_node->child_listen_list,
1818 &cm_parent_listen_node->child_listen_list);
1819 spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1820 } else {
1821 kfree(child_listen_node);
1822 cm_parent_listen_node->cm_core->stats_listen_nodes_created--;
1823 }
1824 }
1825
1826 in_dev_put(idev);
1827 }
1828 }
1829 exit:
1830 rtnl_unlock();
1831 return ret;
1832 }
1833
1834 /**
1835 * i40iw_dec_refcnt_listen - delete listener and associated cm nodes
1836 * @cm_core: cm's core
1837 * @free_hanging_nodes: to free associated cm_nodes
1838 * @apbvt_del: flag to delete the apbvt
1839 */
1840 static int i40iw_dec_refcnt_listen(struct i40iw_cm_core *cm_core,
1841 struct i40iw_cm_listener *listener,
1842 int free_hanging_nodes, bool apbvt_del)
1843 {
1844 int ret = -EINVAL;
1845 int err = 0;
1846 struct list_head *list_pos;
1847 struct list_head *list_temp;
1848 struct i40iw_cm_node *cm_node;
1849 struct list_head reset_list;
1850 struct i40iw_cm_info nfo;
1851 struct i40iw_cm_node *loopback;
1852 enum i40iw_cm_node_state old_state;
1853 unsigned long flags;
1854
1855 /* free non-accelerated child nodes for this listener */
1856 INIT_LIST_HEAD(&reset_list);
1857 if (free_hanging_nodes) {
1858 spin_lock_irqsave(&cm_core->ht_lock, flags);
1859 list_for_each_safe(list_pos,
1860 list_temp, &cm_core->non_accelerated_list) {
1861 cm_node = container_of(list_pos, struct i40iw_cm_node, list);
1862 if ((cm_node->listener == listener) &&
1863 !cm_node->accelerated) {
1864 atomic_inc(&cm_node->ref_count);
1865 list_add(&cm_node->reset_entry, &reset_list);
1866 }
1867 }
1868 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1869 }
1870
1871 list_for_each_safe(list_pos, list_temp, &reset_list) {
1872 cm_node = container_of(list_pos, struct i40iw_cm_node, reset_entry);
1873 loopback = cm_node->loopbackpartner;
1874 if (cm_node->state >= I40IW_CM_STATE_FIN_WAIT1) {
1875 i40iw_rem_ref_cm_node(cm_node);
1876 } else {
1877 if (!loopback) {
1878 i40iw_cleanup_retrans_entry(cm_node);
1879 err = i40iw_send_reset(cm_node);
1880 if (err) {
1881 cm_node->state = I40IW_CM_STATE_CLOSED;
1882 i40iw_pr_err("send reset\n");
1883 } else {
1884 old_state = cm_node->state;
1885 cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1886 if (old_state != I40IW_CM_STATE_MPAREQ_RCVD)
1887 i40iw_rem_ref_cm_node(cm_node);
1888 }
1889 } else {
1890 struct i40iw_cm_event event;
1891
1892 event.cm_node = loopback;
1893 memcpy(event.cm_info.rem_addr,
1894 loopback->rem_addr, sizeof(event.cm_info.rem_addr));
1895 memcpy(event.cm_info.loc_addr,
1896 loopback->loc_addr, sizeof(event.cm_info.loc_addr));
1897 event.cm_info.rem_port = loopback->rem_port;
1898 event.cm_info.loc_port = loopback->loc_port;
1899 event.cm_info.cm_id = loopback->cm_id;
1900 event.cm_info.ipv4 = loopback->ipv4;
1901 atomic_inc(&loopback->ref_count);
1902 loopback->state = I40IW_CM_STATE_CLOSED;
1903 i40iw_event_connect_error(&event);
1904 cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1905 i40iw_rem_ref_cm_node(cm_node);
1906 }
1907 }
1908 }
1909
1910 if (!atomic_dec_return(&listener->ref_count)) {
1911 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1912 list_del(&listener->list);
1913 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1914
1915 if (listener->iwdev) {
1916 if (apbvt_del)
1917 i40iw_manage_apbvt(listener->iwdev,
1918 listener->loc_port,
1919 I40IW_MANAGE_APBVT_DEL);
1920
1921 memcpy(nfo.loc_addr, listener->loc_addr, sizeof(nfo.loc_addr));
1922 nfo.loc_port = listener->loc_port;
1923 nfo.ipv4 = listener->ipv4;
1924 nfo.vlan_id = listener->vlan_id;
1925 nfo.user_pri = listener->user_pri;
1926
1927 if (!list_empty(&listener->child_listen_list)) {
1928 i40iw_del_multiple_qhash(listener->iwdev, &nfo, listener);
1929 } else {
1930 if (listener->qhash_set)
1931 i40iw_manage_qhash(listener->iwdev,
1932 &nfo,
1933 I40IW_QHASH_TYPE_TCP_SYN,
1934 I40IW_QHASH_MANAGE_TYPE_DELETE,
1935 NULL,
1936 false);
1937 }
1938 }
1939
1940 cm_core->stats_listen_destroyed++;
1941 kfree(listener);
1942 cm_core->stats_listen_nodes_destroyed++;
1943 listener = NULL;
1944 ret = 0;
1945 }
1946
1947 if (listener) {
1948 if (atomic_read(&listener->pend_accepts_cnt) > 0)
1949 i40iw_debug(cm_core->dev,
1950 I40IW_DEBUG_CM,
1951 "%s: listener (%p) pending accepts=%u\n",
1952 __func__,
1953 listener,
1954 atomic_read(&listener->pend_accepts_cnt));
1955 }
1956
1957 return ret;
1958 }
1959
1960 /**
1961 * i40iw_cm_del_listen - delete a linstener
1962 * @cm_core: cm's core
1963 * @listener: passive connection's listener
1964 * @apbvt_del: flag to delete apbvt
1965 */
1966 static int i40iw_cm_del_listen(struct i40iw_cm_core *cm_core,
1967 struct i40iw_cm_listener *listener,
1968 bool apbvt_del)
1969 {
1970 listener->listener_state = I40IW_CM_LISTENER_PASSIVE_STATE;
1971 listener->cm_id = NULL; /* going to be destroyed pretty soon */
1972 return i40iw_dec_refcnt_listen(cm_core, listener, 1, apbvt_del);
1973 }
1974
1975 /**
1976 * i40iw_addr_resolve_neigh - resolve neighbor address
1977 * @iwdev: iwarp device structure
1978 * @src_ip: local ip address
1979 * @dst_ip: remote ip address
1980 * @arpindex: if there is an arp entry
1981 */
1982 static int i40iw_addr_resolve_neigh(struct i40iw_device *iwdev,
1983 u32 src_ip,
1984 u32 dst_ip,
1985 int arpindex)
1986 {
1987 struct rtable *rt;
1988 struct neighbour *neigh;
1989 int rc = arpindex;
1990 struct net_device *netdev = iwdev->netdev;
1991 __be32 dst_ipaddr = htonl(dst_ip);
1992 __be32 src_ipaddr = htonl(src_ip);
1993
1994 rt = ip_route_output(&init_net, dst_ipaddr, src_ipaddr, 0, 0);
1995 if (IS_ERR(rt)) {
1996 i40iw_pr_err("ip_route_output\n");
1997 return rc;
1998 }
1999
2000 if (netif_is_bond_slave(netdev))
2001 netdev = netdev_master_upper_dev_get(netdev);
2002
2003 neigh = dst_neigh_lookup(&rt->dst, &dst_ipaddr);
2004
2005 rcu_read_lock();
2006 if (neigh) {
2007 if (neigh->nud_state & NUD_VALID) {
2008 if (arpindex >= 0) {
2009 if (ether_addr_equal(iwdev->arp_table[arpindex].mac_addr,
2010 neigh->ha))
2011 /* Mac address same as arp table */
2012 goto resolve_neigh_exit;
2013 i40iw_manage_arp_cache(iwdev,
2014 iwdev->arp_table[arpindex].mac_addr,
2015 &dst_ip,
2016 true,
2017 I40IW_ARP_DELETE);
2018 }
2019
2020 i40iw_manage_arp_cache(iwdev, neigh->ha, &dst_ip, true, I40IW_ARP_ADD);
2021 rc = i40iw_arp_table(iwdev, &dst_ip, true, NULL, I40IW_ARP_RESOLVE);
2022 } else {
2023 neigh_event_send(neigh, NULL);
2024 }
2025 }
2026 resolve_neigh_exit:
2027
2028 rcu_read_unlock();
2029 if (neigh)
2030 neigh_release(neigh);
2031
2032 ip_rt_put(rt);
2033 return rc;
2034 }
2035
2036 /**
2037 * i40iw_get_dst_ipv6
2038 */
2039 static struct dst_entry *i40iw_get_dst_ipv6(struct sockaddr_in6 *src_addr,
2040 struct sockaddr_in6 *dst_addr)
2041 {
2042 struct dst_entry *dst;
2043 struct flowi6 fl6;
2044
2045 memset(&fl6, 0, sizeof(fl6));
2046 fl6.daddr = dst_addr->sin6_addr;
2047 fl6.saddr = src_addr->sin6_addr;
2048 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
2049 fl6.flowi6_oif = dst_addr->sin6_scope_id;
2050
2051 dst = ip6_route_output(&init_net, NULL, &fl6);
2052 return dst;
2053 }
2054
2055 /**
2056 * i40iw_addr_resolve_neigh_ipv6 - resolve neighbor ipv6 address
2057 * @iwdev: iwarp device structure
2058 * @dst_ip: remote ip address
2059 * @arpindex: if there is an arp entry
2060 */
2061 static int i40iw_addr_resolve_neigh_ipv6(struct i40iw_device *iwdev,
2062 u32 *src,
2063 u32 *dest,
2064 int arpindex)
2065 {
2066 struct neighbour *neigh;
2067 int rc = arpindex;
2068 struct net_device *netdev = iwdev->netdev;
2069 struct dst_entry *dst;
2070 struct sockaddr_in6 dst_addr;
2071 struct sockaddr_in6 src_addr;
2072
2073 memset(&dst_addr, 0, sizeof(dst_addr));
2074 dst_addr.sin6_family = AF_INET6;
2075 i40iw_copy_ip_htonl(dst_addr.sin6_addr.in6_u.u6_addr32, dest);
2076 memset(&src_addr, 0, sizeof(src_addr));
2077 src_addr.sin6_family = AF_INET6;
2078 i40iw_copy_ip_htonl(src_addr.sin6_addr.in6_u.u6_addr32, src);
2079 dst = i40iw_get_dst_ipv6(&src_addr, &dst_addr);
2080 if (!dst || dst->error) {
2081 if (dst) {
2082 i40iw_pr_err("ip6_route_output returned dst->error = %d\n",
2083 dst->error);
2084 dst_release(dst);
2085 }
2086 return rc;
2087 }
2088
2089 if (netif_is_bond_slave(netdev))
2090 netdev = netdev_master_upper_dev_get(netdev);
2091
2092 neigh = dst_neigh_lookup(dst, dst_addr.sin6_addr.in6_u.u6_addr32);
2093
2094 rcu_read_lock();
2095 if (neigh) {
2096 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "dst_neigh_lookup MAC=%pM\n", neigh->ha);
2097 if (neigh->nud_state & NUD_VALID) {
2098 if (arpindex >= 0) {
2099 if (ether_addr_equal
2100 (iwdev->arp_table[arpindex].mac_addr,
2101 neigh->ha)) {
2102 /* Mac address same as in arp table */
2103 goto resolve_neigh_exit6;
2104 }
2105 i40iw_manage_arp_cache(iwdev,
2106 iwdev->arp_table[arpindex].mac_addr,
2107 dest,
2108 false,
2109 I40IW_ARP_DELETE);
2110 }
2111 i40iw_manage_arp_cache(iwdev,
2112 neigh->ha,
2113 dest,
2114 false,
2115 I40IW_ARP_ADD);
2116 rc = i40iw_arp_table(iwdev,
2117 dest,
2118 false,
2119 NULL,
2120 I40IW_ARP_RESOLVE);
2121 } else {
2122 neigh_event_send(neigh, NULL);
2123 }
2124 }
2125
2126 resolve_neigh_exit6:
2127 rcu_read_unlock();
2128 if (neigh)
2129 neigh_release(neigh);
2130 dst_release(dst);
2131 return rc;
2132 }
2133
2134 /**
2135 * i40iw_ipv4_is_loopback - check if loopback
2136 * @loc_addr: local addr to compare
2137 * @rem_addr: remote address
2138 */
2139 static bool i40iw_ipv4_is_loopback(u32 loc_addr, u32 rem_addr)
2140 {
2141 return ipv4_is_loopback(htonl(rem_addr)) || (loc_addr == rem_addr);
2142 }
2143
2144 /**
2145 * i40iw_ipv6_is_loopback - check if loopback
2146 * @loc_addr: local addr to compare
2147 * @rem_addr: remote address
2148 */
2149 static bool i40iw_ipv6_is_loopback(u32 *loc_addr, u32 *rem_addr)
2150 {
2151 struct in6_addr raddr6;
2152
2153 i40iw_copy_ip_htonl(raddr6.in6_u.u6_addr32, rem_addr);
2154 return !memcmp(loc_addr, rem_addr, 16) || ipv6_addr_loopback(&raddr6);
2155 }
2156
2157 /**
2158 * i40iw_make_cm_node - create a new instance of a cm node
2159 * @cm_core: cm's core
2160 * @iwdev: iwarp device structure
2161 * @cm_info: quad info for connection
2162 * @listener: passive connection's listener
2163 */
2164 static struct i40iw_cm_node *i40iw_make_cm_node(
2165 struct i40iw_cm_core *cm_core,
2166 struct i40iw_device *iwdev,
2167 struct i40iw_cm_info *cm_info,
2168 struct i40iw_cm_listener *listener)
2169 {
2170 struct i40iw_cm_node *cm_node;
2171 int oldarpindex;
2172 int arpindex;
2173 struct net_device *netdev = iwdev->netdev;
2174
2175 /* create an hte and cm_node for this instance */
2176 cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
2177 if (!cm_node)
2178 return NULL;
2179
2180 /* set our node specific transport info */
2181 cm_node->ipv4 = cm_info->ipv4;
2182 cm_node->vlan_id = cm_info->vlan_id;
2183 if ((cm_node->vlan_id == I40IW_NO_VLAN) && iwdev->dcb)
2184 cm_node->vlan_id = 0;
2185 cm_node->tos = cm_info->tos;
2186 cm_node->user_pri = cm_info->user_pri;
2187 if (listener) {
2188 if (listener->tos != cm_info->tos)
2189 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB,
2190 "application TOS[%d] and remote client TOS[%d] mismatch\n",
2191 listener->tos, cm_info->tos);
2192 cm_node->tos = max(listener->tos, cm_info->tos);
2193 cm_node->user_pri = rt_tos2priority(cm_node->tos);
2194 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "listener: TOS:[%d] UP:[%d]\n",
2195 cm_node->tos, cm_node->user_pri);
2196 }
2197 memcpy(cm_node->loc_addr, cm_info->loc_addr, sizeof(cm_node->loc_addr));
2198 memcpy(cm_node->rem_addr, cm_info->rem_addr, sizeof(cm_node->rem_addr));
2199 cm_node->loc_port = cm_info->loc_port;
2200 cm_node->rem_port = cm_info->rem_port;
2201
2202 cm_node->mpa_frame_rev = iwdev->mpa_version;
2203 cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
2204 cm_node->ird_size = I40IW_MAX_IRD_SIZE;
2205 cm_node->ord_size = I40IW_MAX_ORD_SIZE;
2206
2207 cm_node->listener = listener;
2208 cm_node->cm_id = cm_info->cm_id;
2209 ether_addr_copy(cm_node->loc_mac, netdev->dev_addr);
2210 spin_lock_init(&cm_node->retrans_list_lock);
2211 cm_node->ack_rcvd = false;
2212
2213 atomic_set(&cm_node->ref_count, 1);
2214 /* associate our parent CM core */
2215 cm_node->cm_core = cm_core;
2216 cm_node->tcp_cntxt.loc_id = I40IW_CM_DEF_LOCAL_ID;
2217 cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2218 cm_node->tcp_cntxt.rcv_wnd =
2219 I40IW_CM_DEFAULT_RCV_WND_SCALED >> I40IW_CM_DEFAULT_RCV_WND_SCALE;
2220 if (cm_node->ipv4) {
2221 cm_node->tcp_cntxt.loc_seq_num = secure_tcp_seq(htonl(cm_node->loc_addr[0]),
2222 htonl(cm_node->rem_addr[0]),
2223 htons(cm_node->loc_port),
2224 htons(cm_node->rem_port));
2225 cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV4;
2226 } else if (IS_ENABLED(CONFIG_IPV6)) {
2227 __be32 loc[4] = {
2228 htonl(cm_node->loc_addr[0]), htonl(cm_node->loc_addr[1]),
2229 htonl(cm_node->loc_addr[2]), htonl(cm_node->loc_addr[3])
2230 };
2231 __be32 rem[4] = {
2232 htonl(cm_node->rem_addr[0]), htonl(cm_node->rem_addr[1]),
2233 htonl(cm_node->rem_addr[2]), htonl(cm_node->rem_addr[3])
2234 };
2235 cm_node->tcp_cntxt.loc_seq_num = secure_tcpv6_seq(loc, rem,
2236 htons(cm_node->loc_port),
2237 htons(cm_node->rem_port));
2238 cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV6;
2239 }
2240
2241 cm_node->iwdev = iwdev;
2242 cm_node->dev = &iwdev->sc_dev;
2243
2244 if ((cm_node->ipv4 &&
2245 i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
2246 (!cm_node->ipv4 && i40iw_ipv6_is_loopback(cm_node->loc_addr,
2247 cm_node->rem_addr))) {
2248 arpindex = i40iw_arp_table(iwdev,
2249 cm_node->rem_addr,
2250 false,
2251 NULL,
2252 I40IW_ARP_RESOLVE);
2253 } else {
2254 oldarpindex = i40iw_arp_table(iwdev,
2255 cm_node->rem_addr,
2256 false,
2257 NULL,
2258 I40IW_ARP_RESOLVE);
2259 if (cm_node->ipv4)
2260 arpindex = i40iw_addr_resolve_neigh(iwdev,
2261 cm_info->loc_addr[0],
2262 cm_info->rem_addr[0],
2263 oldarpindex);
2264 else if (IS_ENABLED(CONFIG_IPV6))
2265 arpindex = i40iw_addr_resolve_neigh_ipv6(iwdev,
2266 cm_info->loc_addr,
2267 cm_info->rem_addr,
2268 oldarpindex);
2269 else
2270 arpindex = -EINVAL;
2271 }
2272 if (arpindex < 0) {
2273 i40iw_pr_err("cm_node arpindex\n");
2274 kfree(cm_node);
2275 return NULL;
2276 }
2277 ether_addr_copy(cm_node->rem_mac, iwdev->arp_table[arpindex].mac_addr);
2278 i40iw_add_hte_node(cm_core, cm_node);
2279 cm_core->stats_nodes_created++;
2280 return cm_node;
2281 }
2282
2283 /**
2284 * i40iw_rem_ref_cm_node - destroy an instance of a cm node
2285 * @cm_node: connection's node
2286 */
2287 static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *cm_node)
2288 {
2289 struct i40iw_cm_core *cm_core = cm_node->cm_core;
2290 struct i40iw_qp *iwqp;
2291 struct i40iw_cm_info nfo;
2292 unsigned long flags;
2293
2294 spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
2295 if (atomic_dec_return(&cm_node->ref_count)) {
2296 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2297 return;
2298 }
2299 list_del(&cm_node->list);
2300 spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2301
2302 /* if the node is destroyed before connection was accelerated */
2303 if (!cm_node->accelerated && cm_node->accept_pend) {
2304 pr_err("node destroyed before established\n");
2305 atomic_dec(&cm_node->listener->pend_accepts_cnt);
2306 }
2307 if (cm_node->close_entry)
2308 i40iw_handle_close_entry(cm_node, 0);
2309 if (cm_node->listener) {
2310 i40iw_dec_refcnt_listen(cm_core, cm_node->listener, 0, true);
2311 } else {
2312 if (cm_node->apbvt_set) {
2313 i40iw_manage_apbvt(cm_node->iwdev,
2314 cm_node->loc_port,
2315 I40IW_MANAGE_APBVT_DEL);
2316 cm_node->apbvt_set = 0;
2317 }
2318 i40iw_get_addr_info(cm_node, &nfo);
2319 if (cm_node->qhash_set) {
2320 i40iw_manage_qhash(cm_node->iwdev,
2321 &nfo,
2322 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2323 I40IW_QHASH_MANAGE_TYPE_DELETE,
2324 NULL,
2325 false);
2326 cm_node->qhash_set = 0;
2327 }
2328 }
2329
2330 iwqp = cm_node->iwqp;
2331 if (iwqp) {
2332 iwqp->cm_node = NULL;
2333 i40iw_rem_ref(&iwqp->ibqp);
2334 cm_node->iwqp = NULL;
2335 } else if (cm_node->qhash_set) {
2336 i40iw_get_addr_info(cm_node, &nfo);
2337 i40iw_manage_qhash(cm_node->iwdev,
2338 &nfo,
2339 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2340 I40IW_QHASH_MANAGE_TYPE_DELETE,
2341 NULL,
2342 false);
2343 cm_node->qhash_set = 0;
2344 }
2345
2346 cm_node->cm_core->stats_nodes_destroyed++;
2347 kfree(cm_node);
2348 }
2349
2350 /**
2351 * i40iw_handle_fin_pkt - FIN packet received
2352 * @cm_node: connection's node
2353 */
2354 static void i40iw_handle_fin_pkt(struct i40iw_cm_node *cm_node)
2355 {
2356 u32 ret;
2357
2358 switch (cm_node->state) {
2359 case I40IW_CM_STATE_SYN_RCVD:
2360 case I40IW_CM_STATE_SYN_SENT:
2361 case I40IW_CM_STATE_ESTABLISHED:
2362 case I40IW_CM_STATE_MPAREJ_RCVD:
2363 cm_node->tcp_cntxt.rcv_nxt++;
2364 i40iw_cleanup_retrans_entry(cm_node);
2365 cm_node->state = I40IW_CM_STATE_LAST_ACK;
2366 i40iw_send_fin(cm_node);
2367 break;
2368 case I40IW_CM_STATE_MPAREQ_SENT:
2369 i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
2370 cm_node->tcp_cntxt.rcv_nxt++;
2371 i40iw_cleanup_retrans_entry(cm_node);
2372 cm_node->state = I40IW_CM_STATE_CLOSED;
2373 atomic_inc(&cm_node->ref_count);
2374 i40iw_send_reset(cm_node);
2375 break;
2376 case I40IW_CM_STATE_FIN_WAIT1:
2377 cm_node->tcp_cntxt.rcv_nxt++;
2378 i40iw_cleanup_retrans_entry(cm_node);
2379 cm_node->state = I40IW_CM_STATE_CLOSING;
2380 i40iw_send_ack(cm_node);
2381 /*
2382 * Wait for ACK as this is simultaneous close.
2383 * After we receive ACK, do not send anything.
2384 * Just rm the node.
2385 */
2386 break;
2387 case I40IW_CM_STATE_FIN_WAIT2:
2388 cm_node->tcp_cntxt.rcv_nxt++;
2389 i40iw_cleanup_retrans_entry(cm_node);
2390 cm_node->state = I40IW_CM_STATE_TIME_WAIT;
2391 i40iw_send_ack(cm_node);
2392 ret =
2393 i40iw_schedule_cm_timer(cm_node, NULL, I40IW_TIMER_TYPE_CLOSE, 1, 0);
2394 if (ret)
2395 i40iw_pr_err("node %p state = %d\n", cm_node, cm_node->state);
2396 break;
2397 case I40IW_CM_STATE_TIME_WAIT:
2398 cm_node->tcp_cntxt.rcv_nxt++;
2399 i40iw_cleanup_retrans_entry(cm_node);
2400 cm_node->state = I40IW_CM_STATE_CLOSED;
2401 i40iw_rem_ref_cm_node(cm_node);
2402 break;
2403 case I40IW_CM_STATE_OFFLOADED:
2404 default:
2405 i40iw_pr_err("bad state node %p state = %d\n", cm_node, cm_node->state);
2406 break;
2407 }
2408 }
2409
2410 /**
2411 * i40iw_handle_rst_pkt - process received RST packet
2412 * @cm_node: connection's node
2413 * @rbuf: receive buffer
2414 */
2415 static void i40iw_handle_rst_pkt(struct i40iw_cm_node *cm_node,
2416 struct i40iw_puda_buf *rbuf)
2417 {
2418 i40iw_cleanup_retrans_entry(cm_node);
2419 switch (cm_node->state) {
2420 case I40IW_CM_STATE_SYN_SENT:
2421 case I40IW_CM_STATE_MPAREQ_SENT:
2422 switch (cm_node->mpa_frame_rev) {
2423 case IETF_MPA_V2:
2424 cm_node->mpa_frame_rev = IETF_MPA_V1;
2425 /* send a syn and goto syn sent state */
2426 cm_node->state = I40IW_CM_STATE_SYN_SENT;
2427 if (i40iw_send_syn(cm_node, 0))
2428 i40iw_active_open_err(cm_node, false);
2429 break;
2430 case IETF_MPA_V1:
2431 default:
2432 i40iw_active_open_err(cm_node, false);
2433 break;
2434 }
2435 break;
2436 case I40IW_CM_STATE_MPAREQ_RCVD:
2437 atomic_add_return(1, &cm_node->passive_state);
2438 break;
2439 case I40IW_CM_STATE_ESTABLISHED:
2440 case I40IW_CM_STATE_SYN_RCVD:
2441 case I40IW_CM_STATE_LISTENING:
2442 i40iw_pr_err("Bad state state = %d\n", cm_node->state);
2443 i40iw_passive_open_err(cm_node, false);
2444 break;
2445 case I40IW_CM_STATE_OFFLOADED:
2446 i40iw_active_open_err(cm_node, false);
2447 break;
2448 case I40IW_CM_STATE_CLOSED:
2449 break;
2450 case I40IW_CM_STATE_FIN_WAIT2:
2451 case I40IW_CM_STATE_FIN_WAIT1:
2452 case I40IW_CM_STATE_LAST_ACK:
2453 cm_node->cm_id->rem_ref(cm_node->cm_id);
2454 /* fall through */
2455 case I40IW_CM_STATE_TIME_WAIT:
2456 cm_node->state = I40IW_CM_STATE_CLOSED;
2457 i40iw_rem_ref_cm_node(cm_node);
2458 break;
2459 default:
2460 break;
2461 }
2462 }
2463
2464 /**
2465 * i40iw_handle_rcv_mpa - Process a recv'd mpa buffer
2466 * @cm_node: connection's node
2467 * @rbuf: receive buffer
2468 */
2469 static void i40iw_handle_rcv_mpa(struct i40iw_cm_node *cm_node,
2470 struct i40iw_puda_buf *rbuf)
2471 {
2472 int ret;
2473 int datasize = rbuf->datalen;
2474 u8 *dataloc = rbuf->data;
2475
2476 enum i40iw_cm_event_type type = I40IW_CM_EVENT_UNKNOWN;
2477 u32 res_type;
2478
2479 ret = i40iw_parse_mpa(cm_node, dataloc, &res_type, datasize);
2480 if (ret) {
2481 if (cm_node->state == I40IW_CM_STATE_MPAREQ_SENT)
2482 i40iw_active_open_err(cm_node, true);
2483 else
2484 i40iw_passive_open_err(cm_node, true);
2485 return;
2486 }
2487
2488 switch (cm_node->state) {
2489 case I40IW_CM_STATE_ESTABLISHED:
2490 if (res_type == I40IW_MPA_REQUEST_REJECT)
2491 i40iw_pr_err("state for reject\n");
2492 cm_node->state = I40IW_CM_STATE_MPAREQ_RCVD;
2493 type = I40IW_CM_EVENT_MPA_REQ;
2494 i40iw_send_ack(cm_node); /* ACK received MPA request */
2495 atomic_set(&cm_node->passive_state,
2496 I40IW_PASSIVE_STATE_INDICATED);
2497 break;
2498 case I40IW_CM_STATE_MPAREQ_SENT:
2499 i40iw_cleanup_retrans_entry(cm_node);
2500 if (res_type == I40IW_MPA_REQUEST_REJECT) {
2501 type = I40IW_CM_EVENT_MPA_REJECT;
2502 cm_node->state = I40IW_CM_STATE_MPAREJ_RCVD;
2503 } else {
2504 type = I40IW_CM_EVENT_CONNECTED;
2505 cm_node->state = I40IW_CM_STATE_OFFLOADED;
2506 }
2507 i40iw_send_ack(cm_node);
2508 break;
2509 default:
2510 pr_err("%s wrong cm_node state =%d\n", __func__, cm_node->state);
2511 break;
2512 }
2513 i40iw_create_event(cm_node, type);
2514 }
2515
2516 /**
2517 * i40iw_indicate_pkt_err - Send up err event to cm
2518 * @cm_node: connection's node
2519 */
2520 static void i40iw_indicate_pkt_err(struct i40iw_cm_node *cm_node)
2521 {
2522 switch (cm_node->state) {
2523 case I40IW_CM_STATE_SYN_SENT:
2524 case I40IW_CM_STATE_MPAREQ_SENT:
2525 i40iw_active_open_err(cm_node, true);
2526 break;
2527 case I40IW_CM_STATE_ESTABLISHED:
2528 case I40IW_CM_STATE_SYN_RCVD:
2529 i40iw_passive_open_err(cm_node, true);
2530 break;
2531 case I40IW_CM_STATE_OFFLOADED:
2532 default:
2533 break;
2534 }
2535 }
2536
2537 /**
2538 * i40iw_check_syn - Check for error on received syn ack
2539 * @cm_node: connection's node
2540 * @tcph: pointer tcp header
2541 */
2542 static int i40iw_check_syn(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2543 {
2544 int err = 0;
2545
2546 if (ntohl(tcph->ack_seq) != cm_node->tcp_cntxt.loc_seq_num) {
2547 err = 1;
2548 i40iw_active_open_err(cm_node, true);
2549 }
2550 return err;
2551 }
2552
2553 /**
2554 * i40iw_check_seq - check seq numbers if OK
2555 * @cm_node: connection's node
2556 * @tcph: pointer tcp header
2557 */
2558 static int i40iw_check_seq(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2559 {
2560 int err = 0;
2561 u32 seq;
2562 u32 ack_seq;
2563 u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
2564 u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
2565 u32 rcv_wnd;
2566
2567 seq = ntohl(tcph->seq);
2568 ack_seq = ntohl(tcph->ack_seq);
2569 rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
2570 if (ack_seq != loc_seq_num)
2571 err = -1;
2572 else if (!between(seq, rcv_nxt, (rcv_nxt + rcv_wnd)))
2573 err = -1;
2574 if (err) {
2575 i40iw_pr_err("seq number\n");
2576 i40iw_indicate_pkt_err(cm_node);
2577 }
2578 return err;
2579 }
2580
2581 /**
2582 * i40iw_handle_syn_pkt - is for Passive node
2583 * @cm_node: connection's node
2584 * @rbuf: receive buffer
2585 */
2586 static void i40iw_handle_syn_pkt(struct i40iw_cm_node *cm_node,
2587 struct i40iw_puda_buf *rbuf)
2588 {
2589 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2590 int ret;
2591 u32 inc_sequence;
2592 int optionsize;
2593 struct i40iw_cm_info nfo;
2594
2595 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2596 inc_sequence = ntohl(tcph->seq);
2597
2598 switch (cm_node->state) {
2599 case I40IW_CM_STATE_SYN_SENT:
2600 case I40IW_CM_STATE_MPAREQ_SENT:
2601 /* Rcvd syn on active open connection */
2602 i40iw_active_open_err(cm_node, 1);
2603 break;
2604 case I40IW_CM_STATE_LISTENING:
2605 /* Passive OPEN */
2606 if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
2607 cm_node->listener->backlog) {
2608 cm_node->cm_core->stats_backlog_drops++;
2609 i40iw_passive_open_err(cm_node, false);
2610 break;
2611 }
2612 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2613 if (ret) {
2614 i40iw_passive_open_err(cm_node, false);
2615 /* drop pkt */
2616 break;
2617 }
2618 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2619 cm_node->accept_pend = 1;
2620 atomic_inc(&cm_node->listener->pend_accepts_cnt);
2621
2622 cm_node->state = I40IW_CM_STATE_SYN_RCVD;
2623 i40iw_get_addr_info(cm_node, &nfo);
2624 ret = i40iw_manage_qhash(cm_node->iwdev,
2625 &nfo,
2626 I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2627 I40IW_QHASH_MANAGE_TYPE_ADD,
2628 (void *)cm_node,
2629 false);
2630 cm_node->qhash_set = true;
2631 break;
2632 case I40IW_CM_STATE_CLOSED:
2633 i40iw_cleanup_retrans_entry(cm_node);
2634 atomic_inc(&cm_node->ref_count);
2635 i40iw_send_reset(cm_node);
2636 break;
2637 case I40IW_CM_STATE_OFFLOADED:
2638 case I40IW_CM_STATE_ESTABLISHED:
2639 case I40IW_CM_STATE_FIN_WAIT1:
2640 case I40IW_CM_STATE_FIN_WAIT2:
2641 case I40IW_CM_STATE_MPAREQ_RCVD:
2642 case I40IW_CM_STATE_LAST_ACK:
2643 case I40IW_CM_STATE_CLOSING:
2644 case I40IW_CM_STATE_UNKNOWN:
2645 default:
2646 break;
2647 }
2648 }
2649
2650 /**
2651 * i40iw_handle_synack_pkt - Process SYN+ACK packet (active side)
2652 * @cm_node: connection's node
2653 * @rbuf: receive buffer
2654 */
2655 static void i40iw_handle_synack_pkt(struct i40iw_cm_node *cm_node,
2656 struct i40iw_puda_buf *rbuf)
2657 {
2658 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2659 int ret;
2660 u32 inc_sequence;
2661 int optionsize;
2662
2663 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2664 inc_sequence = ntohl(tcph->seq);
2665 switch (cm_node->state) {
2666 case I40IW_CM_STATE_SYN_SENT:
2667 i40iw_cleanup_retrans_entry(cm_node);
2668 /* active open */
2669 if (i40iw_check_syn(cm_node, tcph)) {
2670 i40iw_pr_err("check syn fail\n");
2671 return;
2672 }
2673 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2674 /* setup options */
2675 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 0);
2676 if (ret) {
2677 i40iw_debug(cm_node->dev,
2678 I40IW_DEBUG_CM,
2679 "cm_node=%p tcp_options failed\n",
2680 cm_node);
2681 break;
2682 }
2683 i40iw_cleanup_retrans_entry(cm_node);
2684 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2685 i40iw_send_ack(cm_node); /* ACK for the syn_ack */
2686 ret = i40iw_send_mpa_request(cm_node);
2687 if (ret) {
2688 i40iw_debug(cm_node->dev,
2689 I40IW_DEBUG_CM,
2690 "cm_node=%p i40iw_send_mpa_request failed\n",
2691 cm_node);
2692 break;
2693 }
2694 cm_node->state = I40IW_CM_STATE_MPAREQ_SENT;
2695 break;
2696 case I40IW_CM_STATE_MPAREQ_RCVD:
2697 i40iw_passive_open_err(cm_node, true);
2698 break;
2699 case I40IW_CM_STATE_LISTENING:
2700 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2701 i40iw_cleanup_retrans_entry(cm_node);
2702 cm_node->state = I40IW_CM_STATE_CLOSED;
2703 i40iw_send_reset(cm_node);
2704 break;
2705 case I40IW_CM_STATE_CLOSED:
2706 cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2707 i40iw_cleanup_retrans_entry(cm_node);
2708 atomic_inc(&cm_node->ref_count);
2709 i40iw_send_reset(cm_node);
2710 break;
2711 case I40IW_CM_STATE_ESTABLISHED:
2712 case I40IW_CM_STATE_FIN_WAIT1:
2713 case I40IW_CM_STATE_FIN_WAIT2:
2714 case I40IW_CM_STATE_LAST_ACK:
2715 case I40IW_CM_STATE_OFFLOADED:
2716 case I40IW_CM_STATE_CLOSING:
2717 case I40IW_CM_STATE_UNKNOWN:
2718 case I40IW_CM_STATE_MPAREQ_SENT:
2719 default:
2720 break;
2721 }
2722 }
2723
2724 /**
2725 * i40iw_handle_ack_pkt - process packet with ACK
2726 * @cm_node: connection's node
2727 * @rbuf: receive buffer
2728 */
2729 static int i40iw_handle_ack_pkt(struct i40iw_cm_node *cm_node,
2730 struct i40iw_puda_buf *rbuf)
2731 {
2732 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2733 u32 inc_sequence;
2734 int ret = 0;
2735 int optionsize;
2736 u32 datasize = rbuf->datalen;
2737
2738 optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2739
2740 if (i40iw_check_seq(cm_node, tcph))
2741 return -EINVAL;
2742
2743 inc_sequence = ntohl(tcph->seq);
2744 switch (cm_node->state) {
2745 case I40IW_CM_STATE_SYN_RCVD:
2746 i40iw_cleanup_retrans_entry(cm_node);
2747 ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2748 if (ret)
2749 break;
2750 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2751 cm_node->state = I40IW_CM_STATE_ESTABLISHED;
2752 if (datasize) {
2753 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2754 i40iw_handle_rcv_mpa(cm_node, rbuf);
2755 }
2756 break;
2757 case I40IW_CM_STATE_ESTABLISHED:
2758 i40iw_cleanup_retrans_entry(cm_node);
2759 if (datasize) {
2760 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2761 i40iw_handle_rcv_mpa(cm_node, rbuf);
2762 }
2763 break;
2764 case I40IW_CM_STATE_MPAREQ_SENT:
2765 cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2766 if (datasize) {
2767 cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2768 cm_node->ack_rcvd = false;
2769 i40iw_handle_rcv_mpa(cm_node, rbuf);
2770 } else {
2771 cm_node->ack_rcvd = true;
2772 }
2773 break;
2774 case I40IW_CM_STATE_LISTENING:
2775 i40iw_cleanup_retrans_entry(cm_node);
2776 cm_node->state = I40IW_CM_STATE_CLOSED;
2777 i40iw_send_reset(cm_node);
2778 break;
2779 case I40IW_CM_STATE_CLOSED:
2780 i40iw_cleanup_retrans_entry(cm_node);
2781 atomic_inc(&cm_node->ref_count);
2782 i40iw_send_reset(cm_node);
2783 break;
2784 case I40IW_CM_STATE_LAST_ACK:
2785 case I40IW_CM_STATE_CLOSING:
2786 i40iw_cleanup_retrans_entry(cm_node);
2787 cm_node->state = I40IW_CM_STATE_CLOSED;
2788 if (!cm_node->accept_pend)
2789 cm_node->cm_id->rem_ref(cm_node->cm_id);
2790 i40iw_rem_ref_cm_node(cm_node);
2791 break;
2792 case I40IW_CM_STATE_FIN_WAIT1:
2793 i40iw_cleanup_retrans_entry(cm_node);
2794 cm_node->state = I40IW_CM_STATE_FIN_WAIT2;
2795 break;
2796 case I40IW_CM_STATE_SYN_SENT:
2797 case I40IW_CM_STATE_FIN_WAIT2:
2798 case I40IW_CM_STATE_OFFLOADED:
2799 case I40IW_CM_STATE_MPAREQ_RCVD:
2800 case I40IW_CM_STATE_UNKNOWN:
2801 default:
2802 i40iw_cleanup_retrans_entry(cm_node);
2803 break;
2804 }
2805 return ret;
2806 }
2807
2808 /**
2809 * i40iw_process_packet - process cm packet
2810 * @cm_node: connection's node
2811 * @rbuf: receive buffer
2812 */
2813 static void i40iw_process_packet(struct i40iw_cm_node *cm_node,
2814 struct i40iw_puda_buf *rbuf)
2815 {
2816 enum i40iw_tcpip_pkt_type pkt_type = I40IW_PKT_TYPE_UNKNOWN;
2817 struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2818 u32 fin_set = 0;
2819 int ret;
2820
2821 if (tcph->rst) {
2822 pkt_type = I40IW_PKT_TYPE_RST;
2823 } else if (tcph->syn) {
2824 pkt_type = I40IW_PKT_TYPE_SYN;
2825 if (tcph->ack)
2826 pkt_type = I40IW_PKT_TYPE_SYNACK;
2827 } else if (tcph->ack) {
2828 pkt_type = I40IW_PKT_TYPE_ACK;
2829 }
2830 if (tcph->fin)
2831 fin_set = 1;
2832
2833 switch (pkt_type) {
2834 case I40IW_PKT_TYPE_SYN:
2835 i40iw_handle_syn_pkt(cm_node, rbuf);
2836 break;
2837 case I40IW_PKT_TYPE_SYNACK:
2838 i40iw_handle_synack_pkt(cm_node, rbuf);
2839 break;
2840 case I40IW_PKT_TYPE_ACK:
2841 ret = i40iw_handle_ack_pkt(cm_node, rbuf);
2842 if (fin_set && !ret)
2843 i40iw_handle_fin_pkt(cm_node);
2844 break;
2845 case I40IW_PKT_TYPE_RST:
2846 i40iw_handle_rst_pkt(cm_node, rbuf);
2847 break;
2848 default:
2849 if (fin_set &&
2850 (!i40iw_check_seq(cm_node, (struct tcphdr *)rbuf->tcph)))
2851 i40iw_handle_fin_pkt(cm_node);
2852 break;
2853 }
2854 }
2855
2856 /**
2857 * i40iw_make_listen_node - create a listen node with params
2858 * @cm_core: cm's core
2859 * @iwdev: iwarp device structure
2860 * @cm_info: quad info for connection
2861 */
2862 static struct i40iw_cm_listener *i40iw_make_listen_node(
2863 struct i40iw_cm_core *cm_core,
2864 struct i40iw_device *iwdev,
2865 struct i40iw_cm_info *cm_info)
2866 {
2867 struct i40iw_cm_listener *listener;
2868 unsigned long flags;
2869
2870 /* cannot have multiple matching listeners */
2871 listener = i40iw_find_listener(cm_core, cm_info->loc_addr,
2872 cm_info->loc_port,
2873 cm_info->vlan_id,
2874 I40IW_CM_LISTENER_EITHER_STATE);
2875 if (listener &&
2876 (listener->listener_state == I40IW_CM_LISTENER_ACTIVE_STATE)) {
2877 atomic_dec(&listener->ref_count);
2878 i40iw_debug(cm_core->dev,
2879 I40IW_DEBUG_CM,
2880 "Not creating listener since it already exists\n");
2881 return NULL;
2882 }
2883
2884 if (!listener) {
2885 /* create a CM listen node (1/2 node to compare incoming traffic to) */
2886 listener = kzalloc(sizeof(*listener), GFP_KERNEL);
2887 if (!listener)
2888 return NULL;
2889 cm_core->stats_listen_nodes_created++;
2890 memcpy(listener->loc_addr, cm_info->loc_addr, sizeof(listener->loc_addr));
2891 listener->loc_port = cm_info->loc_port;
2892
2893 INIT_LIST_HEAD(&listener->child_listen_list);
2894
2895 atomic_set(&listener->ref_count, 1);
2896 } else {
2897 listener->reused_node = 1;
2898 }
2899
2900 listener->cm_id = cm_info->cm_id;
2901 listener->ipv4 = cm_info->ipv4;
2902 listener->vlan_id = cm_info->vlan_id;
2903 atomic_set(&listener->pend_accepts_cnt, 0);
2904 listener->cm_core = cm_core;
2905 listener->iwdev = iwdev;
2906
2907 listener->backlog = cm_info->backlog;
2908 listener->listener_state = I40IW_CM_LISTENER_ACTIVE_STATE;
2909
2910 if (!listener->reused_node) {
2911 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
2912 list_add(&listener->list, &cm_core->listen_nodes);
2913 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
2914 }
2915
2916 return listener;
2917 }
2918
/**
 * i40iw_create_cm_node - make a connection node with params
 * @cm_core: cm's core
 * @iwdev: iwarp device structure
 * @conn_param: upper layer connection parameters
 * @cm_info: quad info for connection
 *
 * Creates the active-side (client) node. When the local and remote
 * addresses in @cm_info are identical the connection is a loopback: an
 * active listener on the remote port must exist, a second node is created
 * for the listener's side, the two are linked as loopback partners, and the
 * client node goes straight to the OFFLOADED state. Otherwise the private
 * data is copied into the node and it is left in the SYN_SENT state.
 *
 * Returns the client node on success, ERR_PTR(-ENOMEM) if a node could not
 * be created, or ERR_PTR(-ECONNREFUSED) if a loopback connection has no
 * active listener.
 */
static struct i40iw_cm_node *i40iw_create_cm_node(
					struct i40iw_cm_core *cm_core,
					struct i40iw_device *iwdev,
					struct iw_cm_conn_param *conn_param,
					struct i40iw_cm_info *cm_info)
{
	struct i40iw_cm_node *cm_node;
	struct i40iw_cm_listener *loopback_remotelistener;
	struct i40iw_cm_node *loopback_remotenode;
	struct i40iw_cm_info loopback_cm_info;

	u16 private_data_len = conn_param->private_data_len;
	const void *private_data = conn_param->private_data;

	/* create a CM connection node */
	cm_node = i40iw_make_cm_node(cm_core, iwdev, cm_info, NULL);
	if (!cm_node)
		return ERR_PTR(-ENOMEM);
	/* set our node side to client (active) side */
	cm_node->tcp_cntxt.client = 1;
	cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;

	i40iw_record_ird_ord(cm_node, conn_param->ird, conn_param->ord);

	if (!memcmp(cm_info->loc_addr, cm_info->rem_addr, sizeof(cm_info->loc_addr))) {
		loopback_remotelistener = i40iw_find_listener(
						cm_core,
						cm_info->rem_addr,
						cm_node->rem_port,
						cm_node->vlan_id,
						I40IW_CM_LISTENER_ACTIVE_STATE);
		if (!loopback_remotelistener) {
			i40iw_rem_ref_cm_node(cm_node);
			return ERR_PTR(-ECONNREFUSED);
		}

		/* the peer node sees the same quad with the ports swapped */
		loopback_cm_info = *cm_info;
		loopback_cm_info.loc_port = cm_info->rem_port;
		loopback_cm_info.rem_port = cm_info->loc_port;
		loopback_cm_info.cm_id = loopback_remotelistener->cm_id;
		loopback_cm_info.ipv4 = cm_info->ipv4;
		loopback_remotenode = i40iw_make_cm_node(cm_core,
							 iwdev,
							 &loopback_cm_info,
							 loopback_remotelistener);
		if (!loopback_remotenode) {
			/*
			 * No node took over the listener reference obtained
			 * from i40iw_find_listener(), so drop it here, as
			 * the receive path does on the same failure.
			 */
			atomic_dec(&loopback_remotelistener->ref_count);
			i40iw_rem_ref_cm_node(cm_node);
			return ERR_PTR(-ENOMEM);
		}
		cm_core->stats_loopbacks++;
		loopback_remotenode->loopbackpartner = cm_node;
		loopback_remotenode->tcp_cntxt.rcv_wscale =
			I40IW_CM_DEFAULT_RCV_WND_SCALE;
		cm_node->loopbackpartner = loopback_remotenode;
		memcpy(loopback_remotenode->pdata_buf, private_data,
		       private_data_len);
		loopback_remotenode->pdata.size = private_data_len;

		/* the peer's ORD may not exceed what this side accepts as IRD */
		if (loopback_remotenode->ord_size > cm_node->ird_size)
			loopback_remotenode->ord_size =
				cm_node->ird_size;

		cm_node->state = I40IW_CM_STATE_OFFLOADED;

		/* cross-wire the TCP contexts of the two partners */
		cm_node->tcp_cntxt.rcv_nxt =
			loopback_remotenode->tcp_cntxt.loc_seq_num;
		loopback_remotenode->tcp_cntxt.rcv_nxt =
			cm_node->tcp_cntxt.loc_seq_num;
		cm_node->tcp_cntxt.max_snd_wnd =
			loopback_remotenode->tcp_cntxt.rcv_wnd;
		loopback_remotenode->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
		cm_node->tcp_cntxt.snd_wnd = loopback_remotenode->tcp_cntxt.rcv_wnd;
		loopback_remotenode->tcp_cntxt.snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
		cm_node->tcp_cntxt.snd_wscale = loopback_remotenode->tcp_cntxt.rcv_wscale;
		loopback_remotenode->tcp_cntxt.snd_wscale = cm_node->tcp_cntxt.rcv_wscale;
		return cm_node;
	}

	/* regular connection: stash the private data for the MPA request */
	cm_node->pdata.size = private_data_len;
	cm_node->pdata.addr = cm_node->pdata_buf;

	memcpy(cm_node->pdata_buf, private_data, private_data_len);

	cm_node->state = I40IW_CM_STATE_SYN_SENT;
	return cm_node;
}
3011
3012 /**
3013 * i40iw_cm_reject - reject and teardown a connection
3014 * @cm_node: connection's node
3015 * @pdate: ptr to private data for reject
3016 * @plen: size of private data
3017 */
3018 static int i40iw_cm_reject(struct i40iw_cm_node *cm_node, const void *pdata, u8 plen)
3019 {
3020 int ret = 0;
3021 int err;
3022 int passive_state;
3023 struct iw_cm_id *cm_id = cm_node->cm_id;
3024 struct i40iw_cm_node *loopback = cm_node->loopbackpartner;
3025
3026 if (cm_node->tcp_cntxt.client)
3027 return ret;
3028 i40iw_cleanup_retrans_entry(cm_node);
3029
3030 if (!loopback) {
3031 passive_state = atomic_add_return(1, &cm_node->passive_state);
3032 if (passive_state == I40IW_SEND_RESET_EVENT) {
3033 cm_node->state = I40IW_CM_STATE_CLOSED;
3034 i40iw_rem_ref_cm_node(cm_node);
3035 } else {
3036 if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3037 i40iw_rem_ref_cm_node(cm_node);
3038 } else {
3039 ret = i40iw_send_mpa_reject(cm_node, pdata, plen);
3040 if (ret) {
3041 cm_node->state = I40IW_CM_STATE_CLOSED;
3042 err = i40iw_send_reset(cm_node);
3043 if (err)
3044 i40iw_pr_err("send reset failed\n");
3045 } else {
3046 cm_id->add_ref(cm_id);
3047 }
3048 }
3049 }
3050 } else {
3051 cm_node->cm_id = NULL;
3052 if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3053 i40iw_rem_ref_cm_node(cm_node);
3054 i40iw_rem_ref_cm_node(loopback);
3055 } else {
3056 ret = i40iw_send_cm_event(loopback,
3057 loopback->cm_id,
3058 IW_CM_EVENT_CONNECT_REPLY,
3059 -ECONNREFUSED);
3060 i40iw_rem_ref_cm_node(cm_node);
3061 loopback->state = I40IW_CM_STATE_CLOSING;
3062
3063 cm_id = loopback->cm_id;
3064 i40iw_rem_ref_cm_node(loopback);
3065 cm_id->rem_ref(cm_id);
3066 }
3067 }
3068
3069 return ret;
3070 }
3071
3072 /**
3073 * i40iw_cm_close - close of cm connection
3074 * @cm_node: connection's node
3075 */
3076 static int i40iw_cm_close(struct i40iw_cm_node *cm_node)
3077 {
3078 int ret = 0;
3079
3080 if (!cm_node)
3081 return -EINVAL;
3082
3083 switch (cm_node->state) {
3084 case I40IW_CM_STATE_SYN_RCVD:
3085 case I40IW_CM_STATE_SYN_SENT:
3086 case I40IW_CM_STATE_ONE_SIDE_ESTABLISHED:
3087 case I40IW_CM_STATE_ESTABLISHED:
3088 case I40IW_CM_STATE_ACCEPTING:
3089 case I40IW_CM_STATE_MPAREQ_SENT:
3090 case I40IW_CM_STATE_MPAREQ_RCVD:
3091 i40iw_cleanup_retrans_entry(cm_node);
3092 i40iw_send_reset(cm_node);
3093 break;
3094 case I40IW_CM_STATE_CLOSE_WAIT:
3095 cm_node->state = I40IW_CM_STATE_LAST_ACK;
3096 i40iw_send_fin(cm_node);
3097 break;
3098 case I40IW_CM_STATE_FIN_WAIT1:
3099 case I40IW_CM_STATE_FIN_WAIT2:
3100 case I40IW_CM_STATE_LAST_ACK:
3101 case I40IW_CM_STATE_TIME_WAIT:
3102 case I40IW_CM_STATE_CLOSING:
3103 ret = -1;
3104 break;
3105 case I40IW_CM_STATE_LISTENING:
3106 i40iw_cleanup_retrans_entry(cm_node);
3107 i40iw_send_reset(cm_node);
3108 break;
3109 case I40IW_CM_STATE_MPAREJ_RCVD:
3110 case I40IW_CM_STATE_UNKNOWN:
3111 case I40IW_CM_STATE_INITED:
3112 case I40IW_CM_STATE_CLOSED:
3113 case I40IW_CM_STATE_LISTENER_DESTROYED:
3114 i40iw_rem_ref_cm_node(cm_node);
3115 break;
3116 case I40IW_CM_STATE_OFFLOADED:
3117 if (cm_node->send_entry)
3118 i40iw_pr_err("send_entry\n");
3119 i40iw_rem_ref_cm_node(cm_node);
3120 break;
3121 }
3122 return ret;
3123 }
3124
3125 /**
3126 * i40iw_receive_ilq - recv an ETHERNET packet, and process it
3127 * through CM
3128 * @vsi: pointer to the vsi structure
3129 * @rbuf: receive buffer
3130 */
3131 void i40iw_receive_ilq(struct i40iw_sc_vsi *vsi, struct i40iw_puda_buf *rbuf)
3132 {
3133 struct i40iw_cm_node *cm_node;
3134 struct i40iw_cm_listener *listener;
3135 struct iphdr *iph;
3136 struct ipv6hdr *ip6h;
3137 struct tcphdr *tcph;
3138 struct i40iw_cm_info cm_info;
3139 struct i40iw_sc_dev *dev = vsi->dev;
3140 struct i40iw_device *iwdev = (struct i40iw_device *)dev->back_dev;
3141 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3142 struct vlan_ethhdr *ethh;
3143 u16 vtag;
3144
3145 /* if vlan, then maclen = 18 else 14 */
3146 iph = (struct iphdr *)rbuf->iph;
3147 memset(&cm_info, 0, sizeof(cm_info));
3148
3149 i40iw_debug_buf(dev,
3150 I40IW_DEBUG_ILQ,
3151 "RECEIVE ILQ BUFFER",
3152 rbuf->mem.va,
3153 rbuf->totallen);
3154 ethh = (struct vlan_ethhdr *)rbuf->mem.va;
3155
3156 if (ethh->h_vlan_proto == htons(ETH_P_8021Q)) {
3157 vtag = ntohs(ethh->h_vlan_TCI);
3158 cm_info.user_pri = (vtag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
3159 cm_info.vlan_id = vtag & VLAN_VID_MASK;
3160 i40iw_debug(cm_core->dev,
3161 I40IW_DEBUG_CM,
3162 "%s vlan_id=%d\n",
3163 __func__,
3164 cm_info.vlan_id);
3165 } else {
3166 cm_info.vlan_id = I40IW_NO_VLAN;
3167 }
3168 tcph = (struct tcphdr *)rbuf->tcph;
3169
3170 if (rbuf->ipv4) {
3171 cm_info.loc_addr[0] = ntohl(iph->daddr);
3172 cm_info.rem_addr[0] = ntohl(iph->saddr);
3173 cm_info.ipv4 = true;
3174 cm_info.tos = iph->tos;
3175 } else {
3176 ip6h = (struct ipv6hdr *)rbuf->iph;
3177 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3178 ip6h->daddr.in6_u.u6_addr32);
3179 i40iw_copy_ip_ntohl(cm_info.rem_addr,
3180 ip6h->saddr.in6_u.u6_addr32);
3181 cm_info.ipv4 = false;
3182 cm_info.tos = (ip6h->priority << 4) | (ip6h->flow_lbl[0] >> 4);
3183 }
3184 cm_info.loc_port = ntohs(tcph->dest);
3185 cm_info.rem_port = ntohs(tcph->source);
3186 cm_node = i40iw_find_node(cm_core,
3187 cm_info.rem_port,
3188 cm_info.rem_addr,
3189 cm_info.loc_port,
3190 cm_info.loc_addr,
3191 true,
3192 false);
3193
3194 if (!cm_node) {
3195 /* Only type of packet accepted are for */
3196 /* the PASSIVE open (syn only) */
3197 if (!tcph->syn || tcph->ack)
3198 return;
3199 listener =
3200 i40iw_find_listener(cm_core,
3201 cm_info.loc_addr,
3202 cm_info.loc_port,
3203 cm_info.vlan_id,
3204 I40IW_CM_LISTENER_ACTIVE_STATE);
3205 if (!listener) {
3206 cm_info.cm_id = NULL;
3207 i40iw_debug(cm_core->dev,
3208 I40IW_DEBUG_CM,
3209 "%s no listener found\n",
3210 __func__);
3211 return;
3212 }
3213 cm_info.cm_id = listener->cm_id;
3214 cm_node = i40iw_make_cm_node(cm_core, iwdev, &cm_info, listener);
3215 if (!cm_node) {
3216 i40iw_debug(cm_core->dev,
3217 I40IW_DEBUG_CM,
3218 "%s allocate node failed\n",
3219 __func__);
3220 atomic_dec(&listener->ref_count);
3221 return;
3222 }
3223 if (!tcph->rst && !tcph->fin) {
3224 cm_node->state = I40IW_CM_STATE_LISTENING;
3225 } else {
3226 i40iw_rem_ref_cm_node(cm_node);
3227 return;
3228 }
3229 atomic_inc(&cm_node->ref_count);
3230 } else if (cm_node->state == I40IW_CM_STATE_OFFLOADED) {
3231 i40iw_rem_ref_cm_node(cm_node);
3232 return;
3233 }
3234 i40iw_process_packet(cm_node, rbuf);
3235 i40iw_rem_ref_cm_node(cm_node);
3236 }
3237
3238 /**
3239 * i40iw_setup_cm_core - allocate a top level instance of a cm
3240 * core
3241 * @iwdev: iwarp device structure
3242 */
3243 int i40iw_setup_cm_core(struct i40iw_device *iwdev)
3244 {
3245 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3246
3247 cm_core->iwdev = iwdev;
3248 cm_core->dev = &iwdev->sc_dev;
3249
3250 INIT_LIST_HEAD(&cm_core->accelerated_list);
3251 INIT_LIST_HEAD(&cm_core->non_accelerated_list);
3252 INIT_LIST_HEAD(&cm_core->listen_nodes);
3253
3254 timer_setup(&cm_core->tcp_timer, i40iw_cm_timer_tick, 0);
3255
3256 spin_lock_init(&cm_core->ht_lock);
3257 spin_lock_init(&cm_core->listen_list_lock);
3258 spin_lock_init(&cm_core->apbvt_lock);
3259
3260 cm_core->event_wq = alloc_ordered_workqueue("iwewq",
3261 WQ_MEM_RECLAIM);
3262 if (!cm_core->event_wq)
3263 goto error;
3264
3265 cm_core->disconn_wq = alloc_ordered_workqueue("iwdwq",
3266 WQ_MEM_RECLAIM);
3267 if (!cm_core->disconn_wq)
3268 goto error;
3269
3270 return 0;
3271 error:
3272 i40iw_cleanup_cm_core(&iwdev->cm_core);
3273
3274 return -ENOMEM;
3275 }
3276
3277 /**
3278 * i40iw_cleanup_cm_core - deallocate a top level instance of a
3279 * cm core
3280 * @cm_core: cm's core
3281 */
3282 void i40iw_cleanup_cm_core(struct i40iw_cm_core *cm_core)
3283 {
3284 unsigned long flags;
3285
3286 if (!cm_core)
3287 return;
3288
3289 spin_lock_irqsave(&cm_core->ht_lock, flags);
3290 if (timer_pending(&cm_core->tcp_timer))
3291 del_timer_sync(&cm_core->tcp_timer);
3292 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3293
3294 if (cm_core->event_wq)
3295 destroy_workqueue(cm_core->event_wq);
3296 if (cm_core->disconn_wq)
3297 destroy_workqueue(cm_core->disconn_wq);
3298 }
3299
3300 /**
3301 * i40iw_init_tcp_ctx - setup qp context
3302 * @cm_node: connection's node
3303 * @tcp_info: offload info for tcp
3304 * @iwqp: associate qp for the connection
3305 */
3306 static void i40iw_init_tcp_ctx(struct i40iw_cm_node *cm_node,
3307 struct i40iw_tcp_offload_info *tcp_info,
3308 struct i40iw_qp *iwqp)
3309 {
3310 tcp_info->ipv4 = cm_node->ipv4;
3311 tcp_info->drop_ooo_seg = true;
3312 tcp_info->wscale = true;
3313 tcp_info->ignore_tcp_opt = true;
3314 tcp_info->ignore_tcp_uns_opt = true;
3315 tcp_info->no_nagle = false;
3316
3317 tcp_info->ttl = I40IW_DEFAULT_TTL;
3318 tcp_info->rtt_var = cpu_to_le32(I40IW_DEFAULT_RTT_VAR);
3319 tcp_info->ss_thresh = cpu_to_le32(I40IW_DEFAULT_SS_THRESH);
3320 tcp_info->rexmit_thresh = I40IW_DEFAULT_REXMIT_THRESH;
3321
3322 tcp_info->tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3323 tcp_info->snd_wscale = cm_node->tcp_cntxt.snd_wscale;
3324 tcp_info->rcv_wscale = cm_node->tcp_cntxt.rcv_wscale;
3325
3326 tcp_info->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3327 tcp_info->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
3328 tcp_info->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3329 tcp_info->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3330
3331 tcp_info->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3332 tcp_info->cwnd = cpu_to_le32(2 * cm_node->tcp_cntxt.mss);
3333 tcp_info->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3334 tcp_info->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3335 tcp_info->max_snd_window = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
3336 tcp_info->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
3337 cm_node->tcp_cntxt.rcv_wscale);
3338
3339 tcp_info->flow_label = 0;
3340 tcp_info->snd_mss = cpu_to_le32(((u32)cm_node->tcp_cntxt.mss));
3341 if (cm_node->vlan_id <= VLAN_VID_MASK) {
3342 tcp_info->insert_vlan_tag = true;
3343 tcp_info->vlan_tag = cpu_to_le16(((u16)cm_node->user_pri << I40IW_VLAN_PRIO_SHIFT) |
3344 cm_node->vlan_id);
3345 }
3346 if (cm_node->ipv4) {
3347 tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3348 tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3349
3350 tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[0]);
3351 tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[0]);
3352 tcp_info->arp_idx =
3353 cpu_to_le16((u16)i40iw_arp_table(
3354 iwqp->iwdev,
3355 &tcp_info->dest_ip_addr3,
3356 true,
3357 NULL,
3358 I40IW_ARP_RESOLVE));
3359 } else {
3360 tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3361 tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3362 tcp_info->dest_ip_addr0 = cpu_to_le32(cm_node->rem_addr[0]);
3363 tcp_info->dest_ip_addr1 = cpu_to_le32(cm_node->rem_addr[1]);
3364 tcp_info->dest_ip_addr2 = cpu_to_le32(cm_node->rem_addr[2]);
3365 tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[3]);
3366 tcp_info->local_ipaddr0 = cpu_to_le32(cm_node->loc_addr[0]);
3367 tcp_info->local_ipaddr1 = cpu_to_le32(cm_node->loc_addr[1]);
3368 tcp_info->local_ipaddr2 = cpu_to_le32(cm_node->loc_addr[2]);
3369 tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[3]);
3370 tcp_info->arp_idx =
3371 cpu_to_le16((u16)i40iw_arp_table(
3372 iwqp->iwdev,
3373 &tcp_info->dest_ip_addr0,
3374 false,
3375 NULL,
3376 I40IW_ARP_RESOLVE));
3377 }
3378 }
3379
3380 /**
3381 * i40iw_cm_init_tsa_conn - setup qp for RTS
3382 * @iwqp: associate qp for the connection
3383 * @cm_node: connection's node
3384 */
3385 static void i40iw_cm_init_tsa_conn(struct i40iw_qp *iwqp,
3386 struct i40iw_cm_node *cm_node)
3387 {
3388 struct i40iw_tcp_offload_info tcp_info;
3389 struct i40iwarp_offload_info *iwarp_info;
3390 struct i40iw_qp_host_ctx_info *ctx_info;
3391 struct i40iw_device *iwdev = iwqp->iwdev;
3392 struct i40iw_sc_dev *dev = &iwqp->iwdev->sc_dev;
3393
3394 memset(&tcp_info, 0x00, sizeof(struct i40iw_tcp_offload_info));
3395 iwarp_info = &iwqp->iwarp_info;
3396 ctx_info = &iwqp->ctx_info;
3397
3398 ctx_info->tcp_info = &tcp_info;
3399 ctx_info->send_cq_num = iwqp->iwscq->sc_cq.cq_uk.cq_id;
3400 ctx_info->rcv_cq_num = iwqp->iwrcq->sc_cq.cq_uk.cq_id;
3401
3402 iwarp_info->ord_size = cm_node->ord_size;
3403 iwarp_info->ird_size = i40iw_derive_hw_ird_setting(cm_node->ird_size);
3404
3405 if (iwarp_info->ord_size == 1)
3406 iwarp_info->ord_size = 2;
3407
3408 iwarp_info->rd_enable = true;
3409 iwarp_info->rdmap_ver = 1;
3410 iwarp_info->ddp_ver = 1;
3411
3412 iwarp_info->pd_id = iwqp->iwpd->sc_pd.pd_id;
3413
3414 ctx_info->tcp_info_valid = true;
3415 ctx_info->iwarp_info_valid = true;
3416 ctx_info->add_to_qoslist = true;
3417 ctx_info->user_pri = cm_node->user_pri;
3418
3419 i40iw_init_tcp_ctx(cm_node, &tcp_info, iwqp);
3420 if (cm_node->snd_mark_en) {
3421 iwarp_info->snd_mark_en = true;
3422 iwarp_info->snd_mark_offset = (tcp_info.snd_nxt &
3423 SNDMARKER_SEQNMASK) + cm_node->lsmm_size;
3424 }
3425
3426 cm_node->state = I40IW_CM_STATE_OFFLOADED;
3427 tcp_info.tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3428 tcp_info.src_mac_addr_idx = iwdev->mac_ip_table_idx;
3429 tcp_info.tos = cm_node->tos;
3430
3431 dev->iw_priv_qp_ops->qp_setctx(&iwqp->sc_qp, (u64 *)(iwqp->host_ctx.va), ctx_info);
3432
3433 /* once tcp_info is set, no need to do it again */
3434 ctx_info->tcp_info_valid = false;
3435 ctx_info->iwarp_info_valid = false;
3436 ctx_info->add_to_qoslist = false;
3437 }
3438
3439 /**
3440 * i40iw_cm_disconn - when a connection is being closed
3441 * @iwqp: associate qp for the connection
3442 */
3443 void i40iw_cm_disconn(struct i40iw_qp *iwqp)
3444 {
3445 struct disconn_work *work;
3446 struct i40iw_device *iwdev = iwqp->iwdev;
3447 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3448 unsigned long flags;
3449
3450 work = kzalloc(sizeof(*work), GFP_ATOMIC);
3451 if (!work)
3452 return; /* Timer will clean up */
3453
3454 spin_lock_irqsave(&iwdev->qptable_lock, flags);
3455 if (!iwdev->qp_table[iwqp->ibqp.qp_num]) {
3456 spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3457 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
3458 "%s qp_id %d is already freed\n",
3459 __func__, iwqp->ibqp.qp_num);
3460 kfree(work);
3461 return;
3462 }
3463 i40iw_add_ref(&iwqp->ibqp);
3464 spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3465
3466 work->iwqp = iwqp;
3467 INIT_WORK(&work->work, i40iw_disconnect_worker);
3468 queue_work(cm_core->disconn_wq, &work->work);
3469 return;
3470 }
3471
3472 /**
3473 * i40iw_qp_disconnect - free qp and close cm
3474 * @iwqp: associate qp for the connection
3475 */
3476 static void i40iw_qp_disconnect(struct i40iw_qp *iwqp)
3477 {
3478 struct i40iw_device *iwdev;
3479 struct i40iw_ib_device *iwibdev;
3480
3481 iwdev = to_iwdev(iwqp->ibqp.device);
3482 if (!iwdev) {
3483 i40iw_pr_err("iwdev == NULL\n");
3484 return;
3485 }
3486
3487 iwibdev = iwdev->iwibdev;
3488
3489 if (iwqp->active_conn) {
3490 /* indicate this connection is NOT active */
3491 iwqp->active_conn = 0;
3492 } else {
3493 /* Need to free the Last Streaming Mode Message */
3494 if (iwqp->ietf_mem.va) {
3495 if (iwqp->lsmm_mr)
3496 iwibdev->ibdev.ops.dereg_mr(iwqp->lsmm_mr,
3497 NULL);
3498 i40iw_free_dma_mem(iwdev->sc_dev.hw, &iwqp->ietf_mem);
3499 }
3500 }
3501
3502 /* close the CM node down if it is still active */
3503 if (iwqp->cm_node) {
3504 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "%s Call close API\n", __func__);
3505 i40iw_cm_close(iwqp->cm_node);
3506 }
3507 }
3508
/**
 * i40iw_cm_disconn_true - called by worker thread to disconnect qp
 * @iwqp: associate qp for the connection
 *
 * Snapshots the qp's tcp state, ib state and last asynchronous event under
 * the qp lock and derives from them which actions are needed: flushing the
 * work queues, sending IW_CM_EVENT_DISCONNECT and/or closing the connection
 * (IW_CM_EVENT_CLOSE). The actions themselves are carried out after the
 * lock has been released.
 */
static void i40iw_cm_disconn_true(struct i40iw_qp *iwqp)
{
	struct iw_cm_id *cm_id;
	struct i40iw_device *iwdev;
	struct i40iw_sc_qp *qp = &iwqp->sc_qp;
	u16 last_ae;
	u8 original_hw_tcp_state;
	u8 original_ibqp_state;
	int disconn_status = 0;
	int issue_disconn = 0;
	int issue_close = 0;
	int issue_flush = 0;
	struct ib_event ibevent;
	unsigned long flags;
	int ret;

	if (!iwqp) {
		i40iw_pr_err("iwqp == NULL\n");
		return;
	}

	spin_lock_irqsave(&iwqp->lock, flags);
	cm_id = iwqp->cm_id;
	/* make sure we haven't already closed this connection */
	if (!cm_id) {
		spin_unlock_irqrestore(&iwqp->lock, flags);
		return;
	}

	iwdev = to_iwdev(iwqp->ibqp.device);

	/* snapshot the state the decisions below are based on */
	original_hw_tcp_state = iwqp->hw_tcp_state;
	original_ibqp_state = iwqp->ibqp_state;
	last_ae = iwqp->last_aeq;

	if (qp->term_flags) {
		/* terminate in progress: disconnect, close and flush */
		issue_disconn = 1;
		issue_close = 1;
		iwqp->cm_id = NULL;
		/*
		 * When the term timer expires after cm_timer, we don't want
		 * the terminate handler to issue cm_disconn, which can
		 * re-free a QP even after its refcnt=0.
		 */
		i40iw_terminate_del_timer(qp);
		if (!iwqp->flush_issued) {
			iwqp->flush_issued = 1;
			issue_flush = 1;
		}
	} else if ((original_hw_tcp_state == I40IW_TCP_STATE_CLOSE_WAIT) ||
		   ((original_ibqp_state == IB_QPS_RTS) &&
		    (last_ae == I40IW_AE_LLP_CONNECTION_RESET))) {
		issue_disconn = 1;
		/* a reset is reported to the upper layer as -ECONNRESET */
		if (last_ae == I40IW_AE_LLP_CONNECTION_RESET)
			disconn_status = -ECONNRESET;
	}

	/*
	 * Independently of the branch above, these states also require the
	 * connection to be closed and the queues to be flushed (once).
	 */
	if (((original_hw_tcp_state == I40IW_TCP_STATE_CLOSED) ||
	     (original_hw_tcp_state == I40IW_TCP_STATE_TIME_WAIT) ||
	     (last_ae == I40IW_AE_RDMAP_ROE_BAD_LLP_CLOSE) ||
	     (last_ae == I40IW_AE_LLP_CONNECTION_RESET) ||
	     iwdev->reset)) {
		issue_close = 1;
		iwqp->cm_id = NULL;
		if (!iwqp->flush_issued) {
			iwqp->flush_issued = 1;
			issue_flush = 1;
		}
	}

	spin_unlock_irqrestore(&iwqp->lock, flags);
	if (issue_flush && !iwqp->destroyed) {
		/* Flush the queues */
		i40iw_flush_wqes(iwdev, iwqp);

		/* on terminate, also raise an ib event to the qp's consumer */
		if (qp->term_flags && iwqp->ibqp.event_handler) {
			ibevent.device = iwqp->ibqp.device;
			ibevent.event = (qp->eventtype == TERM_EVENT_QP_FATAL) ?
					IB_EVENT_QP_FATAL : IB_EVENT_QP_ACCESS_ERR;
			ibevent.element.qp = &iwqp->ibqp;
			iwqp->ibqp.event_handler(&ibevent, iwqp->ibqp.qp_context);
		}
	}

	/* cm_id is the value read under the lock above; it is non-NULL here */
	if (cm_id && cm_id->event_handler) {
		if (issue_disconn) {
			ret = i40iw_send_cm_event(NULL,
						  cm_id,
						  IW_CM_EVENT_DISCONNECT,
						  disconn_status);

			if (ret)
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "disconnect event failed %s: - cm_id = %p\n",
					    __func__, cm_id);
		}
		if (issue_close) {
			i40iw_qp_disconnect(iwqp);
			cm_id->provider_data = iwqp;
			ret = i40iw_send_cm_event(NULL, cm_id, IW_CM_EVENT_CLOSE, 0);
			if (ret)
				i40iw_debug(&iwdev->sc_dev,
					    I40IW_DEBUG_CM,
					    "close event failed %s: - cm_id = %p\n",
					    __func__, cm_id);
			/* the connection is closed: drop a cm_id reference */
			cm_id->rem_ref(cm_id);
		}
	}
}
3622
3623 /**
3624 * i40iw_disconnect_worker - worker for connection close
3625 * @work: points or disconn structure
3626 */
3627 static void i40iw_disconnect_worker(struct work_struct *work)
3628 {
3629 struct disconn_work *dwork = container_of(work, struct disconn_work, work);
3630 struct i40iw_qp *iwqp = dwork->iwqp;
3631
3632 kfree(dwork);
3633 i40iw_cm_disconn_true(iwqp);
3634 i40iw_rem_ref(&iwqp->ibqp);
3635 }
3636
/**
 * i40iw_accept - registered call for connection to be accepted
 * @cm_id: cm information for passive connection
 * @conn_param: accept parameters
 *
 * Binds the qp named in @conn_param to the cm node stored in
 * @cm_id->provider_data, builds the MPA reply (plus private data) in a DMA
 * buffer, posts it as the Last Streaming Mode Message, programs the qp
 * context, moves the qp to RTS and reports IW_CM_EVENT_ESTABLISHED.
 *
 * Return: 0 on success, -EINVAL if the qp does not exist or the listener
 * was destroyed, -ECONNRESET if a reset was already seen for the node,
 * -ENOMEM if the reply buffer or its memory region cannot be set up.
 */
int i40iw_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
{
	struct ib_qp *ibqp;
	struct i40iw_qp *iwqp;
	struct i40iw_device *iwdev;
	struct i40iw_sc_dev *dev;
	struct i40iw_cm_core *cm_core;
	struct i40iw_cm_node *cm_node;
	struct ib_qp_attr attr;
	int passive_state;
	struct ib_mr *ibmr;
	struct i40iw_pd *iwpd;
	u16 buf_len = 0;
	struct i40iw_kmem_info accept;
	enum i40iw_status_code status;
	u64 tagged_offset;
	unsigned long flags;

	memset(&attr, 0, sizeof(attr));
	ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
	if (!ibqp)
		return -EINVAL;

	iwqp = to_iwqp(ibqp);
	iwdev = iwqp->iwdev;
	dev = &iwdev->sc_dev;
	cm_core = &iwdev->cm_core;
	/* until the accept completes, provider_data holds the cm node */
	cm_node = (struct i40iw_cm_node *)cm_id->provider_data;

	/* refresh address family and vlan from the local address */
	if (((struct sockaddr_in *)&cm_id->local_addr)->sin_family == AF_INET) {
		cm_node->ipv4 = true;
		cm_node->vlan_id = i40iw_get_vlan_ipv4(cm_node->loc_addr);
	} else {
		cm_node->ipv4 = false;
		i40iw_netdev_vlan_ipv6(cm_node->loc_addr, &cm_node->vlan_id);
	}
	i40iw_debug(cm_node->dev,
		    I40IW_DEBUG_CM,
		    "Accept vlan_id=%d\n",
		    cm_node->vlan_id);
	if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
		if (cm_node->loopbackpartner)
			i40iw_rem_ref_cm_node(cm_node->loopbackpartner);
		i40iw_rem_ref_cm_node(cm_node);
		return -EINVAL;
	}

	/* the counter reaches I40IW_SEND_RESET_EVENT if a reset came first */
	passive_state = atomic_add_return(1, &cm_node->passive_state);
	if (passive_state == I40IW_SEND_RESET_EVENT) {
		i40iw_rem_ref_cm_node(cm_node);
		return -ECONNRESET;
	}

	cm_node->cm_core->stats_accepts++;
	iwqp->cm_node = (void *)cm_node;
	cm_node->iwqp = iwqp;

	buf_len = conn_param->private_data_len + I40IW_MAX_IETF_SIZE;

	status = i40iw_allocate_dma_mem(dev->hw, &iwqp->ietf_mem, buf_len, 1);

	/*
	 * NOTE(review): unlike the error returns above, this path and the
	 * IS_ERR(ibmr) path below return without dropping the cm_node
	 * reference and leave iwqp->cm_node / cm_node->iwqp set - confirm
	 * whether that is intended.
	 */
	if (status)
		return -ENOMEM;
	cm_node->pdata.size = conn_param->private_data_len;
	accept.addr = iwqp->ietf_mem.va;
	accept.size = i40iw_cm_build_mpa_frame(cm_node, &accept, MPA_KEY_REPLY);
	/* private data follows directly after the MPA frame */
	memcpy(accept.addr + accept.size, conn_param->private_data,
	       conn_param->private_data_len);

	/* setup our first outgoing iWarp send WQE (the IETF frame response) */
	if ((cm_node->ipv4 &&
	     !i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
	    (!cm_node->ipv4 &&
	     !i40iw_ipv6_is_loopback(cm_node->loc_addr, cm_node->rem_addr))) {
		/* non-loopback: register the buffer and send the real frame */
		iwpd = iwqp->iwpd;
		tagged_offset = (uintptr_t)iwqp->ietf_mem.va;
		ibmr = i40iw_reg_phys_mr(&iwpd->ibpd,
					 iwqp->ietf_mem.pa,
					 buf_len,
					 IB_ACCESS_LOCAL_WRITE,
					 &tagged_offset);
		if (IS_ERR(ibmr)) {
			i40iw_free_dma_mem(dev->hw, &iwqp->ietf_mem);
			return -ENOMEM;
		}

		ibmr->pd = &iwpd->ibpd;
		ibmr->device = iwpd->ibpd.device;
		iwqp->lsmm_mr = ibmr;
		if (iwqp->page)
			iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
		dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp,
						  iwqp->ietf_mem.va,
						  (accept.size + conn_param->private_data_len),
						  ibmr->lkey);

	} else {
		/* loopback: post an empty LSMM, the data is handed over below */
		if (iwqp->page)
			iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
		dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp, NULL, 0, 0);
	}

	if (iwqp->page)
		kunmap(iwqp->page);

	iwqp->cm_id = cm_id;
	cm_node->cm_id = cm_id;

	/* from here on provider_data refers to the qp instead of the node */
	cm_id->provider_data = (void *)iwqp;
	iwqp->active_conn = 0;

	cm_node->lsmm_size = accept.size + conn_param->private_data_len;
	i40iw_cm_init_tsa_conn(iwqp, cm_node);
	cm_id->add_ref(cm_id);
	i40iw_add_ref(&iwqp->ibqp);

	attr.qp_state = IB_QPS_RTS;
	cm_node->qhash_set = false;
	i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);

	/* the node is offloaded now: move it to the accelerated list */
	cm_node->accelerated = true;
	spin_lock_irqsave(&cm_core->ht_lock, flags);
	list_move_tail(&cm_node->list, &cm_core->accelerated_list);
	spin_unlock_irqrestore(&cm_core->ht_lock, flags);

	status =
		i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_ESTABLISHED, 0);
	if (status)
		i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - ESTABLISHED\n");

	if (cm_node->loopbackpartner) {
		cm_node->loopbackpartner->pdata.size = conn_param->private_data_len;

		/* hand the private data to the loopback partner node */
		memcpy(cm_node->loopbackpartner->pdata_buf,
		       conn_param->private_data,
		       conn_param->private_data_len);
		i40iw_create_event(cm_node->loopbackpartner, I40IW_CM_EVENT_CONNECTED);
	}

	/* this accept no longer counts against the listener's pending accepts */
	if (cm_node->accept_pend) {
		atomic_dec(&cm_node->listener->pend_accepts_cnt);
		cm_node->accept_pend = 0;
	}
	return 0;
}
3788
3789 /**
3790 * i40iw_reject - registered call for connection to be rejected
3791 * @cm_id: cm information for passive connection
3792 * @pdata: private data to be sent
3793 * @pdata_len: private data length
3794 */
3795 int i40iw_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
3796 {
3797 struct i40iw_device *iwdev;
3798 struct i40iw_cm_node *cm_node;
3799 struct i40iw_cm_node *loopback;
3800
3801 cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3802 loopback = cm_node->loopbackpartner;
3803 cm_node->cm_id = cm_id;
3804 cm_node->pdata.size = pdata_len;
3805
3806 iwdev = to_iwdev(cm_id->device);
3807 if (!iwdev)
3808 return -EINVAL;
3809 cm_node->cm_core->stats_rejects++;
3810
3811 if (pdata_len + sizeof(struct ietf_mpa_v2) > MAX_CM_BUFFER)
3812 return -EINVAL;
3813
3814 if (loopback) {
3815 memcpy(&loopback->pdata_buf, pdata, pdata_len);
3816 loopback->pdata.size = pdata_len;
3817 }
3818
3819 return i40iw_cm_reject(cm_node, pdata, pdata_len);
3820 }
3821
3822 /**
3823 * i40iw_connect - registered call for connection to be established
3824 * @cm_id: cm information for passive connection
3825 * @conn_param: Information about the connection
3826 */
3827 int i40iw_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3828 {
3829 struct ib_qp *ibqp;
3830 struct i40iw_qp *iwqp;
3831 struct i40iw_device *iwdev;
3832 struct i40iw_cm_node *cm_node;
3833 struct i40iw_cm_info cm_info;
3834 struct sockaddr_in *laddr;
3835 struct sockaddr_in *raddr;
3836 struct sockaddr_in6 *laddr6;
3837 struct sockaddr_in6 *raddr6;
3838 int ret = 0;
3839
3840 ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3841 if (!ibqp)
3842 return -EINVAL;
3843 iwqp = to_iwqp(ibqp);
3844 if (!iwqp)
3845 return -EINVAL;
3846 iwdev = to_iwdev(iwqp->ibqp.device);
3847 if (!iwdev)
3848 return -EINVAL;
3849
3850 laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3851 raddr = (struct sockaddr_in *)&cm_id->m_remote_addr;
3852 laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3853 raddr6 = (struct sockaddr_in6 *)&cm_id->m_remote_addr;
3854
3855 if (!(laddr->sin_port) || !(raddr->sin_port))
3856 return -EINVAL;
3857
3858 iwqp->active_conn = 1;
3859 iwqp->cm_id = NULL;
3860 cm_id->provider_data = iwqp;
3861
3862 /* set up the connection params for the node */
3863 if (cm_id->remote_addr.ss_family == AF_INET) {
3864 cm_info.ipv4 = true;
3865 memset(cm_info.loc_addr, 0, sizeof(cm_info.loc_addr));
3866 memset(cm_info.rem_addr, 0, sizeof(cm_info.rem_addr));
3867 cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3868 cm_info.rem_addr[0] = ntohl(raddr->sin_addr.s_addr);
3869 cm_info.loc_port = ntohs(laddr->sin_port);
3870 cm_info.rem_port = ntohs(raddr->sin_port);
3871 cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3872 } else {
3873 cm_info.ipv4 = false;
3874 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3875 laddr6->sin6_addr.in6_u.u6_addr32);
3876 i40iw_copy_ip_ntohl(cm_info.rem_addr,
3877 raddr6->sin6_addr.in6_u.u6_addr32);
3878 cm_info.loc_port = ntohs(laddr6->sin6_port);
3879 cm_info.rem_port = ntohs(raddr6->sin6_port);
3880 i40iw_netdev_vlan_ipv6(cm_info.loc_addr, &cm_info.vlan_id);
3881 }
3882 cm_info.cm_id = cm_id;
3883 cm_info.tos = cm_id->tos;
3884 cm_info.user_pri = rt_tos2priority(cm_id->tos);
3885 i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "%s TOS:[%d] UP:[%d]\n",
3886 __func__, cm_id->tos, cm_info.user_pri);
3887 cm_id->add_ref(cm_id);
3888 cm_node = i40iw_create_cm_node(&iwdev->cm_core, iwdev,
3889 conn_param, &cm_info);
3890
3891 if (IS_ERR(cm_node)) {
3892 ret = PTR_ERR(cm_node);
3893 cm_id->rem_ref(cm_id);
3894 return ret;
3895 }
3896
3897 if ((cm_info.ipv4 && (laddr->sin_addr.s_addr != raddr->sin_addr.s_addr)) ||
3898 (!cm_info.ipv4 && memcmp(laddr6->sin6_addr.in6_u.u6_addr32,
3899 raddr6->sin6_addr.in6_u.u6_addr32,
3900 sizeof(laddr6->sin6_addr.in6_u.u6_addr32)))) {
3901 if (i40iw_manage_qhash(iwdev, &cm_info, I40IW_QHASH_TYPE_TCP_ESTABLISHED,
3902 I40IW_QHASH_MANAGE_TYPE_ADD, NULL, true)) {
3903 ret = -EINVAL;
3904 goto err;
3905 }
3906 cm_node->qhash_set = true;
3907 }
3908
3909 if (i40iw_manage_apbvt(iwdev, cm_info.loc_port,
3910 I40IW_MANAGE_APBVT_ADD)) {
3911 ret = -EINVAL;
3912 goto err;
3913 }
3914
3915 cm_node->apbvt_set = true;
3916 iwqp->cm_node = cm_node;
3917 cm_node->iwqp = iwqp;
3918 iwqp->cm_id = cm_id;
3919 i40iw_add_ref(&iwqp->ibqp);
3920
3921 if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
3922 cm_node->state = I40IW_CM_STATE_SYN_SENT;
3923 ret = i40iw_send_syn(cm_node, 0);
3924 if (ret)
3925 goto err;
3926 }
3927
3928 if (cm_node->loopbackpartner) {
3929 cm_node->loopbackpartner->state = I40IW_CM_STATE_MPAREQ_RCVD;
3930 i40iw_create_event(cm_node->loopbackpartner,
3931 I40IW_CM_EVENT_MPA_REQ);
3932 }
3933
3934 i40iw_debug(cm_node->dev,
3935 I40IW_DEBUG_CM,
3936 "Api - connect(): port=0x%04x, cm_node=%p, cm_id = %p.\n",
3937 cm_node->rem_port,
3938 cm_node,
3939 cm_node->cm_id);
3940
3941 return 0;
3942
3943 err:
3944 if (cm_info.ipv4)
3945 i40iw_debug(&iwdev->sc_dev,
3946 I40IW_DEBUG_CM,
3947 "Api - connect() FAILED: dest addr=%pI4",
3948 cm_info.rem_addr);
3949 else
3950 i40iw_debug(&iwdev->sc_dev,
3951 I40IW_DEBUG_CM,
3952 "Api - connect() FAILED: dest addr=%pI6",
3953 cm_info.rem_addr);
3954
3955 i40iw_rem_ref_cm_node(cm_node);
3956 cm_id->rem_ref(cm_id);
3957 iwdev->cm_core.stats_connect_errs++;
3958 return ret;
3959 }
3960
3961 /**
3962 * i40iw_create_listen - registered call creating listener
3963 * @cm_id: cm information for passive connection
3964 * @backlog: to max accept pending count
3965 */
3966 int i40iw_create_listen(struct iw_cm_id *cm_id, int backlog)
3967 {
3968 struct i40iw_device *iwdev;
3969 struct i40iw_cm_listener *cm_listen_node;
3970 struct i40iw_cm_info cm_info;
3971 enum i40iw_status_code ret;
3972 struct sockaddr_in *laddr;
3973 struct sockaddr_in6 *laddr6;
3974 bool wildcard = false;
3975
3976 iwdev = to_iwdev(cm_id->device);
3977 if (!iwdev)
3978 return -EINVAL;
3979
3980 laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3981 laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3982 memset(&cm_info, 0, sizeof(cm_info));
3983 if (laddr->sin_family == AF_INET) {
3984 cm_info.ipv4 = true;
3985 cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3986 cm_info.loc_port = ntohs(laddr->sin_port);
3987
3988 if (laddr->sin_addr.s_addr != INADDR_ANY)
3989 cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3990 else
3991 wildcard = true;
3992
3993 } else {
3994 cm_info.ipv4 = false;
3995 i40iw_copy_ip_ntohl(cm_info.loc_addr,
3996 laddr6->sin6_addr.in6_u.u6_addr32);
3997 cm_info.loc_port = ntohs(laddr6->sin6_port);
3998 if (ipv6_addr_type(&laddr6->sin6_addr) != IPV6_ADDR_ANY)
3999 i40iw_netdev_vlan_ipv6(cm_info.loc_addr,
4000 &cm_info.vlan_id);
4001 else
4002 wildcard = true;
4003 }
4004 cm_info.backlog = backlog;
4005 cm_info.cm_id = cm_id;
4006
4007 cm_listen_node = i40iw_make_listen_node(&iwdev->cm_core, iwdev, &cm_info);
4008 if (!cm_listen_node) {
4009 i40iw_pr_err("cm_listen_node == NULL\n");
4010 return -ENOMEM;
4011 }
4012
4013 cm_id->provider_data = cm_listen_node;
4014
4015 cm_listen_node->tos = cm_id->tos;
4016 cm_listen_node->user_pri = rt_tos2priority(cm_id->tos);
4017 cm_info.user_pri = cm_listen_node->user_pri;
4018
4019 if (!cm_listen_node->reused_node) {
4020 if (wildcard) {
4021 if (cm_info.ipv4)
4022 ret = i40iw_add_mqh_4(iwdev,
4023 &cm_info,
4024 cm_listen_node);
4025 else
4026 ret = i40iw_add_mqh_6(iwdev,
4027 &cm_info,
4028 cm_listen_node);
4029 if (ret)
4030 goto error;
4031
4032 ret = i40iw_manage_apbvt(iwdev,
4033 cm_info.loc_port,
4034 I40IW_MANAGE_APBVT_ADD);
4035
4036 if (ret)
4037 goto error;
4038 } else {
4039 ret = i40iw_manage_qhash(iwdev,
4040 &cm_info,
4041 I40IW_QHASH_TYPE_TCP_SYN,
4042 I40IW_QHASH_MANAGE_TYPE_ADD,
4043 NULL,
4044 true);
4045 if (ret)
4046 goto error;
4047 cm_listen_node->qhash_set = true;
4048 ret = i40iw_manage_apbvt(iwdev,
4049 cm_info.loc_port,
4050 I40IW_MANAGE_APBVT_ADD);
4051 if (ret)
4052 goto error;
4053 }
4054 }
4055 cm_id->add_ref(cm_id);
4056 cm_listen_node->cm_core->stats_listen_created++;
4057 return 0;
4058 error:
4059 i40iw_cm_del_listen(&iwdev->cm_core, (void *)cm_listen_node, false);
4060 return -EINVAL;
4061 }
4062
4063 /**
4064 * i40iw_destroy_listen - registered call to destroy listener
4065 * @cm_id: cm information for passive connection
4066 */
4067 int i40iw_destroy_listen(struct iw_cm_id *cm_id)
4068 {
4069 struct i40iw_device *iwdev;
4070
4071 iwdev = to_iwdev(cm_id->device);
4072 if (cm_id->provider_data)
4073 i40iw_cm_del_listen(&iwdev->cm_core, cm_id->provider_data, true);
4074 else
4075 i40iw_pr_err("cm_id->provider_data was NULL\n");
4076
4077 cm_id->rem_ref(cm_id);
4078
4079 return 0;
4080 }
4081
4082 /**
4083 * i40iw_cm_event_connected - handle connected active node
4084 * @event: the info for cm_node of connection
4085 */
4086 static void i40iw_cm_event_connected(struct i40iw_cm_event *event)
4087 {
4088 struct i40iw_qp *iwqp;
4089 struct i40iw_device *iwdev;
4090 struct i40iw_cm_core *cm_core;
4091 struct i40iw_cm_node *cm_node;
4092 struct i40iw_sc_dev *dev;
4093 struct ib_qp_attr attr;
4094 struct iw_cm_id *cm_id;
4095 unsigned long flags;
4096 int status;
4097 bool read0;
4098
4099 cm_node = event->cm_node;
4100 cm_id = cm_node->cm_id;
4101 iwqp = (struct i40iw_qp *)cm_id->provider_data;
4102 iwdev = to_iwdev(iwqp->ibqp.device);
4103 dev = &iwdev->sc_dev;
4104 cm_core = &iwdev->cm_core;
4105
4106 if (iwqp->destroyed) {
4107 status = -ETIMEDOUT;
4108 goto error;
4109 }
4110 i40iw_cm_init_tsa_conn(iwqp, cm_node);
4111 read0 = (cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO);
4112 if (iwqp->page)
4113 iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
4114 dev->iw_priv_qp_ops->qp_send_rtt(&iwqp->sc_qp, read0);
4115 if (iwqp->page)
4116 kunmap(iwqp->page);
4117
4118 memset(&attr, 0, sizeof(attr));
4119 attr.qp_state = IB_QPS_RTS;
4120 cm_node->qhash_set = false;
4121 i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4122
4123 cm_node->accelerated = true;
4124 spin_lock_irqsave(&cm_core->ht_lock, flags);
4125 list_move_tail(&cm_node->list, &cm_core->accelerated_list);
4126 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4127 status = i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_CONNECT_REPLY,
4128 0);
4129 if (status)
4130 i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - CONNECT_REPLY\n");
4131
4132 return;
4133
4134 error:
4135 iwqp->cm_id = NULL;
4136 cm_id->provider_data = NULL;
4137 i40iw_send_cm_event(event->cm_node,
4138 cm_id,
4139 IW_CM_EVENT_CONNECT_REPLY,
4140 status);
4141 cm_id->rem_ref(cm_id);
4142 i40iw_rem_ref_cm_node(event->cm_node);
4143 }
4144
4145 /**
4146 * i40iw_cm_event_reset - handle reset
4147 * @event: the info for cm_node of connection
4148 */
4149 static void i40iw_cm_event_reset(struct i40iw_cm_event *event)
4150 {
4151 struct i40iw_cm_node *cm_node = event->cm_node;
4152 struct iw_cm_id *cm_id = cm_node->cm_id;
4153 struct i40iw_qp *iwqp;
4154
4155 if (!cm_id)
4156 return;
4157
4158 iwqp = cm_id->provider_data;
4159 if (!iwqp)
4160 return;
4161
4162 i40iw_debug(cm_node->dev,
4163 I40IW_DEBUG_CM,
4164 "reset event %p - cm_id = %p\n",
4165 event->cm_node, cm_id);
4166 iwqp->cm_id = NULL;
4167
4168 i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_DISCONNECT, -ECONNRESET);
4169 i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_CLOSE, 0);
4170 }
4171
/**
 * i40iw_cm_event_handler - worker thread callback to send event to cm upper layer
 * @work: pointer of cm event info.
 *
 * Dispatches the queued event by type, then drops the cm_id and cm node
 * references taken by i40iw_cm_post_event() and frees the event.
 */
static void i40iw_cm_event_handler(struct work_struct *work)
{
	struct i40iw_cm_event *event = container_of(work,
						    struct i40iw_cm_event,
						    event_work);
	struct i40iw_cm_node *cm_node;

	if (!event || !event->cm_node || !event->cm_node->cm_core)
		return;

	cm_node = event->cm_node;

	switch (event->type) {
	case I40IW_CM_EVENT_MPA_REQ:
		i40iw_send_cm_event(cm_node, cm_node->cm_id,
				    IW_CM_EVENT_CONNECT_REQUEST, 0);
		break;
	case I40IW_CM_EVENT_RESET:
		i40iw_cm_event_reset(event);
		break;
	case I40IW_CM_EVENT_CONNECTED:
		/* only meaningful once the node has been offloaded */
		if (cm_node->cm_id &&
		    cm_node->state == I40IW_CM_STATE_OFFLOADED)
			i40iw_cm_event_connected(event);
		break;
	case I40IW_CM_EVENT_MPA_REJECT:
		/* ignored once the node has been offloaded */
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_send_cm_event(cm_node, cm_node->cm_id,
					    IW_CM_EVENT_CONNECT_REPLY,
					    -ECONNREFUSED);
		break;
	case I40IW_CM_EVENT_ABORTED:
		/* ignored once the node has been offloaded */
		if (cm_node->cm_id &&
		    cm_node->state != I40IW_CM_STATE_OFFLOADED)
			i40iw_event_connect_error(event);
		break;
	default:
		i40iw_pr_err("event type = %d\n", event->type);
		break;
	}

	event->cm_info.cm_id->rem_ref(event->cm_info.cm_id);
	i40iw_rem_ref_cm_node(event->cm_node);
	kfree(event);
}
4228
4229 /**
4230 * i40iw_cm_post_event - queue event request for worker thread
4231 * @event: cm node's info for up event call
4232 */
4233 static void i40iw_cm_post_event(struct i40iw_cm_event *event)
4234 {
4235 atomic_inc(&event->cm_node->ref_count);
4236 event->cm_info.cm_id->add_ref(event->cm_info.cm_id);
4237 INIT_WORK(&event->event_work, i40iw_cm_event_handler);
4238
4239 queue_work(event->cm_node->cm_core->event_wq, &event->event_work);
4240 }
4241
4242 /**
4243 * i40iw_qhash_ctrl - enable/disable qhash for list
4244 * @iwdev: device pointer
4245 * @parent_listen_node: parent listen node
4246 * @nfo: cm info node
4247 * @ipaddr: Pointer to IPv4 or IPv6 address
4248 * @ipv4: flag indicating IPv4 when true
4249 * @ifup: flag indicating interface up when true
4250 *
4251 * Enables or disables the qhash for the node in the child
4252 * listen list that matches ipaddr. If no matching IP was found
4253 * it will allocate and add a new child listen node to the
4254 * parent listen node. The listen_list_lock is assumed to be
4255 * held when called.
4256 */
4257 static void i40iw_qhash_ctrl(struct i40iw_device *iwdev,
4258 struct i40iw_cm_listener *parent_listen_node,
4259 struct i40iw_cm_info *nfo,
4260 u32 *ipaddr, bool ipv4, bool ifup)
4261 {
4262 struct list_head *child_listen_list = &parent_listen_node->child_listen_list;
4263 struct i40iw_cm_listener *child_listen_node;
4264 struct list_head *pos, *tpos;
4265 enum i40iw_status_code ret;
4266 bool node_allocated = false;
4267 enum i40iw_quad_hash_manage_type op =
4268 ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4269
4270 list_for_each_safe(pos, tpos, child_listen_list) {
4271 child_listen_node =
4272 list_entry(pos,
4273 struct i40iw_cm_listener,
4274 child_listen_list);
4275 if (!memcmp(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16))
4276 goto set_qhash;
4277 }
4278
4279 /* if not found then add a child listener if interface is going up */
4280 if (!ifup)
4281 return;
4282 child_listen_node = kmemdup(parent_listen_node,
4283 sizeof(*child_listen_node), GFP_ATOMIC);
4284 if (!child_listen_node)
4285 return;
4286 node_allocated = true;
4287
4288 memcpy(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16);
4289
4290 set_qhash:
4291 memcpy(nfo->loc_addr,
4292 child_listen_node->loc_addr,
4293 sizeof(nfo->loc_addr));
4294 nfo->vlan_id = child_listen_node->vlan_id;
4295 ret = i40iw_manage_qhash(iwdev, nfo,
4296 I40IW_QHASH_TYPE_TCP_SYN,
4297 op,
4298 NULL, false);
4299 if (!ret) {
4300 child_listen_node->qhash_set = ifup;
4301 if (node_allocated)
4302 list_add(&child_listen_node->child_listen_list,
4303 &parent_listen_node->child_listen_list);
4304 } else if (node_allocated) {
4305 kfree(child_listen_node);
4306 }
4307 }
4308
4309 /**
4310 * i40iw_cm_teardown_connections - teardown QPs
4311 * @iwdev: device pointer
4312 * @ipaddr: Pointer to IPv4 or IPv6 address
4313 * @ipv4: flag indicating IPv4 when true
4314 * @disconnect_all: flag indicating disconnect all QPs
4315 * teardown QPs where source or destination addr matches ip addr
4316 */
4317 void i40iw_cm_teardown_connections(struct i40iw_device *iwdev, u32 *ipaddr,
4318 struct i40iw_cm_info *nfo,
4319 bool disconnect_all)
4320 {
4321 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4322 struct list_head *list_core_temp;
4323 struct list_head *list_node;
4324 struct i40iw_cm_node *cm_node;
4325 unsigned long flags;
4326 struct list_head teardown_list;
4327 struct ib_qp_attr attr;
4328
4329 INIT_LIST_HEAD(&teardown_list);
4330 spin_lock_irqsave(&cm_core->ht_lock, flags);
4331 list_for_each_safe(list_node, list_core_temp,
4332 &cm_core->accelerated_list) {
4333 cm_node = container_of(list_node, struct i40iw_cm_node, list);
4334 if (disconnect_all ||
4335 (nfo->vlan_id == cm_node->vlan_id &&
4336 (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4337 !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4338 atomic_inc(&cm_node->ref_count);
4339 list_add(&cm_node->teardown_entry, &teardown_list);
4340 }
4341 }
4342 list_for_each_safe(list_node, list_core_temp,
4343 &cm_core->non_accelerated_list) {
4344 cm_node = container_of(list_node, struct i40iw_cm_node, list);
4345 if (disconnect_all ||
4346 (nfo->vlan_id == cm_node->vlan_id &&
4347 (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4348 !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4349 atomic_inc(&cm_node->ref_count);
4350 list_add(&cm_node->teardown_entry, &teardown_list);
4351 }
4352 }
4353 spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4354
4355 list_for_each_safe(list_node, list_core_temp, &teardown_list) {
4356 cm_node = container_of(list_node, struct i40iw_cm_node,
4357 teardown_entry);
4358 attr.qp_state = IB_QPS_ERR;
4359 i40iw_modify_qp(&cm_node->iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4360 if (iwdev->reset)
4361 i40iw_cm_disconn(cm_node->iwqp);
4362 i40iw_rem_ref_cm_node(cm_node);
4363 }
4364 }
4365
4366 /**
4367 * i40iw_ifdown_notify - process an ifdown on an interface
4368 * @iwdev: device pointer
4369 * @ipaddr: Pointer to IPv4 or IPv6 address
4370 * @ipv4: flag indicating IPv4 when true
4371 * @ifup: flag indicating interface up when true
4372 */
4373 void i40iw_if_notify(struct i40iw_device *iwdev, struct net_device *netdev,
4374 u32 *ipaddr, bool ipv4, bool ifup)
4375 {
4376 struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4377 unsigned long flags;
4378 struct i40iw_cm_listener *listen_node;
4379 static const u32 ip_zero[4] = { 0, 0, 0, 0 };
4380 struct i40iw_cm_info nfo;
4381 u16 vlan_id = rdma_vlan_dev_vlan_id(netdev);
4382 enum i40iw_status_code ret;
4383 enum i40iw_quad_hash_manage_type op =
4384 ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4385
4386 nfo.vlan_id = vlan_id;
4387 nfo.ipv4 = ipv4;
4388
4389 /* Disable or enable qhash for listeners */
4390 spin_lock_irqsave(&cm_core->listen_list_lock, flags);
4391 list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
4392 if (vlan_id == listen_node->vlan_id &&
4393 (!memcmp(listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16) ||
4394 !memcmp(listen_node->loc_addr, ip_zero, ipv4 ? 4 : 16))) {
4395 memcpy(nfo.loc_addr, listen_node->loc_addr,
4396 sizeof(nfo.loc_addr));
4397 nfo.loc_port = listen_node->loc_port;
4398 nfo.user_pri = listen_node->user_pri;
4399 if (!list_empty(&listen_node->child_listen_list)) {
4400 i40iw_qhash_ctrl(iwdev,
4401 listen_node,
4402 &nfo,
4403 ipaddr, ipv4, ifup);
4404 } else if (memcmp(listen_node->loc_addr, ip_zero,
4405 ipv4 ? 4 : 16)) {
4406 ret = i40iw_manage_qhash(iwdev,
4407 &nfo,
4408 I40IW_QHASH_TYPE_TCP_SYN,
4409 op,
4410 NULL,
4411 false);
4412 if (!ret)
4413 listen_node->qhash_set = ifup;
4414 }
4415 }
4416 }
4417 spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
4418
4419 /* teardown connected qp's on ifdown */
4420 if (!ifup)
4421 i40iw_cm_teardown_connections(iwdev, ipaddr, &nfo, false);
4422 }