linux/drivers/infiniband/hw/i40iw/i40iw_cm.c
<<
>>
Prefs
   1/*******************************************************************************
   2*
   3* Copyright (c) 2015-2016 Intel Corporation.  All rights reserved.
   4*
   5* This software is available to you under a choice of one of two
   6* licenses.  You may choose to be licensed under the terms of the GNU
   7* General Public License (GPL) Version 2, available from the file
   8* COPYING in the main directory of this source tree, or the
   9* OpenFabrics.org BSD license below:
  10*
  11*   Redistribution and use in source and binary forms, with or
  12*   without modification, are permitted provided that the following
  13*   conditions are met:
  14*
  15*    - Redistributions of source code must retain the above
  16*       copyright notice, this list of conditions and the following
  17*       disclaimer.
  18*
  19*    - Redistributions in binary form must reproduce the above
  20*       copyright notice, this list of conditions and the following
  21*       disclaimer in the documentation and/or other materials
  22*       provided with the distribution.
  23*
  24* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  25* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  26* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  27* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  28* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  29* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  30* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  31* SOFTWARE.
  32*
  33*******************************************************************************/
  34
  35#include <linux/atomic.h>
  36#include <linux/ip.h>
  37#include <linux/tcp.h>
  38#include <linux/init.h>
  39#include <linux/if_arp.h>
  40#include <linux/if_vlan.h>
  41#include <linux/notifier.h>
  42#include <linux/net.h>
  43#include <linux/types.h>
  44#include <linux/timer.h>
  45#include <linux/time.h>
  46#include <linux/delay.h>
  47#include <linux/etherdevice.h>
  48#include <linux/netdevice.h>
  49#include <linux/random.h>
  50#include <linux/list.h>
  51#include <linux/threads.h>
  52#include <linux/highmem.h>
  53#include <net/arp.h>
  54#include <net/ndisc.h>
  55#include <net/neighbour.h>
  56#include <net/route.h>
  57#include <net/addrconf.h>
  58#include <net/ip6_route.h>
  59#include <net/ip_fib.h>
  60#include <net/secure_seq.h>
  61#include <net/tcp.h>
  62#include <asm/checksum.h>
  63
  64#include "i40iw.h"
  65
  66static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *);
  67static void i40iw_cm_post_event(struct i40iw_cm_event *event);
  68static void i40iw_disconnect_worker(struct work_struct *work);
  69
  70/**
  71 * i40iw_free_sqbuf - put back puda buffer if refcount = 0
  72 * @vsi: pointer to vsi structure
  73 * @buf: puda buffer to free
  74 */
  75void i40iw_free_sqbuf(struct i40iw_sc_vsi *vsi, void *bufp)
  76{
  77        struct i40iw_puda_buf *buf = (struct i40iw_puda_buf *)bufp;
  78        struct i40iw_puda_rsrc *ilq = vsi->ilq;
  79
  80        if (!atomic_dec_return(&buf->refcount))
  81                i40iw_puda_ret_bufpool(ilq, buf);
  82}
  83
  84/**
  85 * i40iw_derive_hw_ird_setting - Calculate IRD
  86 *
  87 * @cm_ird: IRD of connection's node
  88 *
  89 * The ird from the connection is rounded to a supported HW
  90 * setting (2,8,32,64) and then encoded for ird_size field of
  91 * qp_ctx
  92 */
  93static u8 i40iw_derive_hw_ird_setting(u16 cm_ird)
  94{
  95        u8 encoded_ird_size;
  96
  97        /* ird_size field is encoded in qp_ctx */
  98        switch (cm_ird ? roundup_pow_of_two(cm_ird) : 0) {
  99        case I40IW_HW_IRD_SETTING_64:
 100                encoded_ird_size = 3;
 101                break;
 102        case I40IW_HW_IRD_SETTING_32:
 103        case I40IW_HW_IRD_SETTING_16:
 104                encoded_ird_size = 2;
 105                break;
 106        case I40IW_HW_IRD_SETTING_8:
 107        case I40IW_HW_IRD_SETTING_4:
 108                encoded_ird_size = 1;
 109                break;
 110        case I40IW_HW_IRD_SETTING_2:
 111        default:
 112                encoded_ird_size = 0;
 113                break;
 114        }
 115        return encoded_ird_size;
 116}
 117
 118/**
 119 * i40iw_record_ird_ord - Record IRD/ORD passed in
 120 * @cm_node: connection's node
 121 * @conn_ird: connection IRD
 122 * @conn_ord: connection ORD
 123 */
 124static void i40iw_record_ird_ord(struct i40iw_cm_node *cm_node, u32 conn_ird,
 125                                 u32 conn_ord)
 126{
 127        if (conn_ird > I40IW_MAX_IRD_SIZE)
 128                conn_ird = I40IW_MAX_IRD_SIZE;
 129
 130        if (conn_ord > I40IW_MAX_ORD_SIZE)
 131                conn_ord = I40IW_MAX_ORD_SIZE;
 132        else if (!conn_ord && cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO)
 133                conn_ord = 1;
 134
 135        cm_node->ird_size = conn_ird;
 136        cm_node->ord_size = conn_ord;
 137}
 138
 139/**
 140 * i40iw_copy_ip_ntohl - change network to host ip
 141 * @dst: host ip
 142 * @src: big endian
 143 */
 144void i40iw_copy_ip_ntohl(u32 *dst, __be32 *src)
 145{
 146        *dst++ = ntohl(*src++);
 147        *dst++ = ntohl(*src++);
 148        *dst++ = ntohl(*src++);
 149        *dst = ntohl(*src);
 150}
 151
 152/**
 153 * i40iw_copy_ip_htonl - change host addr to network ip
 154 * @dst: host ip
 155 * @src: little endian
 156 */
 157static inline void i40iw_copy_ip_htonl(__be32 *dst, u32 *src)
 158{
 159        *dst++ = htonl(*src++);
 160        *dst++ = htonl(*src++);
 161        *dst++ = htonl(*src++);
 162        *dst = htonl(*src);
 163}
 164
 165/**
 166 * i40iw_fill_sockaddr4 - get addr info for passive connection
 167 * @cm_node: connection's node
 168 * @event: upper layer's cm event
 169 */
 170static inline void i40iw_fill_sockaddr4(struct i40iw_cm_node *cm_node,
 171                                        struct iw_cm_event *event)
 172{
 173        struct sockaddr_in *laddr = (struct sockaddr_in *)&event->local_addr;
 174        struct sockaddr_in *raddr = (struct sockaddr_in *)&event->remote_addr;
 175
 176        laddr->sin_family = AF_INET;
 177        raddr->sin_family = AF_INET;
 178
 179        laddr->sin_port = htons(cm_node->loc_port);
 180        raddr->sin_port = htons(cm_node->rem_port);
 181
 182        laddr->sin_addr.s_addr = htonl(cm_node->loc_addr[0]);
 183        raddr->sin_addr.s_addr = htonl(cm_node->rem_addr[0]);
 184}
 185
 186/**
 187 * i40iw_fill_sockaddr6 - get ipv6 addr info for passive side
 188 * @cm_node: connection's node
 189 * @event: upper layer's cm event
 190 */
 191static inline void i40iw_fill_sockaddr6(struct i40iw_cm_node *cm_node,
 192                                        struct iw_cm_event *event)
 193{
 194        struct sockaddr_in6 *laddr6 = (struct sockaddr_in6 *)&event->local_addr;
 195        struct sockaddr_in6 *raddr6 = (struct sockaddr_in6 *)&event->remote_addr;
 196
 197        laddr6->sin6_family = AF_INET6;
 198        raddr6->sin6_family = AF_INET6;
 199
 200        laddr6->sin6_port = htons(cm_node->loc_port);
 201        raddr6->sin6_port = htons(cm_node->rem_port);
 202
 203        i40iw_copy_ip_htonl(laddr6->sin6_addr.in6_u.u6_addr32,
 204                            cm_node->loc_addr);
 205        i40iw_copy_ip_htonl(raddr6->sin6_addr.in6_u.u6_addr32,
 206                            cm_node->rem_addr);
 207}
 208
 209/**
 210 * i40iw_get_addr_info
 211 * @cm_node: contains ip/tcp info
 212 * @cm_info: to get a copy of the cm_node ip/tcp info
 213*/
 214static void i40iw_get_addr_info(struct i40iw_cm_node *cm_node,
 215                                struct i40iw_cm_info *cm_info)
 216{
 217        cm_info->ipv4 = cm_node->ipv4;
 218        cm_info->vlan_id = cm_node->vlan_id;
 219        memcpy(cm_info->loc_addr, cm_node->loc_addr, sizeof(cm_info->loc_addr));
 220        memcpy(cm_info->rem_addr, cm_node->rem_addr, sizeof(cm_info->rem_addr));
 221        cm_info->loc_port = cm_node->loc_port;
 222        cm_info->rem_port = cm_node->rem_port;
 223        cm_info->user_pri = cm_node->user_pri;
 224}
 225
 226/**
 227 * i40iw_get_cmevent_info - for cm event upcall
 228 * @cm_node: connection's node
 229 * @cm_id: upper layers cm struct for the event
 230 * @event: upper layer's cm event
 231 */
 232static inline void i40iw_get_cmevent_info(struct i40iw_cm_node *cm_node,
 233                                          struct iw_cm_id *cm_id,
 234                                          struct iw_cm_event *event)
 235{
 236        memcpy(&event->local_addr, &cm_id->m_local_addr,
 237               sizeof(event->local_addr));
 238        memcpy(&event->remote_addr, &cm_id->m_remote_addr,
 239               sizeof(event->remote_addr));
 240        if (cm_node) {
 241                event->private_data = (void *)cm_node->pdata_buf;
 242                event->private_data_len = (u8)cm_node->pdata.size;
 243                event->ird = cm_node->ird_size;
 244                event->ord = cm_node->ord_size;
 245        }
 246}
 247
 248/**
 249 * i40iw_send_cm_event - upcall cm's event handler
 250 * @cm_node: connection's node
 251 * @cm_id: upper layer's cm info struct
 252 * @type: Event type to indicate
 253 * @status: status for the event type
 254 */
 255static int i40iw_send_cm_event(struct i40iw_cm_node *cm_node,
 256                               struct iw_cm_id *cm_id,
 257                               enum iw_cm_event_type type,
 258                               int status)
 259{
 260        struct iw_cm_event event;
 261
 262        memset(&event, 0, sizeof(event));
 263        event.event = type;
 264        event.status = status;
 265        switch (type) {
 266        case IW_CM_EVENT_CONNECT_REQUEST:
 267                if (cm_node->ipv4)
 268                        i40iw_fill_sockaddr4(cm_node, &event);
 269                else
 270                        i40iw_fill_sockaddr6(cm_node, &event);
 271                event.provider_data = (void *)cm_node;
 272                event.private_data = (void *)cm_node->pdata_buf;
 273                event.private_data_len = (u8)cm_node->pdata.size;
 274                event.ird = cm_node->ird_size;
 275                break;
 276        case IW_CM_EVENT_CONNECT_REPLY:
 277                i40iw_get_cmevent_info(cm_node, cm_id, &event);
 278                break;
 279        case IW_CM_EVENT_ESTABLISHED:
 280                event.ird = cm_node->ird_size;
 281                event.ord = cm_node->ord_size;
 282                break;
 283        case IW_CM_EVENT_DISCONNECT:
 284                break;
 285        case IW_CM_EVENT_CLOSE:
 286                break;
 287        default:
 288                i40iw_pr_err("event type received type = %d\n", type);
 289                return -1;
 290        }
 291        return cm_id->event_handler(cm_id, &event);
 292}
 293
 294/**
 295 * i40iw_create_event - create cm event
 296 * @cm_node: connection's node
 297 * @type: Event type to generate
 298 */
 299static struct i40iw_cm_event *i40iw_create_event(struct i40iw_cm_node *cm_node,
 300                                                 enum i40iw_cm_event_type type)
 301{
 302        struct i40iw_cm_event *event;
 303
 304        if (!cm_node->cm_id)
 305                return NULL;
 306
 307        event = kzalloc(sizeof(*event), GFP_ATOMIC);
 308
 309        if (!event)
 310                return NULL;
 311
 312        event->type = type;
 313        event->cm_node = cm_node;
 314        memcpy(event->cm_info.rem_addr, cm_node->rem_addr, sizeof(event->cm_info.rem_addr));
 315        memcpy(event->cm_info.loc_addr, cm_node->loc_addr, sizeof(event->cm_info.loc_addr));
 316        event->cm_info.rem_port = cm_node->rem_port;
 317        event->cm_info.loc_port = cm_node->loc_port;
 318        event->cm_info.cm_id = cm_node->cm_id;
 319
 320        i40iw_debug(cm_node->dev,
 321                    I40IW_DEBUG_CM,
 322                    "node=%p event=%p type=%u dst=%pI4 src=%pI4\n",
 323                    cm_node,
 324                    event,
 325                    type,
 326                    event->cm_info.loc_addr,
 327                    event->cm_info.rem_addr);
 328
 329        i40iw_cm_post_event(event);
 330        return event;
 331}
 332
 333/**
 334 * i40iw_free_retrans_entry - free send entry
 335 * @cm_node: connection's node
 336 */
 337static void i40iw_free_retrans_entry(struct i40iw_cm_node *cm_node)
 338{
 339        struct i40iw_device *iwdev = cm_node->iwdev;
 340        struct i40iw_timer_entry *send_entry;
 341
 342        send_entry = cm_node->send_entry;
 343        if (send_entry) {
 344                cm_node->send_entry = NULL;
 345                i40iw_free_sqbuf(&iwdev->vsi, (void *)send_entry->sqbuf);
 346                kfree(send_entry);
 347                atomic_dec(&cm_node->ref_count);
 348        }
 349}
 350
 351/**
 352 * i40iw_cleanup_retrans_entry - free send entry with lock
 353 * @cm_node: connection's node
 354 */
 355static void i40iw_cleanup_retrans_entry(struct i40iw_cm_node *cm_node)
 356{
 357        unsigned long flags;
 358
 359        spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
 360        i40iw_free_retrans_entry(cm_node);
 361        spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
 362}
 363
 364/**
 365 * i40iw_form_cm_frame - get a free packet and build frame
 366 * @cm_node: connection's node ionfo to use in frame
 367 * @options: pointer to options info
 368 * @hdr: pointer mpa header
 369 * @pdata: pointer to private data
 370 * @flags:  indicates FIN or ACK
 371 */
 372static struct i40iw_puda_buf *i40iw_form_cm_frame(struct i40iw_cm_node *cm_node,
 373                                                  struct i40iw_kmem_info *options,
 374                                                  struct i40iw_kmem_info *hdr,
 375                                                  struct i40iw_kmem_info *pdata,
 376                                                  u8 flags)
 377{
 378        struct i40iw_puda_buf *sqbuf;
 379        struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
 380        u8 *buf;
 381
 382        struct tcphdr *tcph;
 383        struct iphdr *iph;
 384        struct ipv6hdr *ip6h;
 385        struct ethhdr *ethh;
 386        u16 packetsize;
 387        u16 eth_hlen = ETH_HLEN;
 388        u32 opts_len = 0;
 389        u32 pd_len = 0;
 390        u32 hdr_len = 0;
 391        u16 vtag;
 392
 393        sqbuf = i40iw_puda_get_bufpool(vsi->ilq);
 394        if (!sqbuf)
 395                return NULL;
 396        buf = sqbuf->mem.va;
 397
 398        if (options)
 399                opts_len = (u32)options->size;
 400
 401        if (hdr)
 402                hdr_len = hdr->size;
 403
 404        if (pdata)
 405                pd_len = pdata->size;
 406
 407        if (cm_node->vlan_id <= VLAN_VID_MASK)
 408                eth_hlen += 4;
 409
 410        if (cm_node->ipv4)
 411                packetsize = sizeof(*iph) + sizeof(*tcph);
 412        else
 413                packetsize = sizeof(*ip6h) + sizeof(*tcph);
 414        packetsize += opts_len + hdr_len + pd_len;
 415
 416        memset(buf, 0x00, eth_hlen + packetsize);
 417
 418        sqbuf->totallen = packetsize + eth_hlen;
 419        sqbuf->maclen = eth_hlen;
 420        sqbuf->tcphlen = sizeof(*tcph) + opts_len;
 421        sqbuf->scratch = (void *)cm_node;
 422
 423        ethh = (struct ethhdr *)buf;
 424        buf += eth_hlen;
 425
 426        if (cm_node->ipv4) {
 427                sqbuf->ipv4 = true;
 428
 429                iph = (struct iphdr *)buf;
 430                buf += sizeof(*iph);
 431                tcph = (struct tcphdr *)buf;
 432                buf += sizeof(*tcph);
 433
 434                ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
 435                ether_addr_copy(ethh->h_source, cm_node->loc_mac);
 436                if (cm_node->vlan_id <= VLAN_VID_MASK) {
 437                        ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
 438                        vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
 439                        ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
 440
 441                        ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IP);
 442                } else {
 443                        ethh->h_proto = htons(ETH_P_IP);
 444                }
 445
 446                iph->version = IPVERSION;
 447                iph->ihl = 5;   /* 5 * 4Byte words, IP headr len */
 448                iph->tos = cm_node->tos;
 449                iph->tot_len = htons(packetsize);
 450                iph->id = htons(++cm_node->tcp_cntxt.loc_id);
 451
 452                iph->frag_off = htons(0x4000);
 453                iph->ttl = 0x40;
 454                iph->protocol = IPPROTO_TCP;
 455                iph->saddr = htonl(cm_node->loc_addr[0]);
 456                iph->daddr = htonl(cm_node->rem_addr[0]);
 457        } else {
 458                sqbuf->ipv4 = false;
 459                ip6h = (struct ipv6hdr *)buf;
 460                buf += sizeof(*ip6h);
 461                tcph = (struct tcphdr *)buf;
 462                buf += sizeof(*tcph);
 463
 464                ether_addr_copy(ethh->h_dest, cm_node->rem_mac);
 465                ether_addr_copy(ethh->h_source, cm_node->loc_mac);
 466                if (cm_node->vlan_id <= VLAN_VID_MASK) {
 467                        ((struct vlan_ethhdr *)ethh)->h_vlan_proto = htons(ETH_P_8021Q);
 468                        vtag = (cm_node->user_pri << VLAN_PRIO_SHIFT) | cm_node->vlan_id;
 469                        ((struct vlan_ethhdr *)ethh)->h_vlan_TCI = htons(vtag);
 470                        ((struct vlan_ethhdr *)ethh)->h_vlan_encapsulated_proto = htons(ETH_P_IPV6);
 471                } else {
 472                        ethh->h_proto = htons(ETH_P_IPV6);
 473                }
 474                ip6h->version = 6;
 475                ip6h->priority = cm_node->tos >> 4;
 476                ip6h->flow_lbl[0] = cm_node->tos << 4;
 477                ip6h->flow_lbl[1] = 0;
 478                ip6h->flow_lbl[2] = 0;
 479                ip6h->payload_len = htons(packetsize - sizeof(*ip6h));
 480                ip6h->nexthdr = 6;
 481                ip6h->hop_limit = 128;
 482                i40iw_copy_ip_htonl(ip6h->saddr.in6_u.u6_addr32,
 483                                    cm_node->loc_addr);
 484                i40iw_copy_ip_htonl(ip6h->daddr.in6_u.u6_addr32,
 485                                    cm_node->rem_addr);
 486        }
 487
 488        tcph->source = htons(cm_node->loc_port);
 489        tcph->dest = htons(cm_node->rem_port);
 490
 491        tcph->seq = htonl(cm_node->tcp_cntxt.loc_seq_num);
 492
 493        if (flags & SET_ACK) {
 494                cm_node->tcp_cntxt.loc_ack_num = cm_node->tcp_cntxt.rcv_nxt;
 495                tcph->ack_seq = htonl(cm_node->tcp_cntxt.loc_ack_num);
 496                tcph->ack = 1;
 497        } else {
 498                tcph->ack_seq = 0;
 499        }
 500
 501        if (flags & SET_SYN) {
 502                cm_node->tcp_cntxt.loc_seq_num++;
 503                tcph->syn = 1;
 504        } else {
 505                cm_node->tcp_cntxt.loc_seq_num += hdr_len + pd_len;
 506        }
 507
 508        if (flags & SET_FIN) {
 509                cm_node->tcp_cntxt.loc_seq_num++;
 510                tcph->fin = 1;
 511        }
 512
 513        if (flags & SET_RST)
 514                tcph->rst = 1;
 515
 516        tcph->doff = (u16)((sizeof(*tcph) + opts_len + 3) >> 2);
 517        sqbuf->tcphlen = tcph->doff << 2;
 518        tcph->window = htons(cm_node->tcp_cntxt.rcv_wnd);
 519        tcph->urg_ptr = 0;
 520
 521        if (opts_len) {
 522                memcpy(buf, options->addr, opts_len);
 523                buf += opts_len;
 524        }
 525
 526        if (hdr_len) {
 527                memcpy(buf, hdr->addr, hdr_len);
 528                buf += hdr_len;
 529        }
 530
 531        if (pdata && pdata->addr)
 532                memcpy(buf, pdata->addr, pdata->size);
 533
 534        atomic_set(&sqbuf->refcount, 1);
 535
 536        return sqbuf;
 537}
 538
 539/**
 540 * i40iw_send_reset - Send RST packet
 541 * @cm_node: connection's node
 542 */
 543int i40iw_send_reset(struct i40iw_cm_node *cm_node)
 544{
 545        struct i40iw_puda_buf *sqbuf;
 546        int flags = SET_RST | SET_ACK;
 547
 548        sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, flags);
 549        if (!sqbuf) {
 550                i40iw_pr_err("no sqbuf\n");
 551                return -1;
 552        }
 553
 554        return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 0, 1);
 555}
 556
 557/**
 558 * i40iw_active_open_err - send event for active side cm error
 559 * @cm_node: connection's node
 560 * @reset: Flag to send reset or not
 561 */
 562static void i40iw_active_open_err(struct i40iw_cm_node *cm_node, bool reset)
 563{
 564        i40iw_cleanup_retrans_entry(cm_node);
 565        cm_node->cm_core->stats_connect_errs++;
 566        if (reset) {
 567                i40iw_debug(cm_node->dev,
 568                            I40IW_DEBUG_CM,
 569                            "%s cm_node=%p state=%d\n",
 570                            __func__,
 571                            cm_node,
 572                            cm_node->state);
 573                atomic_inc(&cm_node->ref_count);
 574                i40iw_send_reset(cm_node);
 575        }
 576
 577        cm_node->state = I40IW_CM_STATE_CLOSED;
 578        i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
 579}
 580
 581/**
 582 * i40iw_passive_open_err - handle passive side cm error
 583 * @cm_node: connection's node
 584 * @reset: send reset or just free cm_node
 585 */
 586static void i40iw_passive_open_err(struct i40iw_cm_node *cm_node, bool reset)
 587{
 588        i40iw_cleanup_retrans_entry(cm_node);
 589        cm_node->cm_core->stats_passive_errs++;
 590        cm_node->state = I40IW_CM_STATE_CLOSED;
 591        i40iw_debug(cm_node->dev,
 592                    I40IW_DEBUG_CM,
 593                    "%s cm_node=%p state =%d\n",
 594                    __func__,
 595                    cm_node,
 596                    cm_node->state);
 597        if (reset)
 598                i40iw_send_reset(cm_node);
 599        else
 600                i40iw_rem_ref_cm_node(cm_node);
 601}
 602
 603/**
 604 * i40iw_event_connect_error - to create connect error event
 605 * @event: cm information for connect event
 606 */
 607static void i40iw_event_connect_error(struct i40iw_cm_event *event)
 608{
 609        struct i40iw_qp *iwqp;
 610        struct iw_cm_id *cm_id;
 611
 612        cm_id = event->cm_node->cm_id;
 613        if (!cm_id)
 614                return;
 615
 616        iwqp = cm_id->provider_data;
 617
 618        if (!iwqp || !iwqp->iwdev)
 619                return;
 620
 621        iwqp->cm_id = NULL;
 622        cm_id->provider_data = NULL;
 623        i40iw_send_cm_event(event->cm_node, cm_id,
 624                            IW_CM_EVENT_CONNECT_REPLY,
 625                            -ECONNRESET);
 626        cm_id->rem_ref(cm_id);
 627        i40iw_rem_ref_cm_node(event->cm_node);
 628}
 629
 630/**
 631 * i40iw_process_options
 632 * @cm_node: connection's node
 633 * @optionsloc: point to start of options
 634 * @optionsize: size of all options
 635 * @syn_packet: flag if syn packet
 636 */
 637static int i40iw_process_options(struct i40iw_cm_node *cm_node,
 638                                 u8 *optionsloc,
 639                                 u32 optionsize,
 640                                 u32 syn_packet)
 641{
 642        u32 tmp;
 643        u32 offset = 0;
 644        union all_known_options *all_options;
 645        char got_mss_option = 0;
 646
 647        while (offset < optionsize) {
 648                all_options = (union all_known_options *)(optionsloc + offset);
 649                switch (all_options->as_base.optionnum) {
 650                case OPTION_NUMBER_END:
 651                        offset = optionsize;
 652                        break;
 653                case OPTION_NUMBER_NONE:
 654                        offset += 1;
 655                        continue;
 656                case OPTION_NUMBER_MSS:
 657                        i40iw_debug(cm_node->dev,
 658                                    I40IW_DEBUG_CM,
 659                                    "%s: MSS Length: %d Offset: %d Size: %d\n",
 660                                    __func__,
 661                                    all_options->as_mss.length,
 662                                    offset,
 663                                    optionsize);
 664                        got_mss_option = 1;
 665                        if (all_options->as_mss.length != 4)
 666                                return -1;
 667                        tmp = ntohs(all_options->as_mss.mss);
 668                        if (tmp > 0 && tmp < cm_node->tcp_cntxt.mss)
 669                                cm_node->tcp_cntxt.mss = tmp;
 670                        break;
 671                case OPTION_NUMBER_WINDOW_SCALE:
 672                        cm_node->tcp_cntxt.snd_wscale =
 673                            all_options->as_windowscale.shiftcount;
 674                        break;
 675                default:
 676                        i40iw_debug(cm_node->dev,
 677                                    I40IW_DEBUG_CM,
 678                                    "TCP Option not understood: %x\n",
 679                                    all_options->as_base.optionnum);
 680                        break;
 681                }
 682                offset += all_options->as_base.length;
 683        }
 684        if (!got_mss_option && syn_packet)
 685                cm_node->tcp_cntxt.mss = I40IW_CM_DEFAULT_MSS;
 686        return 0;
 687}
 688
 689/**
 690 * i40iw_handle_tcp_options -
 691 * @cm_node: connection's node
 692 * @tcph: pointer tcp header
 693 * @optionsize: size of options rcvd
 694 * @passive: active or passive flag
 695 */
 696static int i40iw_handle_tcp_options(struct i40iw_cm_node *cm_node,
 697                                    struct tcphdr *tcph,
 698                                    int optionsize,
 699                                    int passive)
 700{
 701        u8 *optionsloc = (u8 *)&tcph[1];
 702
 703        if (optionsize) {
 704                if (i40iw_process_options(cm_node,
 705                                          optionsloc,
 706                                          optionsize,
 707                                          (u32)tcph->syn)) {
 708                        i40iw_debug(cm_node->dev,
 709                                    I40IW_DEBUG_CM,
 710                                    "%s: Node %p, Sending RESET\n",
 711                                    __func__,
 712                                    cm_node);
 713                        if (passive)
 714                                i40iw_passive_open_err(cm_node, true);
 715                        else
 716                                i40iw_active_open_err(cm_node, true);
 717                        return -1;
 718                }
 719        }
 720
 721        cm_node->tcp_cntxt.snd_wnd = ntohs(tcph->window) <<
 722            cm_node->tcp_cntxt.snd_wscale;
 723
 724        if (cm_node->tcp_cntxt.snd_wnd > cm_node->tcp_cntxt.max_snd_wnd)
 725                cm_node->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.snd_wnd;
 726        return 0;
 727}
 728
 729/**
 730 * i40iw_build_mpa_v1 - build a MPA V1 frame
 731 * @cm_node: connection's node
 732 * @mpa_key: to do read0 or write0
 733 */
 734static void i40iw_build_mpa_v1(struct i40iw_cm_node *cm_node,
 735                               void *start_addr,
 736                               u8 mpa_key)
 737{
 738        struct ietf_mpa_v1 *mpa_frame = (struct ietf_mpa_v1 *)start_addr;
 739
 740        switch (mpa_key) {
 741        case MPA_KEY_REQUEST:
 742                memcpy(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE);
 743                break;
 744        case MPA_KEY_REPLY:
 745                memcpy(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE);
 746                break;
 747        default:
 748                break;
 749        }
 750        mpa_frame->flags = IETF_MPA_FLAGS_CRC;
 751        mpa_frame->rev = cm_node->mpa_frame_rev;
 752        mpa_frame->priv_data_len = htons(cm_node->pdata.size);
 753}
 754
 755/**
 756 * i40iw_build_mpa_v2 - build a MPA V2 frame
 757 * @cm_node: connection's node
 758 * @start_addr: buffer start address
 759 * @mpa_key: to do read0 or write0
 760 */
 761static void i40iw_build_mpa_v2(struct i40iw_cm_node *cm_node,
 762                               void *start_addr,
 763                               u8 mpa_key)
 764{
 765        struct ietf_mpa_v2 *mpa_frame = (struct ietf_mpa_v2 *)start_addr;
 766        struct ietf_rtr_msg *rtr_msg = &mpa_frame->rtr_msg;
 767        u16 ctrl_ird, ctrl_ord;
 768
 769        /* initialize the upper 5 bytes of the frame */
 770        i40iw_build_mpa_v1(cm_node, start_addr, mpa_key);
 771        mpa_frame->flags |= IETF_MPA_V2_FLAG;
 772        mpa_frame->priv_data_len += htons(IETF_RTR_MSG_SIZE);
 773
 774        /* initialize RTR msg */
 775        if (cm_node->mpav2_ird_ord == IETF_NO_IRD_ORD) {
 776                ctrl_ird = IETF_NO_IRD_ORD;
 777                ctrl_ord = IETF_NO_IRD_ORD;
 778        } else {
 779                ctrl_ird = (cm_node->ird_size > IETF_NO_IRD_ORD) ?
 780                        IETF_NO_IRD_ORD : cm_node->ird_size;
 781                ctrl_ord = (cm_node->ord_size > IETF_NO_IRD_ORD) ?
 782                        IETF_NO_IRD_ORD : cm_node->ord_size;
 783        }
 784
 785        ctrl_ird |= IETF_PEER_TO_PEER;
 786
 787        switch (mpa_key) {
 788        case MPA_KEY_REQUEST:
 789                ctrl_ord |= IETF_RDMA0_WRITE;
 790                ctrl_ord |= IETF_RDMA0_READ;
 791                break;
 792        case MPA_KEY_REPLY:
 793                switch (cm_node->send_rdma0_op) {
 794                case SEND_RDMA_WRITE_ZERO:
 795                        ctrl_ord |= IETF_RDMA0_WRITE;
 796                        break;
 797                case SEND_RDMA_READ_ZERO:
 798                        ctrl_ord |= IETF_RDMA0_READ;
 799                        break;
 800                }
 801                break;
 802        default:
 803                break;
 804        }
 805        rtr_msg->ctrl_ird = htons(ctrl_ird);
 806        rtr_msg->ctrl_ord = htons(ctrl_ord);
 807}
 808
 809/**
 810 * i40iw_cm_build_mpa_frame - build mpa frame for mpa version 1 or version 2
 811 * @cm_node: connection's node
 812 * @mpa: mpa: data buffer
 813 * @mpa_key: to do read0 or write0
 814 */
 815static int i40iw_cm_build_mpa_frame(struct i40iw_cm_node *cm_node,
 816                                    struct i40iw_kmem_info *mpa,
 817                                    u8 mpa_key)
 818{
 819        int hdr_len = 0;
 820
 821        switch (cm_node->mpa_frame_rev) {
 822        case IETF_MPA_V1:
 823                hdr_len = sizeof(struct ietf_mpa_v1);
 824                i40iw_build_mpa_v1(cm_node, mpa->addr, mpa_key);
 825                break;
 826        case IETF_MPA_V2:
 827                hdr_len = sizeof(struct ietf_mpa_v2);
 828                i40iw_build_mpa_v2(cm_node, mpa->addr, mpa_key);
 829                break;
 830        default:
 831                break;
 832        }
 833
 834        return hdr_len;
 835}
 836
 837/**
 838 * i40iw_send_mpa_request - active node send mpa request to passive node
 839 * @cm_node: connection's node
 840 */
 841static int i40iw_send_mpa_request(struct i40iw_cm_node *cm_node)
 842{
 843        struct i40iw_puda_buf *sqbuf;
 844
 845        if (!cm_node) {
 846                i40iw_pr_err("cm_node == NULL\n");
 847                return -1;
 848        }
 849
 850        cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
 851        cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
 852                                                         &cm_node->mpa_hdr,
 853                                                         MPA_KEY_REQUEST);
 854        if (!cm_node->mpa_hdr.size) {
 855                i40iw_pr_err("mpa size = %d\n", cm_node->mpa_hdr.size);
 856                return -1;
 857        }
 858
 859        sqbuf = i40iw_form_cm_frame(cm_node,
 860                                    NULL,
 861                                    &cm_node->mpa_hdr,
 862                                    &cm_node->pdata,
 863                                    SET_ACK);
 864        if (!sqbuf) {
 865                i40iw_pr_err("sq_buf == NULL\n");
 866                return -1;
 867        }
 868        return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
 869}
 870
 871/**
 872 * i40iw_send_mpa_reject -
 873 * @cm_node: connection's node
 874 * @pdata: reject data for connection
 875 * @plen: length of reject data
 876 */
 877static int i40iw_send_mpa_reject(struct i40iw_cm_node *cm_node,
 878                                 const void *pdata,
 879                                 u8 plen)
 880{
 881        struct i40iw_puda_buf *sqbuf;
 882        struct i40iw_kmem_info priv_info;
 883
 884        cm_node->mpa_hdr.addr = &cm_node->mpa_frame;
 885        cm_node->mpa_hdr.size = i40iw_cm_build_mpa_frame(cm_node,
 886                                                         &cm_node->mpa_hdr,
 887                                                         MPA_KEY_REPLY);
 888
 889        cm_node->mpa_frame.flags |= IETF_MPA_FLAGS_REJECT;
 890        priv_info.addr = (void *)pdata;
 891        priv_info.size = plen;
 892
 893        sqbuf = i40iw_form_cm_frame(cm_node,
 894                                    NULL,
 895                                    &cm_node->mpa_hdr,
 896                                    &priv_info,
 897                                    SET_ACK | SET_FIN);
 898        if (!sqbuf) {
 899                i40iw_pr_err("no sqbuf\n");
 900                return -ENOMEM;
 901        }
 902        cm_node->state = I40IW_CM_STATE_FIN_WAIT1;
 903        return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
 904}
 905
 906/**
 907 * recv_mpa - process an IETF MPA frame
 908 * @cm_node: connection's node
 909 * @buffer: Data pointer
 910 * @type: to return accept or reject
 911 * @len: Len of mpa buffer
 912 */
 913static int i40iw_parse_mpa(struct i40iw_cm_node *cm_node, u8 *buffer, u32 *type, u32 len)
 914{
 915        struct ietf_mpa_v1 *mpa_frame;
 916        struct ietf_mpa_v2 *mpa_v2_frame;
 917        struct ietf_rtr_msg *rtr_msg;
 918        int mpa_hdr_len;
 919        int priv_data_len;
 920
 921        *type = I40IW_MPA_REQUEST_ACCEPT;
 922
 923        if (len < sizeof(struct ietf_mpa_v1)) {
 924                i40iw_pr_err("ietf buffer small (%x)\n", len);
 925                return -1;
 926        }
 927
 928        mpa_frame = (struct ietf_mpa_v1 *)buffer;
 929        mpa_hdr_len = sizeof(struct ietf_mpa_v1);
 930        priv_data_len = ntohs(mpa_frame->priv_data_len);
 931
 932        if (priv_data_len > IETF_MAX_PRIV_DATA_LEN) {
 933                i40iw_pr_err("large pri_data %d\n", priv_data_len);
 934                return -1;
 935        }
 936        if (mpa_frame->rev != IETF_MPA_V1 && mpa_frame->rev != IETF_MPA_V2) {
 937                i40iw_pr_err("unsupported mpa rev = %d\n", mpa_frame->rev);
 938                return -1;
 939        }
 940        if (mpa_frame->rev > cm_node->mpa_frame_rev) {
 941                i40iw_pr_err("rev %d\n", mpa_frame->rev);
 942                return -1;
 943        }
 944        cm_node->mpa_frame_rev = mpa_frame->rev;
 945
 946        if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
 947                if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REQ, IETF_MPA_KEY_SIZE)) {
 948                        i40iw_pr_err("Unexpected MPA Key received\n");
 949                        return -1;
 950                }
 951        } else {
 952                if (memcmp(mpa_frame->key, IEFT_MPA_KEY_REP, IETF_MPA_KEY_SIZE)) {
 953                        i40iw_pr_err("Unexpected MPA Key received\n");
 954                        return -1;
 955                }
 956        }
 957
 958        if (priv_data_len + mpa_hdr_len > len) {
 959                i40iw_pr_err("ietf buffer len(%x + %x != %x)\n",
 960                             priv_data_len, mpa_hdr_len, len);
 961                return -1;
 962        }
 963        if (len > MAX_CM_BUFFER) {
 964                i40iw_pr_err("ietf buffer large len = %d\n", len);
 965                return -1;
 966        }
 967
 968        switch (mpa_frame->rev) {
 969        case IETF_MPA_V2:{
 970                        u16 ird_size;
 971                        u16 ord_size;
 972                        u16 ctrl_ord;
 973                        u16 ctrl_ird;
 974
 975                        mpa_v2_frame = (struct ietf_mpa_v2 *)buffer;
 976                        mpa_hdr_len += IETF_RTR_MSG_SIZE;
 977                        rtr_msg = &mpa_v2_frame->rtr_msg;
 978
 979                        /* parse rtr message */
 980                        ctrl_ord = ntohs(rtr_msg->ctrl_ord);
 981                        ctrl_ird = ntohs(rtr_msg->ctrl_ird);
 982                        ird_size = ctrl_ird & IETF_NO_IRD_ORD;
 983                        ord_size = ctrl_ord & IETF_NO_IRD_ORD;
 984
 985                        if (!(ctrl_ird & IETF_PEER_TO_PEER))
 986                                return -1;
 987
 988                        if (ird_size == IETF_NO_IRD_ORD || ord_size == IETF_NO_IRD_ORD) {
 989                                cm_node->mpav2_ird_ord = IETF_NO_IRD_ORD;
 990                                goto negotiate_done;
 991                        }
 992
 993                        if (cm_node->state != I40IW_CM_STATE_MPAREQ_SENT) {
 994                                /* responder */
 995                                if (!ord_size && (ctrl_ord & IETF_RDMA0_READ))
 996                                        cm_node->ird_size = 1;
 997                                if (cm_node->ord_size > ird_size)
 998                                        cm_node->ord_size = ird_size;
 999                        } else {
1000                                /* initiator */
1001                                if (!ird_size && (ctrl_ord & IETF_RDMA0_READ))
1002                                        return -1;
1003                                if (cm_node->ord_size > ird_size)
1004                                        cm_node->ord_size = ird_size;
1005
1006                                if (cm_node->ird_size < ord_size)
1007                                        /* no resources available */
1008                                        return -1;
1009                        }
1010
1011negotiate_done:
1012                        if (ctrl_ord & IETF_RDMA0_READ)
1013                                cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
1014                        else if (ctrl_ord & IETF_RDMA0_WRITE)
1015                                cm_node->send_rdma0_op = SEND_RDMA_WRITE_ZERO;
1016                        else    /* Not supported RDMA0 operation */
1017                                return -1;
1018                        i40iw_debug(cm_node->dev, I40IW_DEBUG_CM,
1019                                    "MPAV2: Negotiated ORD: %d, IRD: %d\n",
1020                                    cm_node->ord_size, cm_node->ird_size);
1021                        break;
1022                }
1023                break;
1024        case IETF_MPA_V1:
1025        default:
1026                break;
1027        }
1028
1029        memcpy(cm_node->pdata_buf, buffer + mpa_hdr_len, priv_data_len);
1030        cm_node->pdata.size = priv_data_len;
1031
1032        if (mpa_frame->flags & IETF_MPA_FLAGS_REJECT)
1033                *type = I40IW_MPA_REQUEST_REJECT;
1034
1035        if (mpa_frame->flags & IETF_MPA_FLAGS_MARKERS)
1036                cm_node->snd_mark_en = true;
1037
1038        return 0;
1039}
1040
1041/**
1042 * i40iw_schedule_cm_timer
1043 * @@cm_node: connection's node
1044 * @sqbuf: buffer to send
1045 * @type: if it is send or close
1046 * @send_retrans: if rexmits to be done
1047 * @close_when_complete: is cm_node to be removed
1048 *
1049 * note - cm_node needs to be protected before calling this. Encase in:
1050 *              i40iw_rem_ref_cm_node(cm_core, cm_node);
1051 *              i40iw_schedule_cm_timer(...)
1052 *              atomic_inc(&cm_node->ref_count);
1053 */
1054int i40iw_schedule_cm_timer(struct i40iw_cm_node *cm_node,
1055                            struct i40iw_puda_buf *sqbuf,
1056                            enum i40iw_timer_type type,
1057                            int send_retrans,
1058                            int close_when_complete)
1059{
1060        struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1061        struct i40iw_cm_core *cm_core = cm_node->cm_core;
1062        struct i40iw_timer_entry *new_send;
1063        int ret = 0;
1064        u32 was_timer_set;
1065        unsigned long flags;
1066
1067        new_send = kzalloc(sizeof(*new_send), GFP_ATOMIC);
1068        if (!new_send) {
1069                if (type != I40IW_TIMER_TYPE_CLOSE)
1070                        i40iw_free_sqbuf(vsi, (void *)sqbuf);
1071                return -ENOMEM;
1072        }
1073        new_send->retrycount = I40IW_DEFAULT_RETRYS;
1074        new_send->retranscount = I40IW_DEFAULT_RETRANS;
1075        new_send->sqbuf = sqbuf;
1076        new_send->timetosend = jiffies;
1077        new_send->type = type;
1078        new_send->send_retrans = send_retrans;
1079        new_send->close_when_complete = close_when_complete;
1080
1081        if (type == I40IW_TIMER_TYPE_CLOSE) {
1082                new_send->timetosend += (HZ / 10);
1083                if (cm_node->close_entry) {
1084                        kfree(new_send);
1085                        i40iw_pr_err("already close entry\n");
1086                        return -EINVAL;
1087                }
1088                cm_node->close_entry = new_send;
1089        }
1090
1091        if (type == I40IW_TIMER_TYPE_SEND) {
1092                spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1093                cm_node->send_entry = new_send;
1094                atomic_inc(&cm_node->ref_count);
1095                spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1096                new_send->timetosend = jiffies + I40IW_RETRY_TIMEOUT;
1097
1098                atomic_inc(&sqbuf->refcount);
1099                i40iw_puda_send_buf(vsi->ilq, sqbuf);
1100                if (!send_retrans) {
1101                        i40iw_cleanup_retrans_entry(cm_node);
1102                        if (close_when_complete)
1103                                i40iw_rem_ref_cm_node(cm_node);
1104                        return ret;
1105                }
1106        }
1107
1108        spin_lock_irqsave(&cm_core->ht_lock, flags);
1109        was_timer_set = timer_pending(&cm_core->tcp_timer);
1110
1111        if (!was_timer_set) {
1112                cm_core->tcp_timer.expires = new_send->timetosend;
1113                add_timer(&cm_core->tcp_timer);
1114        }
1115        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1116
1117        return ret;
1118}
1119
1120/**
1121 * i40iw_retrans_expired - Could not rexmit the packet
1122 * @cm_node: connection's node
1123 */
1124static void i40iw_retrans_expired(struct i40iw_cm_node *cm_node)
1125{
1126        struct iw_cm_id *cm_id = cm_node->cm_id;
1127        enum i40iw_cm_node_state state = cm_node->state;
1128
1129        cm_node->state = I40IW_CM_STATE_CLOSED;
1130        switch (state) {
1131        case I40IW_CM_STATE_SYN_RCVD:
1132        case I40IW_CM_STATE_CLOSING:
1133                i40iw_rem_ref_cm_node(cm_node);
1134                break;
1135        case I40IW_CM_STATE_FIN_WAIT1:
1136        case I40IW_CM_STATE_LAST_ACK:
1137                if (cm_node->cm_id)
1138                        cm_id->rem_ref(cm_id);
1139                i40iw_send_reset(cm_node);
1140                break;
1141        default:
1142                atomic_inc(&cm_node->ref_count);
1143                i40iw_send_reset(cm_node);
1144                i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
1145                break;
1146        }
1147}
1148
1149/**
1150 * i40iw_handle_close_entry - for handling retry/timeouts
1151 * @cm_node: connection's node
1152 * @rem_node: flag for remove cm_node
1153 */
1154static void i40iw_handle_close_entry(struct i40iw_cm_node *cm_node, u32 rem_node)
1155{
1156        struct i40iw_timer_entry *close_entry = cm_node->close_entry;
1157        struct iw_cm_id *cm_id = cm_node->cm_id;
1158        struct i40iw_qp *iwqp;
1159        unsigned long flags;
1160
1161        if (!close_entry)
1162                return;
1163        iwqp = (struct i40iw_qp *)close_entry->sqbuf;
1164        if (iwqp) {
1165                spin_lock_irqsave(&iwqp->lock, flags);
1166                if (iwqp->cm_id) {
1167                        iwqp->hw_tcp_state = I40IW_TCP_STATE_CLOSED;
1168                        iwqp->hw_iwarp_state = I40IW_QP_STATE_ERROR;
1169                        iwqp->last_aeq = I40IW_AE_RESET_SENT;
1170                        iwqp->ibqp_state = IB_QPS_ERR;
1171                        spin_unlock_irqrestore(&iwqp->lock, flags);
1172                        i40iw_cm_disconn(iwqp);
1173                } else {
1174                        spin_unlock_irqrestore(&iwqp->lock, flags);
1175                }
1176        } else if (rem_node) {
1177                /* TIME_WAIT state */
1178                i40iw_rem_ref_cm_node(cm_node);
1179        }
1180        if (cm_id)
1181                cm_id->rem_ref(cm_id);
1182        kfree(close_entry);
1183        cm_node->close_entry = NULL;
1184}
1185
1186/**
1187 * i40iw_build_timer_list - Add cm_nodes to timer list
1188 * @timer_list: ptr to timer list
1189 * @hte: ptr to accelerated or non-accelerated list
1190 */
1191static void i40iw_build_timer_list(struct list_head *timer_list,
1192                                   struct list_head *hte)
1193{
1194        struct i40iw_cm_node *cm_node;
1195        struct list_head *list_core_temp, *list_node;
1196
1197        list_for_each_safe(list_node, list_core_temp, hte) {
1198                cm_node = container_of(list_node, struct i40iw_cm_node, list);
1199                if (cm_node->close_entry || cm_node->send_entry) {
1200                        atomic_inc(&cm_node->ref_count);
1201                        list_add(&cm_node->timer_entry, timer_list);
1202                }
1203        }
1204}
1205
1206/**
1207 * i40iw_cm_timer_tick - system's timer expired callback
1208 * @pass: Pointing to cm_core
1209 */
1210static void i40iw_cm_timer_tick(struct timer_list *t)
1211{
1212        unsigned long nexttimeout = jiffies + I40IW_LONG_TIME;
1213        struct i40iw_cm_node *cm_node;
1214        struct i40iw_timer_entry *send_entry, *close_entry;
1215        struct list_head *list_core_temp;
1216        struct i40iw_sc_vsi *vsi;
1217        struct list_head *list_node;
1218        struct i40iw_cm_core *cm_core = from_timer(cm_core, t, tcp_timer);
1219        u32 settimer = 0;
1220        unsigned long timetosend;
1221        unsigned long flags;
1222
1223        struct list_head timer_list;
1224
1225        INIT_LIST_HEAD(&timer_list);
1226
1227        spin_lock_irqsave(&cm_core->ht_lock, flags);
1228        i40iw_build_timer_list(&timer_list, &cm_core->non_accelerated_list);
1229        i40iw_build_timer_list(&timer_list, &cm_core->accelerated_list);
1230        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1231
1232        list_for_each_safe(list_node, list_core_temp, &timer_list) {
1233                cm_node = container_of(list_node,
1234                                       struct i40iw_cm_node,
1235                                       timer_entry);
1236                close_entry = cm_node->close_entry;
1237
1238                if (close_entry) {
1239                        if (time_after(close_entry->timetosend, jiffies)) {
1240                                if (nexttimeout > close_entry->timetosend ||
1241                                    !settimer) {
1242                                        nexttimeout = close_entry->timetosend;
1243                                        settimer = 1;
1244                                }
1245                        } else {
1246                                i40iw_handle_close_entry(cm_node, 1);
1247                        }
1248                }
1249
1250                spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1251
1252                send_entry = cm_node->send_entry;
1253                if (!send_entry)
1254                        goto done;
1255                if (time_after(send_entry->timetosend, jiffies)) {
1256                        if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
1257                                if ((nexttimeout > send_entry->timetosend) ||
1258                                    !settimer) {
1259                                        nexttimeout = send_entry->timetosend;
1260                                        settimer = 1;
1261                                }
1262                        } else {
1263                                i40iw_free_retrans_entry(cm_node);
1264                        }
1265                        goto done;
1266                }
1267
1268                if ((cm_node->state == I40IW_CM_STATE_OFFLOADED) ||
1269                    (cm_node->state == I40IW_CM_STATE_CLOSED)) {
1270                        i40iw_free_retrans_entry(cm_node);
1271                        goto done;
1272                }
1273
1274                if (!send_entry->retranscount || !send_entry->retrycount) {
1275                        i40iw_free_retrans_entry(cm_node);
1276
1277                        spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1278                        i40iw_retrans_expired(cm_node);
1279                        cm_node->state = I40IW_CM_STATE_CLOSED;
1280                        spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1281                        goto done;
1282                }
1283                spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1284
1285                vsi = &cm_node->iwdev->vsi;
1286
1287                if (!cm_node->ack_rcvd) {
1288                        atomic_inc(&send_entry->sqbuf->refcount);
1289                        i40iw_puda_send_buf(vsi->ilq, send_entry->sqbuf);
1290                        cm_node->cm_core->stats_pkt_retrans++;
1291                }
1292                spin_lock_irqsave(&cm_node->retrans_list_lock, flags);
1293                if (send_entry->send_retrans) {
1294                        send_entry->retranscount--;
1295                        timetosend = (I40IW_RETRY_TIMEOUT <<
1296                                      (I40IW_DEFAULT_RETRANS -
1297                                       send_entry->retranscount));
1298
1299                        send_entry->timetosend = jiffies +
1300                            min(timetosend, I40IW_MAX_TIMEOUT);
1301                        if (nexttimeout > send_entry->timetosend || !settimer) {
1302                                nexttimeout = send_entry->timetosend;
1303                                settimer = 1;
1304                        }
1305                } else {
1306                        int close_when_complete;
1307
1308                        close_when_complete = send_entry->close_when_complete;
1309                        i40iw_debug(cm_node->dev,
1310                                    I40IW_DEBUG_CM,
1311                                    "cm_node=%p state=%d\n",
1312                                    cm_node,
1313                                    cm_node->state);
1314                        i40iw_free_retrans_entry(cm_node);
1315                        if (close_when_complete)
1316                                i40iw_rem_ref_cm_node(cm_node);
1317                }
1318done:
1319                spin_unlock_irqrestore(&cm_node->retrans_list_lock, flags);
1320                i40iw_rem_ref_cm_node(cm_node);
1321        }
1322
1323        if (settimer) {
1324                spin_lock_irqsave(&cm_core->ht_lock, flags);
1325                if (!timer_pending(&cm_core->tcp_timer)) {
1326                        cm_core->tcp_timer.expires = nexttimeout;
1327                        add_timer(&cm_core->tcp_timer);
1328                }
1329                spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1330        }
1331}
1332
1333/**
1334 * i40iw_send_syn - send SYN packet
1335 * @cm_node: connection's node
1336 * @sendack: flag to set ACK bit or not
1337 */
1338int i40iw_send_syn(struct i40iw_cm_node *cm_node, u32 sendack)
1339{
1340        struct i40iw_puda_buf *sqbuf;
1341        int flags = SET_SYN;
1342        char optionsbuffer[sizeof(struct option_mss) +
1343                           sizeof(struct option_windowscale) +
1344                           sizeof(struct option_base) + TCP_OPTIONS_PADDING];
1345        struct i40iw_kmem_info opts;
1346
1347        int optionssize = 0;
1348        /* Sending MSS option */
1349        union all_known_options *options;
1350
1351        opts.addr = optionsbuffer;
1352        if (!cm_node) {
1353                i40iw_pr_err("no cm_node\n");
1354                return -EINVAL;
1355        }
1356
1357        options = (union all_known_options *)&optionsbuffer[optionssize];
1358        options->as_mss.optionnum = OPTION_NUMBER_MSS;
1359        options->as_mss.length = sizeof(struct option_mss);
1360        options->as_mss.mss = htons(cm_node->tcp_cntxt.mss);
1361        optionssize += sizeof(struct option_mss);
1362
1363        options = (union all_known_options *)&optionsbuffer[optionssize];
1364        options->as_windowscale.optionnum = OPTION_NUMBER_WINDOW_SCALE;
1365        options->as_windowscale.length = sizeof(struct option_windowscale);
1366        options->as_windowscale.shiftcount = cm_node->tcp_cntxt.rcv_wscale;
1367        optionssize += sizeof(struct option_windowscale);
1368        options = (union all_known_options *)&optionsbuffer[optionssize];
1369        options->as_end = OPTION_NUMBER_END;
1370        optionssize += 1;
1371
1372        if (sendack)
1373                flags |= SET_ACK;
1374
1375        opts.size = optionssize;
1376
1377        sqbuf = i40iw_form_cm_frame(cm_node, &opts, NULL, NULL, flags);
1378        if (!sqbuf) {
1379                i40iw_pr_err("no sqbuf\n");
1380                return -1;
1381        }
1382        return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1383}
1384
1385/**
1386 * i40iw_send_ack - Send ACK packet
1387 * @cm_node: connection's node
1388 */
1389static void i40iw_send_ack(struct i40iw_cm_node *cm_node)
1390{
1391        struct i40iw_puda_buf *sqbuf;
1392        struct i40iw_sc_vsi *vsi = &cm_node->iwdev->vsi;
1393
1394        sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK);
1395        if (sqbuf)
1396                i40iw_puda_send_buf(vsi->ilq, sqbuf);
1397        else
1398                i40iw_pr_err("no sqbuf\n");
1399}
1400
1401/**
1402 * i40iw_send_fin - Send FIN pkt
1403 * @cm_node: connection's node
1404 */
1405static int i40iw_send_fin(struct i40iw_cm_node *cm_node)
1406{
1407        struct i40iw_puda_buf *sqbuf;
1408
1409        sqbuf = i40iw_form_cm_frame(cm_node, NULL, NULL, NULL, SET_ACK | SET_FIN);
1410        if (!sqbuf) {
1411                i40iw_pr_err("no sqbuf\n");
1412                return -1;
1413        }
1414        return i40iw_schedule_cm_timer(cm_node, sqbuf, I40IW_TIMER_TYPE_SEND, 1, 0);
1415}
1416
1417/**
1418 * i40iw_find_node - find a cm node that matches the reference cm node
1419 * @cm_core: cm's core
1420 * @rem_port: remote tcp port num
1421 * @rem_addr: remote ip addr
1422 * @loc_port: local tcp port num
1423 * @loc_addr: loc ip addr
1424 * @add_refcnt: flag to increment refcount of cm_node
1425 * @accelerated_list: flag for accelerated vs non-accelerated list to search
1426 */
1427struct i40iw_cm_node *i40iw_find_node(struct i40iw_cm_core *cm_core,
1428                                      u16 rem_port,
1429                                      u32 *rem_addr,
1430                                      u16 loc_port,
1431                                      u32 *loc_addr,
1432                                      bool add_refcnt,
1433                                      bool accelerated_list)
1434{
1435        struct list_head *hte;
1436        struct i40iw_cm_node *cm_node;
1437        unsigned long flags;
1438
1439        hte = accelerated_list ?
1440              &cm_core->accelerated_list : &cm_core->non_accelerated_list;
1441
1442        /* walk list and find cm_node associated with this session ID */
1443        spin_lock_irqsave(&cm_core->ht_lock, flags);
1444        list_for_each_entry(cm_node, hte, list) {
1445                if (!memcmp(cm_node->loc_addr, loc_addr, sizeof(cm_node->loc_addr)) &&
1446                    (cm_node->loc_port == loc_port) &&
1447                    !memcmp(cm_node->rem_addr, rem_addr, sizeof(cm_node->rem_addr)) &&
1448                    (cm_node->rem_port == rem_port)) {
1449                        if (add_refcnt)
1450                                atomic_inc(&cm_node->ref_count);
1451                        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1452                        return cm_node;
1453                }
1454        }
1455        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1456
1457        /* no owner node */
1458        return NULL;
1459}
1460
1461/**
1462 * i40iw_find_listener - find a cm node listening on this addr-port pair
1463 * @cm_core: cm's core
1464 * @dst_port: listener tcp port num
1465 * @dst_addr: listener ip addr
1466 * @listener_state: state to match with listen node's
1467 */
1468static struct i40iw_cm_listener *i40iw_find_listener(
1469                                                     struct i40iw_cm_core *cm_core,
1470                                                     u32 *dst_addr,
1471                                                     u16 dst_port,
1472                                                     u16 vlan_id,
1473                                                     enum i40iw_cm_listener_state
1474                                                     listener_state)
1475{
1476        struct i40iw_cm_listener *listen_node;
1477        static const u32 ip_zero[4] = { 0, 0, 0, 0 };
1478        u32 listen_addr[4];
1479        u16 listen_port;
1480        unsigned long flags;
1481
1482        /* walk list and find cm_node associated with this session ID */
1483        spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1484        list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1485                memcpy(listen_addr, listen_node->loc_addr, sizeof(listen_addr));
1486                listen_port = listen_node->loc_port;
1487                /* compare node pair, return node handle if a match */
1488                if ((!memcmp(listen_addr, dst_addr, sizeof(listen_addr)) ||
1489                     !memcmp(listen_addr, ip_zero, sizeof(listen_addr))) &&
1490                     (listen_port == dst_port) &&
1491                     (listener_state & listen_node->listener_state)) {
1492                        atomic_inc(&listen_node->ref_count);
1493                        spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1494                        return listen_node;
1495                }
1496        }
1497        spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1498        return NULL;
1499}
1500
1501/**
1502 * i40iw_add_hte_node - add a cm node to the hash table
1503 * @cm_core: cm's core
1504 * @cm_node: connection's node
1505 */
1506static void i40iw_add_hte_node(struct i40iw_cm_core *cm_core,
1507                               struct i40iw_cm_node *cm_node)
1508{
1509        unsigned long flags;
1510
1511        if (!cm_node || !cm_core) {
1512                i40iw_pr_err("cm_node or cm_core == NULL\n");
1513                return;
1514        }
1515
1516        spin_lock_irqsave(&cm_core->ht_lock, flags);
1517        list_add_tail(&cm_node->list, &cm_core->non_accelerated_list);
1518        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1519}
1520
1521/**
1522 * i40iw_find_port - find port that matches reference port
1523 * @hte: ptr to accelerated or non-accelerated list
1524 * @accelerated_list: flag for accelerated vs non-accelerated list
1525 */
1526static bool i40iw_find_port(struct list_head *hte, u16 port)
1527{
1528        struct i40iw_cm_node *cm_node;
1529
1530        list_for_each_entry(cm_node, hte, list) {
1531                if (cm_node->loc_port == port)
1532                        return true;
1533        }
1534        return false;
1535}
1536
1537/**
1538 * i40iw_port_in_use - determine if port is in use
1539 * @cm_core: cm's core
1540 * @port: port number
1541 */
1542bool i40iw_port_in_use(struct i40iw_cm_core *cm_core, u16 port)
1543{
1544        struct i40iw_cm_listener *listen_node;
1545        unsigned long flags;
1546
1547        spin_lock_irqsave(&cm_core->ht_lock, flags);
1548        if (i40iw_find_port(&cm_core->accelerated_list, port) ||
1549            i40iw_find_port(&cm_core->non_accelerated_list, port)) {
1550                spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1551                return true;
1552        }
1553        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1554
1555        spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1556        list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
1557                if (listen_node->loc_port == port) {
1558                        spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1559                        return true;
1560                }
1561        }
1562        spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1563
1564        return false;
1565}
1566
1567/**
1568 * i40iw_del_multiple_qhash - Remove qhash and child listens
1569 * @iwdev: iWarp device
1570 * @cm_info: CM info for parent listen node
1571 * @cm_parent_listen_node: The parent listen node
1572 */
1573static enum i40iw_status_code i40iw_del_multiple_qhash(
1574                                                       struct i40iw_device *iwdev,
1575                                                       struct i40iw_cm_info *cm_info,
1576                                                       struct i40iw_cm_listener *cm_parent_listen_node)
1577{
1578        struct i40iw_cm_listener *child_listen_node;
1579        enum i40iw_status_code ret = I40IW_ERR_CONFIG;
1580        struct list_head *pos, *tpos;
1581        unsigned long flags;
1582
1583        spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1584        list_for_each_safe(pos, tpos, &cm_parent_listen_node->child_listen_list) {
1585                child_listen_node = list_entry(pos, struct i40iw_cm_listener, child_listen_list);
1586                if (child_listen_node->ipv4)
1587                        i40iw_debug(&iwdev->sc_dev,
1588                                    I40IW_DEBUG_CM,
1589                                    "removing child listen for IP=%pI4, port=%d, vlan=%d\n",
1590                                    child_listen_node->loc_addr,
1591                                    child_listen_node->loc_port,
1592                                    child_listen_node->vlan_id);
1593                else
1594                        i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
1595                                    "removing child listen for IP=%pI6, port=%d, vlan=%d\n",
1596                                    child_listen_node->loc_addr,
1597                                    child_listen_node->loc_port,
1598                                    child_listen_node->vlan_id);
1599                list_del(pos);
1600                memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1601                       sizeof(cm_info->loc_addr));
1602                cm_info->vlan_id = child_listen_node->vlan_id;
1603                if (child_listen_node->qhash_set) {
1604                        ret = i40iw_manage_qhash(iwdev, cm_info,
1605                                                 I40IW_QHASH_TYPE_TCP_SYN,
1606                                                 I40IW_QHASH_MANAGE_TYPE_DELETE,
1607                                                 NULL, false);
1608                        child_listen_node->qhash_set = false;
1609                } else {
1610                        ret = I40IW_SUCCESS;
1611                }
1612                i40iw_debug(&iwdev->sc_dev,
1613                            I40IW_DEBUG_CM,
1614                            "freed pointer = %p\n",
1615                            child_listen_node);
1616                kfree(child_listen_node);
1617                cm_parent_listen_node->cm_core->stats_listen_nodes_destroyed++;
1618        }
1619        spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1620
1621        return ret;
1622}
1623
1624/**
1625 * i40iw_netdev_vlan_ipv6 - Gets the netdev and vlan
1626 * @addr: local IPv6 address
1627 * @vlan_id: vlan id for the given IPv6 address
1628 *
1629 * Returns the net_device of the IPv6 address and also sets the
1630 * vlan id for that address.
1631 */
1632static struct net_device *i40iw_netdev_vlan_ipv6(u32 *addr, u16 *vlan_id)
1633{
1634        struct net_device *ip_dev = NULL;
1635        struct in6_addr laddr6;
1636
1637        if (!IS_ENABLED(CONFIG_IPV6))
1638                return NULL;
1639        i40iw_copy_ip_htonl(laddr6.in6_u.u6_addr32, addr);
1640        if (vlan_id)
1641                *vlan_id = I40IW_NO_VLAN;
1642        rcu_read_lock();
1643        for_each_netdev_rcu(&init_net, ip_dev) {
1644                if (ipv6_chk_addr(&init_net, &laddr6, ip_dev, 1)) {
1645                        if (vlan_id)
1646                                *vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1647                        break;
1648                }
1649        }
1650        rcu_read_unlock();
1651        return ip_dev;
1652}
1653
1654/**
1655 * i40iw_get_vlan_ipv4 - Returns the vlan_id for IPv4 address
1656 * @addr: local IPv4 address
1657 */
1658static u16 i40iw_get_vlan_ipv4(u32 *addr)
1659{
1660        struct net_device *netdev;
1661        u16 vlan_id = I40IW_NO_VLAN;
1662
1663        netdev = ip_dev_find(&init_net, htonl(addr[0]));
1664        if (netdev) {
1665                vlan_id = rdma_vlan_dev_vlan_id(netdev);
1666                dev_put(netdev);
1667        }
1668        return vlan_id;
1669}
1670
1671/**
1672 * i40iw_add_mqh_6 - Adds multiple qhashes for IPv6
1673 * @iwdev: iWarp device
1674 * @cm_info: CM info for parent listen node
1675 * @cm_parent_listen_node: The parent listen node
1676 *
1677 * Adds a qhash and a child listen node for every IPv6 address
1678 * on the adapter and adds the associated qhash filter
1679 */
1680static enum i40iw_status_code i40iw_add_mqh_6(struct i40iw_device *iwdev,
1681                                              struct i40iw_cm_info *cm_info,
1682                                              struct i40iw_cm_listener *cm_parent_listen_node)
1683{
1684        struct net_device *ip_dev;
1685        struct inet6_dev *idev;
1686        struct inet6_ifaddr *ifp, *tmp;
1687        enum i40iw_status_code ret = 0;
1688        struct i40iw_cm_listener *child_listen_node;
1689        unsigned long flags;
1690
1691        rtnl_lock();
1692        for_each_netdev(&init_net, ip_dev) {
1693                if ((((rdma_vlan_dev_vlan_id(ip_dev) < I40IW_NO_VLAN) &&
1694                      (rdma_vlan_dev_real_dev(ip_dev) == iwdev->netdev)) ||
1695                     (ip_dev == iwdev->netdev)) && (ip_dev->flags & IFF_UP)) {
1696                        idev = __in6_dev_get(ip_dev);
1697                        if (!idev) {
1698                                i40iw_pr_err("idev == NULL\n");
1699                                break;
1700                        }
1701                        list_for_each_entry_safe(ifp, tmp, &idev->addr_list, if_list) {
1702                                i40iw_debug(&iwdev->sc_dev,
1703                                            I40IW_DEBUG_CM,
1704                                            "IP=%pI6, vlan_id=%d, MAC=%pM\n",
1705                                            &ifp->addr,
1706                                            rdma_vlan_dev_vlan_id(ip_dev),
1707                                            ip_dev->dev_addr);
1708                                child_listen_node =
1709                                        kzalloc(sizeof(*child_listen_node), GFP_ATOMIC);
1710                                i40iw_debug(&iwdev->sc_dev,
1711                                            I40IW_DEBUG_CM,
1712                                            "Allocating child listener %p\n",
1713                                            child_listen_node);
1714                                if (!child_listen_node) {
1715                                        ret = I40IW_ERR_NO_MEMORY;
1716                                        goto exit;
1717                                }
1718                                cm_info->vlan_id = rdma_vlan_dev_vlan_id(ip_dev);
1719                                cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1720
1721                                memcpy(child_listen_node, cm_parent_listen_node,
1722                                       sizeof(*child_listen_node));
1723
1724                                i40iw_copy_ip_ntohl(child_listen_node->loc_addr,
1725                                                    ifp->addr.in6_u.u6_addr32);
1726                                memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1727                                       sizeof(cm_info->loc_addr));
1728
1729                                ret = i40iw_manage_qhash(iwdev, cm_info,
1730                                                         I40IW_QHASH_TYPE_TCP_SYN,
1731                                                         I40IW_QHASH_MANAGE_TYPE_ADD,
1732                                                         NULL, true);
1733                                if (!ret) {
1734                                        child_listen_node->qhash_set = true;
1735                                        spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1736                                        list_add(&child_listen_node->child_listen_list,
1737                                                 &cm_parent_listen_node->child_listen_list);
1738                                        spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1739                                        cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1740                                } else {
1741                                        kfree(child_listen_node);
1742                                }
1743                        }
1744                }
1745        }
1746exit:
1747        rtnl_unlock();
1748        return ret;
1749}
1750
1751/**
1752 * i40iw_add_mqh_4 - Adds multiple qhashes for IPv4
1753 * @iwdev: iWarp device
1754 * @cm_info: CM info for parent listen node
1755 * @cm_parent_listen_node: The parent listen node
1756 *
1757 * Adds a qhash and a child listen node for every IPv4 address
1758 * on the adapter and adds the associated qhash filter
1759 */
1760static enum i40iw_status_code i40iw_add_mqh_4(
1761                                struct i40iw_device *iwdev,
1762                                struct i40iw_cm_info *cm_info,
1763                                struct i40iw_cm_listener *cm_parent_listen_node)
1764{
1765        struct net_device *dev;
1766        struct in_device *idev;
1767        struct i40iw_cm_listener *child_listen_node;
1768        enum i40iw_status_code ret = 0;
1769        unsigned long flags;
1770
1771        rtnl_lock();
1772        for_each_netdev(&init_net, dev) {
1773                if ((((rdma_vlan_dev_vlan_id(dev) < I40IW_NO_VLAN) &&
1774                      (rdma_vlan_dev_real_dev(dev) == iwdev->netdev)) ||
1775                    (dev == iwdev->netdev)) && (dev->flags & IFF_UP)) {
1776                        const struct in_ifaddr *ifa;
1777
1778                        idev = in_dev_get(dev);
1779
1780                        in_dev_for_each_ifa_rtnl(ifa, idev) {
1781                                i40iw_debug(&iwdev->sc_dev,
1782                                            I40IW_DEBUG_CM,
1783                                            "Allocating child CM Listener forIP=%pI4, vlan_id=%d, MAC=%pM\n",
1784                                            &ifa->ifa_address,
1785                                            rdma_vlan_dev_vlan_id(dev),
1786                                            dev->dev_addr);
1787                                child_listen_node = kzalloc(sizeof(*child_listen_node), GFP_KERNEL);
1788                                cm_parent_listen_node->cm_core->stats_listen_nodes_created++;
1789                                i40iw_debug(&iwdev->sc_dev,
1790                                            I40IW_DEBUG_CM,
1791                                            "Allocating child listener %p\n",
1792                                            child_listen_node);
1793                                if (!child_listen_node) {
1794                                        in_dev_put(idev);
1795                                        ret = I40IW_ERR_NO_MEMORY;
1796                                        goto exit;
1797                                }
1798                                cm_info->vlan_id = rdma_vlan_dev_vlan_id(dev);
1799                                cm_parent_listen_node->vlan_id = cm_info->vlan_id;
1800                                memcpy(child_listen_node,
1801                                       cm_parent_listen_node,
1802                                       sizeof(*child_listen_node));
1803
1804                                child_listen_node->loc_addr[0] = ntohl(ifa->ifa_address);
1805                                memcpy(cm_info->loc_addr, child_listen_node->loc_addr,
1806                                       sizeof(cm_info->loc_addr));
1807
1808                                ret = i40iw_manage_qhash(iwdev,
1809                                                         cm_info,
1810                                                         I40IW_QHASH_TYPE_TCP_SYN,
1811                                                         I40IW_QHASH_MANAGE_TYPE_ADD,
1812                                                         NULL,
1813                                                         true);
1814                                if (!ret) {
1815                                        child_listen_node->qhash_set = true;
1816                                        spin_lock_irqsave(&iwdev->cm_core.listen_list_lock, flags);
1817                                        list_add(&child_listen_node->child_listen_list,
1818                                                 &cm_parent_listen_node->child_listen_list);
1819                                        spin_unlock_irqrestore(&iwdev->cm_core.listen_list_lock, flags);
1820                                } else {
1821                                        kfree(child_listen_node);
1822                                        cm_parent_listen_node->cm_core->stats_listen_nodes_created--;
1823                                }
1824                        }
1825
1826                        in_dev_put(idev);
1827                }
1828        }
1829exit:
1830        rtnl_unlock();
1831        return ret;
1832}
1833
1834/**
1835 * i40iw_dec_refcnt_listen - delete listener and associated cm nodes
1836 * @cm_core: cm's core
1837 * @free_hanging_nodes: to free associated cm_nodes
1838 * @apbvt_del: flag to delete the apbvt
1839 */
1840static int i40iw_dec_refcnt_listen(struct i40iw_cm_core *cm_core,
1841                                   struct i40iw_cm_listener *listener,
1842                                   int free_hanging_nodes, bool apbvt_del)
1843{
1844        int ret = -EINVAL;
1845        int err = 0;
1846        struct list_head *list_pos;
1847        struct list_head *list_temp;
1848        struct i40iw_cm_node *cm_node;
1849        struct list_head reset_list;
1850        struct i40iw_cm_info nfo;
1851        struct i40iw_cm_node *loopback;
1852        enum i40iw_cm_node_state old_state;
1853        unsigned long flags;
1854
1855        /* free non-accelerated child nodes for this listener */
1856        INIT_LIST_HEAD(&reset_list);
1857        if (free_hanging_nodes) {
1858                spin_lock_irqsave(&cm_core->ht_lock, flags);
1859                list_for_each_safe(list_pos,
1860                                   list_temp, &cm_core->non_accelerated_list) {
1861                        cm_node = container_of(list_pos, struct i40iw_cm_node, list);
1862                        if ((cm_node->listener == listener) &&
1863                            !cm_node->accelerated) {
1864                                atomic_inc(&cm_node->ref_count);
1865                                list_add(&cm_node->reset_entry, &reset_list);
1866                        }
1867                }
1868                spin_unlock_irqrestore(&cm_core->ht_lock, flags);
1869        }
1870
1871        list_for_each_safe(list_pos, list_temp, &reset_list) {
1872                cm_node = container_of(list_pos, struct i40iw_cm_node, reset_entry);
1873                loopback = cm_node->loopbackpartner;
1874                if (cm_node->state >= I40IW_CM_STATE_FIN_WAIT1) {
1875                        i40iw_rem_ref_cm_node(cm_node);
1876                } else {
1877                        if (!loopback) {
1878                                i40iw_cleanup_retrans_entry(cm_node);
1879                                err = i40iw_send_reset(cm_node);
1880                                if (err) {
1881                                        cm_node->state = I40IW_CM_STATE_CLOSED;
1882                                        i40iw_pr_err("send reset\n");
1883                                } else {
1884                                        old_state = cm_node->state;
1885                                        cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1886                                        if (old_state != I40IW_CM_STATE_MPAREQ_RCVD)
1887                                                i40iw_rem_ref_cm_node(cm_node);
1888                                }
1889                        } else {
1890                                struct i40iw_cm_event event;
1891
1892                                event.cm_node = loopback;
1893                                memcpy(event.cm_info.rem_addr,
1894                                       loopback->rem_addr, sizeof(event.cm_info.rem_addr));
1895                                memcpy(event.cm_info.loc_addr,
1896                                       loopback->loc_addr, sizeof(event.cm_info.loc_addr));
1897                                event.cm_info.rem_port = loopback->rem_port;
1898                                event.cm_info.loc_port = loopback->loc_port;
1899                                event.cm_info.cm_id = loopback->cm_id;
1900                                event.cm_info.ipv4 = loopback->ipv4;
1901                                atomic_inc(&loopback->ref_count);
1902                                loopback->state = I40IW_CM_STATE_CLOSED;
1903                                i40iw_event_connect_error(&event);
1904                                cm_node->state = I40IW_CM_STATE_LISTENER_DESTROYED;
1905                                i40iw_rem_ref_cm_node(cm_node);
1906                        }
1907                }
1908        }
1909
1910        if (!atomic_dec_return(&listener->ref_count)) {
1911                spin_lock_irqsave(&cm_core->listen_list_lock, flags);
1912                list_del(&listener->list);
1913                spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
1914
1915                if (listener->iwdev) {
1916                        if (apbvt_del)
1917                                i40iw_manage_apbvt(listener->iwdev,
1918                                                   listener->loc_port,
1919                                                   I40IW_MANAGE_APBVT_DEL);
1920
1921                        memcpy(nfo.loc_addr, listener->loc_addr, sizeof(nfo.loc_addr));
1922                        nfo.loc_port = listener->loc_port;
1923                        nfo.ipv4 = listener->ipv4;
1924                        nfo.vlan_id = listener->vlan_id;
1925                        nfo.user_pri = listener->user_pri;
1926
1927                        if (!list_empty(&listener->child_listen_list)) {
1928                                i40iw_del_multiple_qhash(listener->iwdev, &nfo, listener);
1929                        } else {
1930                                if (listener->qhash_set)
1931                                        i40iw_manage_qhash(listener->iwdev,
1932                                                           &nfo,
1933                                                           I40IW_QHASH_TYPE_TCP_SYN,
1934                                                           I40IW_QHASH_MANAGE_TYPE_DELETE,
1935                                                           NULL,
1936                                                           false);
1937                        }
1938                }
1939
1940                cm_core->stats_listen_destroyed++;
1941                kfree(listener);
1942                cm_core->stats_listen_nodes_destroyed++;
1943                listener = NULL;
1944                ret = 0;
1945        }
1946
1947        if (listener) {
1948                if (atomic_read(&listener->pend_accepts_cnt) > 0)
1949                        i40iw_debug(cm_core->dev,
1950                                    I40IW_DEBUG_CM,
1951                                    "%s: listener (%p) pending accepts=%u\n",
1952                                    __func__,
1953                                    listener,
1954                                    atomic_read(&listener->pend_accepts_cnt));
1955        }
1956
1957        return ret;
1958}
1959
1960/**
1961 * i40iw_cm_del_listen - delete a linstener
1962 * @cm_core: cm's core
1963  * @listener: passive connection's listener
1964 * @apbvt_del: flag to delete apbvt
1965 */
1966static int i40iw_cm_del_listen(struct i40iw_cm_core *cm_core,
1967                               struct i40iw_cm_listener *listener,
1968                               bool apbvt_del)
1969{
1970        listener->listener_state = I40IW_CM_LISTENER_PASSIVE_STATE;
1971        listener->cm_id = NULL; /* going to be destroyed pretty soon */
1972        return i40iw_dec_refcnt_listen(cm_core, listener, 1, apbvt_del);
1973}
1974
1975/**
1976 * i40iw_addr_resolve_neigh - resolve neighbor address
1977 * @iwdev: iwarp device structure
1978 * @src_ip: local ip address
1979 * @dst_ip: remote ip address
1980 * @arpindex: if there is an arp entry
1981 */
1982static int i40iw_addr_resolve_neigh(struct i40iw_device *iwdev,
1983                                    u32 src_ip,
1984                                    u32 dst_ip,
1985                                    int arpindex)
1986{
1987        struct rtable *rt;
1988        struct neighbour *neigh;
1989        int rc = arpindex;
1990        struct net_device *netdev = iwdev->netdev;
1991        __be32 dst_ipaddr = htonl(dst_ip);
1992        __be32 src_ipaddr = htonl(src_ip);
1993
1994        rt = ip_route_output(&init_net, dst_ipaddr, src_ipaddr, 0, 0);
1995        if (IS_ERR(rt)) {
1996                i40iw_pr_err("ip_route_output\n");
1997                return rc;
1998        }
1999
2000        if (netif_is_bond_slave(netdev))
2001                netdev = netdev_master_upper_dev_get(netdev);
2002
2003        neigh = dst_neigh_lookup(&rt->dst, &dst_ipaddr);
2004
2005        rcu_read_lock();
2006        if (neigh) {
2007                if (neigh->nud_state & NUD_VALID) {
2008                        if (arpindex >= 0) {
2009                                if (ether_addr_equal(iwdev->arp_table[arpindex].mac_addr,
2010                                                     neigh->ha))
2011                                        /* Mac address same as arp table */
2012                                        goto resolve_neigh_exit;
2013                                i40iw_manage_arp_cache(iwdev,
2014                                                       iwdev->arp_table[arpindex].mac_addr,
2015                                                       &dst_ip,
2016                                                       true,
2017                                                       I40IW_ARP_DELETE);
2018                        }
2019
2020                        i40iw_manage_arp_cache(iwdev, neigh->ha, &dst_ip, true, I40IW_ARP_ADD);
2021                        rc = i40iw_arp_table(iwdev, &dst_ip, true, NULL, I40IW_ARP_RESOLVE);
2022                } else {
2023                        neigh_event_send(neigh, NULL);
2024                }
2025        }
2026 resolve_neigh_exit:
2027
2028        rcu_read_unlock();
2029        if (neigh)
2030                neigh_release(neigh);
2031
2032        ip_rt_put(rt);
2033        return rc;
2034}
2035
2036/**
2037 * i40iw_get_dst_ipv6
2038 */
2039static struct dst_entry *i40iw_get_dst_ipv6(struct sockaddr_in6 *src_addr,
2040                                            struct sockaddr_in6 *dst_addr)
2041{
2042        struct dst_entry *dst;
2043        struct flowi6 fl6;
2044
2045        memset(&fl6, 0, sizeof(fl6));
2046        fl6.daddr = dst_addr->sin6_addr;
2047        fl6.saddr = src_addr->sin6_addr;
2048        if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
2049                fl6.flowi6_oif = dst_addr->sin6_scope_id;
2050
2051        dst = ip6_route_output(&init_net, NULL, &fl6);
2052        return dst;
2053}
2054
2055/**
2056 * i40iw_addr_resolve_neigh_ipv6 - resolve neighbor ipv6 address
2057 * @iwdev: iwarp device structure
2058 * @dst_ip: remote ip address
2059 * @arpindex: if there is an arp entry
2060 */
2061static int i40iw_addr_resolve_neigh_ipv6(struct i40iw_device *iwdev,
2062                                         u32 *src,
2063                                         u32 *dest,
2064                                         int arpindex)
2065{
2066        struct neighbour *neigh;
2067        int rc = arpindex;
2068        struct net_device *netdev = iwdev->netdev;
2069        struct dst_entry *dst;
2070        struct sockaddr_in6 dst_addr;
2071        struct sockaddr_in6 src_addr;
2072
2073        memset(&dst_addr, 0, sizeof(dst_addr));
2074        dst_addr.sin6_family = AF_INET6;
2075        i40iw_copy_ip_htonl(dst_addr.sin6_addr.in6_u.u6_addr32, dest);
2076        memset(&src_addr, 0, sizeof(src_addr));
2077        src_addr.sin6_family = AF_INET6;
2078        i40iw_copy_ip_htonl(src_addr.sin6_addr.in6_u.u6_addr32, src);
2079        dst = i40iw_get_dst_ipv6(&src_addr, &dst_addr);
2080        if (!dst || dst->error) {
2081                if (dst) {
2082                        dst_release(dst);
2083                        i40iw_pr_err("ip6_route_output returned dst->error = %d\n",
2084                                     dst->error);
2085                }
2086                return rc;
2087        }
2088
2089        if (netif_is_bond_slave(netdev))
2090                netdev = netdev_master_upper_dev_get(netdev);
2091
2092        neigh = dst_neigh_lookup(dst, dst_addr.sin6_addr.in6_u.u6_addr32);
2093
2094        rcu_read_lock();
2095        if (neigh) {
2096                i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "dst_neigh_lookup MAC=%pM\n", neigh->ha);
2097                if (neigh->nud_state & NUD_VALID) {
2098                        if (arpindex >= 0) {
2099                                if (ether_addr_equal
2100                                    (iwdev->arp_table[arpindex].mac_addr,
2101                                     neigh->ha)) {
2102                                        /* Mac address same as in arp table */
2103                                        goto resolve_neigh_exit6;
2104                                }
2105                                i40iw_manage_arp_cache(iwdev,
2106                                                       iwdev->arp_table[arpindex].mac_addr,
2107                                                       dest,
2108                                                       false,
2109                                                       I40IW_ARP_DELETE);
2110                        }
2111                        i40iw_manage_arp_cache(iwdev,
2112                                               neigh->ha,
2113                                               dest,
2114                                               false,
2115                                               I40IW_ARP_ADD);
2116                        rc = i40iw_arp_table(iwdev,
2117                                             dest,
2118                                             false,
2119                                             NULL,
2120                                             I40IW_ARP_RESOLVE);
2121                } else {
2122                        neigh_event_send(neigh, NULL);
2123                }
2124        }
2125
2126 resolve_neigh_exit6:
2127        rcu_read_unlock();
2128        if (neigh)
2129                neigh_release(neigh);
2130        dst_release(dst);
2131        return rc;
2132}
2133
2134/**
2135 * i40iw_ipv4_is_loopback - check if loopback
2136 * @loc_addr: local addr to compare
2137 * @rem_addr: remote address
2138 */
2139static bool i40iw_ipv4_is_loopback(u32 loc_addr, u32 rem_addr)
2140{
2141        return ipv4_is_loopback(htonl(rem_addr)) || (loc_addr == rem_addr);
2142}
2143
2144/**
2145 * i40iw_ipv6_is_loopback - check if loopback
2146 * @loc_addr: local addr to compare
2147 * @rem_addr: remote address
2148 */
2149static bool i40iw_ipv6_is_loopback(u32 *loc_addr, u32 *rem_addr)
2150{
2151        struct in6_addr raddr6;
2152
2153        i40iw_copy_ip_htonl(raddr6.in6_u.u6_addr32, rem_addr);
2154        return !memcmp(loc_addr, rem_addr, 16) || ipv6_addr_loopback(&raddr6);
2155}
2156
2157/**
2158 * i40iw_make_cm_node - create a new instance of a cm node
2159 * @cm_core: cm's core
2160 * @iwdev: iwarp device structure
2161 * @cm_info: quad info for connection
2162 * @listener: passive connection's listener
2163 */
2164static struct i40iw_cm_node *i40iw_make_cm_node(
2165                                   struct i40iw_cm_core *cm_core,
2166                                   struct i40iw_device *iwdev,
2167                                   struct i40iw_cm_info *cm_info,
2168                                   struct i40iw_cm_listener *listener)
2169{
2170        struct i40iw_cm_node *cm_node;
2171        int oldarpindex;
2172        int arpindex;
2173        struct net_device *netdev = iwdev->netdev;
2174
2175        /* create an hte and cm_node for this instance */
2176        cm_node = kzalloc(sizeof(*cm_node), GFP_ATOMIC);
2177        if (!cm_node)
2178                return NULL;
2179
2180        /* set our node specific transport info */
2181        cm_node->ipv4 = cm_info->ipv4;
2182        cm_node->vlan_id = cm_info->vlan_id;
2183        if ((cm_node->vlan_id == I40IW_NO_VLAN) && iwdev->dcb)
2184                cm_node->vlan_id = 0;
2185        cm_node->tos = cm_info->tos;
2186        cm_node->user_pri = cm_info->user_pri;
2187        if (listener) {
2188                if (listener->tos != cm_info->tos)
2189                        i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB,
2190                                    "application TOS[%d] and remote client TOS[%d] mismatch\n",
2191                                     listener->tos, cm_info->tos);
2192                cm_node->tos = max(listener->tos, cm_info->tos);
2193                cm_node->user_pri = rt_tos2priority(cm_node->tos);
2194                i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "listener: TOS:[%d] UP:[%d]\n",
2195                            cm_node->tos, cm_node->user_pri);
2196        }
2197        memcpy(cm_node->loc_addr, cm_info->loc_addr, sizeof(cm_node->loc_addr));
2198        memcpy(cm_node->rem_addr, cm_info->rem_addr, sizeof(cm_node->rem_addr));
2199        cm_node->loc_port = cm_info->loc_port;
2200        cm_node->rem_port = cm_info->rem_port;
2201
2202        cm_node->mpa_frame_rev = iwdev->mpa_version;
2203        cm_node->send_rdma0_op = SEND_RDMA_READ_ZERO;
2204        cm_node->ird_size = I40IW_MAX_IRD_SIZE;
2205        cm_node->ord_size = I40IW_MAX_ORD_SIZE;
2206
2207        cm_node->listener = listener;
2208        cm_node->cm_id = cm_info->cm_id;
2209        ether_addr_copy(cm_node->loc_mac, netdev->dev_addr);
2210        spin_lock_init(&cm_node->retrans_list_lock);
2211        cm_node->ack_rcvd = false;
2212
2213        atomic_set(&cm_node->ref_count, 1);
2214        /* associate our parent CM core */
2215        cm_node->cm_core = cm_core;
2216        cm_node->tcp_cntxt.loc_id = I40IW_CM_DEF_LOCAL_ID;
2217        cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2218        cm_node->tcp_cntxt.rcv_wnd =
2219                        I40IW_CM_DEFAULT_RCV_WND_SCALED >> I40IW_CM_DEFAULT_RCV_WND_SCALE;
2220        if (cm_node->ipv4) {
2221                cm_node->tcp_cntxt.loc_seq_num = secure_tcp_seq(htonl(cm_node->loc_addr[0]),
2222                                                        htonl(cm_node->rem_addr[0]),
2223                                                        htons(cm_node->loc_port),
2224                                                        htons(cm_node->rem_port));
2225                cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV4;
2226        } else if (IS_ENABLED(CONFIG_IPV6)) {
2227                __be32 loc[4] = {
2228                        htonl(cm_node->loc_addr[0]), htonl(cm_node->loc_addr[1]),
2229                        htonl(cm_node->loc_addr[2]), htonl(cm_node->loc_addr[3])
2230                };
2231                __be32 rem[4] = {
2232                        htonl(cm_node->rem_addr[0]), htonl(cm_node->rem_addr[1]),
2233                        htonl(cm_node->rem_addr[2]), htonl(cm_node->rem_addr[3])
2234                };
2235                cm_node->tcp_cntxt.loc_seq_num = secure_tcpv6_seq(loc, rem,
2236                                                        htons(cm_node->loc_port),
2237                                                        htons(cm_node->rem_port));
2238                cm_node->tcp_cntxt.mss = iwdev->vsi.mtu - I40IW_MTU_TO_MSS_IPV6;
2239        }
2240
2241        cm_node->iwdev = iwdev;
2242        cm_node->dev = &iwdev->sc_dev;
2243
2244        if ((cm_node->ipv4 &&
2245             i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
2246             (!cm_node->ipv4 && i40iw_ipv6_is_loopback(cm_node->loc_addr,
2247                                                       cm_node->rem_addr))) {
2248                arpindex = i40iw_arp_table(iwdev,
2249                                           cm_node->rem_addr,
2250                                           false,
2251                                           NULL,
2252                                           I40IW_ARP_RESOLVE);
2253        } else {
2254                oldarpindex = i40iw_arp_table(iwdev,
2255                                              cm_node->rem_addr,
2256                                              false,
2257                                              NULL,
2258                                              I40IW_ARP_RESOLVE);
2259                if (cm_node->ipv4)
2260                        arpindex = i40iw_addr_resolve_neigh(iwdev,
2261                                                            cm_info->loc_addr[0],
2262                                                            cm_info->rem_addr[0],
2263                                                            oldarpindex);
2264                else if (IS_ENABLED(CONFIG_IPV6))
2265                        arpindex = i40iw_addr_resolve_neigh_ipv6(iwdev,
2266                                                                 cm_info->loc_addr,
2267                                                                 cm_info->rem_addr,
2268                                                                 oldarpindex);
2269                else
2270                        arpindex = -EINVAL;
2271        }
2272        if (arpindex < 0) {
2273                i40iw_pr_err("cm_node arpindex\n");
2274                kfree(cm_node);
2275                return NULL;
2276        }
2277        ether_addr_copy(cm_node->rem_mac, iwdev->arp_table[arpindex].mac_addr);
2278        i40iw_add_hte_node(cm_core, cm_node);
2279        cm_core->stats_nodes_created++;
2280        return cm_node;
2281}
2282
2283/**
2284 * i40iw_rem_ref_cm_node - destroy an instance of a cm node
2285 * @cm_node: connection's node
2286 */
2287static void i40iw_rem_ref_cm_node(struct i40iw_cm_node *cm_node)
2288{
2289        struct i40iw_cm_core *cm_core = cm_node->cm_core;
2290        struct i40iw_qp *iwqp;
2291        struct i40iw_cm_info nfo;
2292        unsigned long flags;
2293
2294        spin_lock_irqsave(&cm_node->cm_core->ht_lock, flags);
2295        if (atomic_dec_return(&cm_node->ref_count)) {
2296                spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2297                return;
2298        }
2299        list_del(&cm_node->list);
2300        spin_unlock_irqrestore(&cm_node->cm_core->ht_lock, flags);
2301
2302        /* if the node is destroyed before connection was accelerated */
2303        if (!cm_node->accelerated && cm_node->accept_pend) {
2304                pr_err("node destroyed before established\n");
2305                atomic_dec(&cm_node->listener->pend_accepts_cnt);
2306        }
2307        if (cm_node->close_entry)
2308                i40iw_handle_close_entry(cm_node, 0);
2309        if (cm_node->listener) {
2310                i40iw_dec_refcnt_listen(cm_core, cm_node->listener, 0, true);
2311        } else {
2312                if (cm_node->apbvt_set) {
2313                        i40iw_manage_apbvt(cm_node->iwdev,
2314                                           cm_node->loc_port,
2315                                           I40IW_MANAGE_APBVT_DEL);
2316                        cm_node->apbvt_set = 0;
2317                }
2318                i40iw_get_addr_info(cm_node, &nfo);
2319                if (cm_node->qhash_set) {
2320                        i40iw_manage_qhash(cm_node->iwdev,
2321                                           &nfo,
2322                                           I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2323                                           I40IW_QHASH_MANAGE_TYPE_DELETE,
2324                                           NULL,
2325                                           false);
2326                        cm_node->qhash_set = 0;
2327                }
2328        }
2329
2330        iwqp = cm_node->iwqp;
2331        if (iwqp) {
2332                iwqp->cm_node = NULL;
2333                i40iw_rem_ref(&iwqp->ibqp);
2334                cm_node->iwqp = NULL;
2335        } else if (cm_node->qhash_set) {
2336                i40iw_get_addr_info(cm_node, &nfo);
2337                i40iw_manage_qhash(cm_node->iwdev,
2338                                   &nfo,
2339                                   I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2340                                   I40IW_QHASH_MANAGE_TYPE_DELETE,
2341                                   NULL,
2342                                   false);
2343                cm_node->qhash_set = 0;
2344        }
2345
2346        cm_node->cm_core->stats_nodes_destroyed++;
2347        kfree(cm_node);
2348}
2349
2350/**
2351 * i40iw_handle_fin_pkt - FIN packet received
2352 * @cm_node: connection's node
2353 */
2354static void i40iw_handle_fin_pkt(struct i40iw_cm_node *cm_node)
2355{
2356        u32 ret;
2357
2358        switch (cm_node->state) {
2359        case I40IW_CM_STATE_SYN_RCVD:
2360        case I40IW_CM_STATE_SYN_SENT:
2361        case I40IW_CM_STATE_ESTABLISHED:
2362        case I40IW_CM_STATE_MPAREJ_RCVD:
2363                cm_node->tcp_cntxt.rcv_nxt++;
2364                i40iw_cleanup_retrans_entry(cm_node);
2365                cm_node->state = I40IW_CM_STATE_LAST_ACK;
2366                i40iw_send_fin(cm_node);
2367                break;
2368        case I40IW_CM_STATE_MPAREQ_SENT:
2369                i40iw_create_event(cm_node, I40IW_CM_EVENT_ABORTED);
2370                cm_node->tcp_cntxt.rcv_nxt++;
2371                i40iw_cleanup_retrans_entry(cm_node);
2372                cm_node->state = I40IW_CM_STATE_CLOSED;
2373                atomic_inc(&cm_node->ref_count);
2374                i40iw_send_reset(cm_node);
2375                break;
2376        case I40IW_CM_STATE_FIN_WAIT1:
2377                cm_node->tcp_cntxt.rcv_nxt++;
2378                i40iw_cleanup_retrans_entry(cm_node);
2379                cm_node->state = I40IW_CM_STATE_CLOSING;
2380                i40iw_send_ack(cm_node);
2381                /*
2382                 * Wait for ACK as this is simultaneous close.
2383                 * After we receive ACK, do not send anything.
2384                 * Just rm the node.
2385                 */
2386                break;
2387        case I40IW_CM_STATE_FIN_WAIT2:
2388                cm_node->tcp_cntxt.rcv_nxt++;
2389                i40iw_cleanup_retrans_entry(cm_node);
2390                cm_node->state = I40IW_CM_STATE_TIME_WAIT;
2391                i40iw_send_ack(cm_node);
2392                ret =
2393                    i40iw_schedule_cm_timer(cm_node, NULL, I40IW_TIMER_TYPE_CLOSE, 1, 0);
2394                if (ret)
2395                        i40iw_pr_err("node %p state = %d\n", cm_node, cm_node->state);
2396                break;
2397        case I40IW_CM_STATE_TIME_WAIT:
2398                cm_node->tcp_cntxt.rcv_nxt++;
2399                i40iw_cleanup_retrans_entry(cm_node);
2400                cm_node->state = I40IW_CM_STATE_CLOSED;
2401                i40iw_rem_ref_cm_node(cm_node);
2402                break;
2403        case I40IW_CM_STATE_OFFLOADED:
2404        default:
2405                i40iw_pr_err("bad state node %p state = %d\n", cm_node, cm_node->state);
2406                break;
2407        }
2408}
2409
2410/**
2411 * i40iw_handle_rst_pkt - process received RST packet
2412 * @cm_node: connection's node
2413 * @rbuf: receive buffer
2414 */
2415static void i40iw_handle_rst_pkt(struct i40iw_cm_node *cm_node,
2416                                 struct i40iw_puda_buf *rbuf)
2417{
2418        i40iw_cleanup_retrans_entry(cm_node);
2419        switch (cm_node->state) {
2420        case I40IW_CM_STATE_SYN_SENT:
2421        case I40IW_CM_STATE_MPAREQ_SENT:
2422                switch (cm_node->mpa_frame_rev) {
2423                case IETF_MPA_V2:
2424                        cm_node->mpa_frame_rev = IETF_MPA_V1;
2425                        /* send a syn and goto syn sent state */
2426                        cm_node->state = I40IW_CM_STATE_SYN_SENT;
2427                        if (i40iw_send_syn(cm_node, 0))
2428                                i40iw_active_open_err(cm_node, false);
2429                        break;
2430                case IETF_MPA_V1:
2431                default:
2432                        i40iw_active_open_err(cm_node, false);
2433                        break;
2434                }
2435                break;
2436        case I40IW_CM_STATE_MPAREQ_RCVD:
2437                atomic_add_return(1, &cm_node->passive_state);
2438                break;
2439        case I40IW_CM_STATE_ESTABLISHED:
2440        case I40IW_CM_STATE_SYN_RCVD:
2441        case I40IW_CM_STATE_LISTENING:
2442                i40iw_pr_err("Bad state state = %d\n", cm_node->state);
2443                i40iw_passive_open_err(cm_node, false);
2444                break;
2445        case I40IW_CM_STATE_OFFLOADED:
2446                i40iw_active_open_err(cm_node, false);
2447                break;
2448        case I40IW_CM_STATE_CLOSED:
2449                break;
2450        case I40IW_CM_STATE_FIN_WAIT2:
2451        case I40IW_CM_STATE_FIN_WAIT1:
2452        case I40IW_CM_STATE_LAST_ACK:
2453                cm_node->cm_id->rem_ref(cm_node->cm_id);
2454                /* fall through */
2455        case I40IW_CM_STATE_TIME_WAIT:
2456                cm_node->state = I40IW_CM_STATE_CLOSED;
2457                i40iw_rem_ref_cm_node(cm_node);
2458                break;
2459        default:
2460                break;
2461        }
2462}
2463
2464/**
2465 * i40iw_handle_rcv_mpa - Process a recv'd mpa buffer
2466 * @cm_node: connection's node
2467 * @rbuf: receive buffer
2468 */
2469static void i40iw_handle_rcv_mpa(struct i40iw_cm_node *cm_node,
2470                                 struct i40iw_puda_buf *rbuf)
2471{
2472        int ret;
2473        int datasize = rbuf->datalen;
2474        u8 *dataloc = rbuf->data;
2475
2476        enum i40iw_cm_event_type type = I40IW_CM_EVENT_UNKNOWN;
2477        u32 res_type;
2478
2479        ret = i40iw_parse_mpa(cm_node, dataloc, &res_type, datasize);
2480        if (ret) {
2481                if (cm_node->state == I40IW_CM_STATE_MPAREQ_SENT)
2482                        i40iw_active_open_err(cm_node, true);
2483                else
2484                        i40iw_passive_open_err(cm_node, true);
2485                return;
2486        }
2487
2488        switch (cm_node->state) {
2489        case I40IW_CM_STATE_ESTABLISHED:
2490                if (res_type == I40IW_MPA_REQUEST_REJECT)
2491                        i40iw_pr_err("state for reject\n");
2492                cm_node->state = I40IW_CM_STATE_MPAREQ_RCVD;
2493                type = I40IW_CM_EVENT_MPA_REQ;
2494                i40iw_send_ack(cm_node);        /* ACK received MPA request */
2495                atomic_set(&cm_node->passive_state,
2496                           I40IW_PASSIVE_STATE_INDICATED);
2497                break;
2498        case I40IW_CM_STATE_MPAREQ_SENT:
2499                i40iw_cleanup_retrans_entry(cm_node);
2500                if (res_type == I40IW_MPA_REQUEST_REJECT) {
2501                        type = I40IW_CM_EVENT_MPA_REJECT;
2502                        cm_node->state = I40IW_CM_STATE_MPAREJ_RCVD;
2503                } else {
2504                        type = I40IW_CM_EVENT_CONNECTED;
2505                        cm_node->state = I40IW_CM_STATE_OFFLOADED;
2506                }
2507                i40iw_send_ack(cm_node);
2508                break;
2509        default:
2510                pr_err("%s wrong cm_node state =%d\n", __func__, cm_node->state);
2511                break;
2512        }
2513        i40iw_create_event(cm_node, type);
2514}
2515
2516/**
2517 * i40iw_indicate_pkt_err - Send up err event to cm
2518 * @cm_node: connection's node
2519 */
2520static void i40iw_indicate_pkt_err(struct i40iw_cm_node *cm_node)
2521{
2522        switch (cm_node->state) {
2523        case I40IW_CM_STATE_SYN_SENT:
2524        case I40IW_CM_STATE_MPAREQ_SENT:
2525                i40iw_active_open_err(cm_node, true);
2526                break;
2527        case I40IW_CM_STATE_ESTABLISHED:
2528        case I40IW_CM_STATE_SYN_RCVD:
2529                i40iw_passive_open_err(cm_node, true);
2530                break;
2531        case I40IW_CM_STATE_OFFLOADED:
2532        default:
2533                break;
2534        }
2535}
2536
2537/**
2538 * i40iw_check_syn - Check for error on received syn ack
2539 * @cm_node: connection's node
2540 * @tcph: pointer tcp header
2541 */
2542static int i40iw_check_syn(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2543{
2544        int err = 0;
2545
2546        if (ntohl(tcph->ack_seq) != cm_node->tcp_cntxt.loc_seq_num) {
2547                err = 1;
2548                i40iw_active_open_err(cm_node, true);
2549        }
2550        return err;
2551}
2552
2553/**
2554 * i40iw_check_seq - check seq numbers if OK
2555 * @cm_node: connection's node
2556 * @tcph: pointer tcp header
2557 */
2558static int i40iw_check_seq(struct i40iw_cm_node *cm_node, struct tcphdr *tcph)
2559{
2560        int err = 0;
2561        u32 seq;
2562        u32 ack_seq;
2563        u32 loc_seq_num = cm_node->tcp_cntxt.loc_seq_num;
2564        u32 rcv_nxt = cm_node->tcp_cntxt.rcv_nxt;
2565        u32 rcv_wnd;
2566
2567        seq = ntohl(tcph->seq);
2568        ack_seq = ntohl(tcph->ack_seq);
2569        rcv_wnd = cm_node->tcp_cntxt.rcv_wnd;
2570        if (ack_seq != loc_seq_num)
2571                err = -1;
2572        else if (!between(seq, rcv_nxt, (rcv_nxt + rcv_wnd)))
2573                err = -1;
2574        if (err) {
2575                i40iw_pr_err("seq number\n");
2576                i40iw_indicate_pkt_err(cm_node);
2577        }
2578        return err;
2579}
2580
2581/**
2582 * i40iw_handle_syn_pkt - is for Passive node
2583 * @cm_node: connection's node
2584 * @rbuf: receive buffer
2585 */
2586static void i40iw_handle_syn_pkt(struct i40iw_cm_node *cm_node,
2587                                 struct i40iw_puda_buf *rbuf)
2588{
2589        struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2590        int ret;
2591        u32 inc_sequence;
2592        int optionsize;
2593        struct i40iw_cm_info nfo;
2594
2595        optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2596        inc_sequence = ntohl(tcph->seq);
2597
2598        switch (cm_node->state) {
2599        case I40IW_CM_STATE_SYN_SENT:
2600        case I40IW_CM_STATE_MPAREQ_SENT:
2601                /* Rcvd syn on active open connection */
2602                i40iw_active_open_err(cm_node, 1);
2603                break;
2604        case I40IW_CM_STATE_LISTENING:
2605                /* Passive OPEN */
2606                if (atomic_read(&cm_node->listener->pend_accepts_cnt) >
2607                    cm_node->listener->backlog) {
2608                        cm_node->cm_core->stats_backlog_drops++;
2609                        i40iw_passive_open_err(cm_node, false);
2610                        break;
2611                }
2612                ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2613                if (ret) {
2614                        i40iw_passive_open_err(cm_node, false);
2615                        /* drop pkt */
2616                        break;
2617                }
2618                cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2619                cm_node->accept_pend = 1;
2620                atomic_inc(&cm_node->listener->pend_accepts_cnt);
2621
2622                cm_node->state = I40IW_CM_STATE_SYN_RCVD;
2623                i40iw_get_addr_info(cm_node, &nfo);
2624                ret = i40iw_manage_qhash(cm_node->iwdev,
2625                                         &nfo,
2626                                         I40IW_QHASH_TYPE_TCP_ESTABLISHED,
2627                                         I40IW_QHASH_MANAGE_TYPE_ADD,
2628                                         (void *)cm_node,
2629                                         false);
2630                cm_node->qhash_set = true;
2631                break;
2632        case I40IW_CM_STATE_CLOSED:
2633                i40iw_cleanup_retrans_entry(cm_node);
2634                atomic_inc(&cm_node->ref_count);
2635                i40iw_send_reset(cm_node);
2636                break;
2637        case I40IW_CM_STATE_OFFLOADED:
2638        case I40IW_CM_STATE_ESTABLISHED:
2639        case I40IW_CM_STATE_FIN_WAIT1:
2640        case I40IW_CM_STATE_FIN_WAIT2:
2641        case I40IW_CM_STATE_MPAREQ_RCVD:
2642        case I40IW_CM_STATE_LAST_ACK:
2643        case I40IW_CM_STATE_CLOSING:
2644        case I40IW_CM_STATE_UNKNOWN:
2645        default:
2646                break;
2647        }
2648}
2649
2650/**
2651 * i40iw_handle_synack_pkt - Process SYN+ACK packet (active side)
2652 * @cm_node: connection's node
2653 * @rbuf: receive buffer
2654 */
2655static void i40iw_handle_synack_pkt(struct i40iw_cm_node *cm_node,
2656                                    struct i40iw_puda_buf *rbuf)
2657{
2658        struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2659        int ret;
2660        u32 inc_sequence;
2661        int optionsize;
2662
2663        optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2664        inc_sequence = ntohl(tcph->seq);
2665        switch (cm_node->state) {
2666        case I40IW_CM_STATE_SYN_SENT:
2667                i40iw_cleanup_retrans_entry(cm_node);
2668                /* active open */
2669                if (i40iw_check_syn(cm_node, tcph)) {
2670                        i40iw_pr_err("check syn fail\n");
2671                        return;
2672                }
2673                cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2674                /* setup options */
2675                ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 0);
2676                if (ret) {
2677                        i40iw_debug(cm_node->dev,
2678                                    I40IW_DEBUG_CM,
2679                                    "cm_node=%p tcp_options failed\n",
2680                                    cm_node);
2681                        break;
2682                }
2683                i40iw_cleanup_retrans_entry(cm_node);
2684                cm_node->tcp_cntxt.rcv_nxt = inc_sequence + 1;
2685                i40iw_send_ack(cm_node);        /* ACK  for the syn_ack */
2686                ret = i40iw_send_mpa_request(cm_node);
2687                if (ret) {
2688                        i40iw_debug(cm_node->dev,
2689                                    I40IW_DEBUG_CM,
2690                                    "cm_node=%p i40iw_send_mpa_request failed\n",
2691                                    cm_node);
2692                        break;
2693                }
2694                cm_node->state = I40IW_CM_STATE_MPAREQ_SENT;
2695                break;
2696        case I40IW_CM_STATE_MPAREQ_RCVD:
2697                i40iw_passive_open_err(cm_node, true);
2698                break;
2699        case I40IW_CM_STATE_LISTENING:
2700                cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2701                i40iw_cleanup_retrans_entry(cm_node);
2702                cm_node->state = I40IW_CM_STATE_CLOSED;
2703                i40iw_send_reset(cm_node);
2704                break;
2705        case I40IW_CM_STATE_CLOSED:
2706                cm_node->tcp_cntxt.loc_seq_num = ntohl(tcph->ack_seq);
2707                i40iw_cleanup_retrans_entry(cm_node);
2708                atomic_inc(&cm_node->ref_count);
2709                i40iw_send_reset(cm_node);
2710                break;
2711        case I40IW_CM_STATE_ESTABLISHED:
2712        case I40IW_CM_STATE_FIN_WAIT1:
2713        case I40IW_CM_STATE_FIN_WAIT2:
2714        case I40IW_CM_STATE_LAST_ACK:
2715        case I40IW_CM_STATE_OFFLOADED:
2716        case I40IW_CM_STATE_CLOSING:
2717        case I40IW_CM_STATE_UNKNOWN:
2718        case I40IW_CM_STATE_MPAREQ_SENT:
2719        default:
2720                break;
2721        }
2722}
2723
2724/**
2725 * i40iw_handle_ack_pkt - process packet with ACK
2726 * @cm_node: connection's node
2727 * @rbuf: receive buffer
2728 */
2729static int i40iw_handle_ack_pkt(struct i40iw_cm_node *cm_node,
2730                                struct i40iw_puda_buf *rbuf)
2731{
2732        struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2733        u32 inc_sequence;
2734        int ret = 0;
2735        int optionsize;
2736        u32 datasize = rbuf->datalen;
2737
2738        optionsize = (tcph->doff << 2) - sizeof(struct tcphdr);
2739
2740        if (i40iw_check_seq(cm_node, tcph))
2741                return -EINVAL;
2742
2743        inc_sequence = ntohl(tcph->seq);
2744        switch (cm_node->state) {
2745        case I40IW_CM_STATE_SYN_RCVD:
2746                i40iw_cleanup_retrans_entry(cm_node);
2747                ret = i40iw_handle_tcp_options(cm_node, tcph, optionsize, 1);
2748                if (ret)
2749                        break;
2750                cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2751                cm_node->state = I40IW_CM_STATE_ESTABLISHED;
2752                if (datasize) {
2753                        cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2754                        i40iw_handle_rcv_mpa(cm_node, rbuf);
2755                }
2756                break;
2757        case I40IW_CM_STATE_ESTABLISHED:
2758                i40iw_cleanup_retrans_entry(cm_node);
2759                if (datasize) {
2760                        cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2761                        i40iw_handle_rcv_mpa(cm_node, rbuf);
2762                }
2763                break;
2764        case I40IW_CM_STATE_MPAREQ_SENT:
2765                cm_node->tcp_cntxt.rem_ack_num = ntohl(tcph->ack_seq);
2766                if (datasize) {
2767                        cm_node->tcp_cntxt.rcv_nxt = inc_sequence + datasize;
2768                        cm_node->ack_rcvd = false;
2769                        i40iw_handle_rcv_mpa(cm_node, rbuf);
2770                } else {
2771                        cm_node->ack_rcvd = true;
2772                }
2773                break;
2774        case I40IW_CM_STATE_LISTENING:
2775                i40iw_cleanup_retrans_entry(cm_node);
2776                cm_node->state = I40IW_CM_STATE_CLOSED;
2777                i40iw_send_reset(cm_node);
2778                break;
2779        case I40IW_CM_STATE_CLOSED:
2780                i40iw_cleanup_retrans_entry(cm_node);
2781                atomic_inc(&cm_node->ref_count);
2782                i40iw_send_reset(cm_node);
2783                break;
2784        case I40IW_CM_STATE_LAST_ACK:
2785        case I40IW_CM_STATE_CLOSING:
2786                i40iw_cleanup_retrans_entry(cm_node);
2787                cm_node->state = I40IW_CM_STATE_CLOSED;
2788                if (!cm_node->accept_pend)
2789                        cm_node->cm_id->rem_ref(cm_node->cm_id);
2790                i40iw_rem_ref_cm_node(cm_node);
2791                break;
2792        case I40IW_CM_STATE_FIN_WAIT1:
2793                i40iw_cleanup_retrans_entry(cm_node);
2794                cm_node->state = I40IW_CM_STATE_FIN_WAIT2;
2795                break;
2796        case I40IW_CM_STATE_SYN_SENT:
2797        case I40IW_CM_STATE_FIN_WAIT2:
2798        case I40IW_CM_STATE_OFFLOADED:
2799        case I40IW_CM_STATE_MPAREQ_RCVD:
2800        case I40IW_CM_STATE_UNKNOWN:
2801        default:
2802                i40iw_cleanup_retrans_entry(cm_node);
2803                break;
2804        }
2805        return ret;
2806}
2807
2808/**
2809 * i40iw_process_packet - process cm packet
2810 * @cm_node: connection's node
2811 * @rbuf: receive buffer
2812 */
2813static void i40iw_process_packet(struct i40iw_cm_node *cm_node,
2814                                 struct i40iw_puda_buf *rbuf)
2815{
2816        enum i40iw_tcpip_pkt_type pkt_type = I40IW_PKT_TYPE_UNKNOWN;
2817        struct tcphdr *tcph = (struct tcphdr *)rbuf->tcph;
2818        u32 fin_set = 0;
2819        int ret;
2820
2821        if (tcph->rst) {
2822                pkt_type = I40IW_PKT_TYPE_RST;
2823        } else if (tcph->syn) {
2824                pkt_type = I40IW_PKT_TYPE_SYN;
2825                if (tcph->ack)
2826                        pkt_type = I40IW_PKT_TYPE_SYNACK;
2827        } else if (tcph->ack) {
2828                pkt_type = I40IW_PKT_TYPE_ACK;
2829        }
2830        if (tcph->fin)
2831                fin_set = 1;
2832
2833        switch (pkt_type) {
2834        case I40IW_PKT_TYPE_SYN:
2835                i40iw_handle_syn_pkt(cm_node, rbuf);
2836                break;
2837        case I40IW_PKT_TYPE_SYNACK:
2838                i40iw_handle_synack_pkt(cm_node, rbuf);
2839                break;
2840        case I40IW_PKT_TYPE_ACK:
2841                ret = i40iw_handle_ack_pkt(cm_node, rbuf);
2842                if (fin_set && !ret)
2843                        i40iw_handle_fin_pkt(cm_node);
2844                break;
2845        case I40IW_PKT_TYPE_RST:
2846                i40iw_handle_rst_pkt(cm_node, rbuf);
2847                break;
2848        default:
2849                if (fin_set &&
2850                    (!i40iw_check_seq(cm_node, (struct tcphdr *)rbuf->tcph)))
2851                        i40iw_handle_fin_pkt(cm_node);
2852                break;
2853        }
2854}
2855
2856/**
2857 * i40iw_make_listen_node - create a listen node with params
2858 * @cm_core: cm's core
2859 * @iwdev: iwarp device structure
2860 * @cm_info: quad info for connection
2861 */
2862static struct i40iw_cm_listener *i40iw_make_listen_node(
2863                                        struct i40iw_cm_core *cm_core,
2864                                        struct i40iw_device *iwdev,
2865                                        struct i40iw_cm_info *cm_info)
2866{
2867        struct i40iw_cm_listener *listener;
2868        unsigned long flags;
2869
2870        /* cannot have multiple matching listeners */
2871        listener = i40iw_find_listener(cm_core, cm_info->loc_addr,
2872                                       cm_info->loc_port,
2873                                       cm_info->vlan_id,
2874                                       I40IW_CM_LISTENER_EITHER_STATE);
2875        if (listener &&
2876            (listener->listener_state == I40IW_CM_LISTENER_ACTIVE_STATE)) {
2877                atomic_dec(&listener->ref_count);
2878                i40iw_debug(cm_core->dev,
2879                            I40IW_DEBUG_CM,
2880                            "Not creating listener since it already exists\n");
2881                return NULL;
2882        }
2883
2884        if (!listener) {
2885                /* create a CM listen node (1/2 node to compare incoming traffic to) */
2886                listener = kzalloc(sizeof(*listener), GFP_KERNEL);
2887                if (!listener)
2888                        return NULL;
2889                cm_core->stats_listen_nodes_created++;
2890                memcpy(listener->loc_addr, cm_info->loc_addr, sizeof(listener->loc_addr));
2891                listener->loc_port = cm_info->loc_port;
2892
2893                INIT_LIST_HEAD(&listener->child_listen_list);
2894
2895                atomic_set(&listener->ref_count, 1);
2896        } else {
2897                listener->reused_node = 1;
2898        }
2899
2900        listener->cm_id = cm_info->cm_id;
2901        listener->ipv4 = cm_info->ipv4;
2902        listener->vlan_id = cm_info->vlan_id;
2903        atomic_set(&listener->pend_accepts_cnt, 0);
2904        listener->cm_core = cm_core;
2905        listener->iwdev = iwdev;
2906
2907        listener->backlog = cm_info->backlog;
2908        listener->listener_state = I40IW_CM_LISTENER_ACTIVE_STATE;
2909
2910        if (!listener->reused_node) {
2911                spin_lock_irqsave(&cm_core->listen_list_lock, flags);
2912                list_add(&listener->list, &cm_core->listen_nodes);
2913                spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
2914        }
2915
2916        return listener;
2917}
2918
2919/**
2920 * i40iw_create_cm_node - make a connection node with params
2921 * @cm_core: cm's core
2922 * @iwdev: iwarp device structure
2923 * @conn_param: upper layer connection parameters
2924 * @cm_info: quad info for connection
2925 */
2926static struct i40iw_cm_node *i40iw_create_cm_node(
2927                                        struct i40iw_cm_core *cm_core,
2928                                        struct i40iw_device *iwdev,
2929                                        struct iw_cm_conn_param *conn_param,
2930                                        struct i40iw_cm_info *cm_info)
2931{
2932        struct i40iw_cm_node *cm_node;
2933        struct i40iw_cm_listener *loopback_remotelistener;
2934        struct i40iw_cm_node *loopback_remotenode;
2935        struct i40iw_cm_info loopback_cm_info;
2936
2937        u16 private_data_len = conn_param->private_data_len;
2938        const void *private_data = conn_param->private_data;
2939
2940        /* create a CM connection node */
2941        cm_node = i40iw_make_cm_node(cm_core, iwdev, cm_info, NULL);
2942        if (!cm_node)
2943                return ERR_PTR(-ENOMEM);
2944        /* set our node side to client (active) side */
2945        cm_node->tcp_cntxt.client = 1;
2946        cm_node->tcp_cntxt.rcv_wscale = I40IW_CM_DEFAULT_RCV_WND_SCALE;
2947
2948        i40iw_record_ird_ord(cm_node, conn_param->ird, conn_param->ord);
2949
2950        if (!memcmp(cm_info->loc_addr, cm_info->rem_addr, sizeof(cm_info->loc_addr))) {
2951                loopback_remotelistener = i40iw_find_listener(
2952                                                cm_core,
2953                                                cm_info->rem_addr,
2954                                                cm_node->rem_port,
2955                                                cm_node->vlan_id,
2956                                                I40IW_CM_LISTENER_ACTIVE_STATE);
2957                if (!loopback_remotelistener) {
2958                        i40iw_rem_ref_cm_node(cm_node);
2959                        return ERR_PTR(-ECONNREFUSED);
2960                } else {
2961                        loopback_cm_info = *cm_info;
2962                        loopback_cm_info.loc_port = cm_info->rem_port;
2963                        loopback_cm_info.rem_port = cm_info->loc_port;
2964                        loopback_cm_info.cm_id = loopback_remotelistener->cm_id;
2965                        loopback_cm_info.ipv4 = cm_info->ipv4;
2966                        loopback_remotenode = i40iw_make_cm_node(cm_core,
2967                                                                 iwdev,
2968                                                                 &loopback_cm_info,
2969                                                                 loopback_remotelistener);
2970                        if (!loopback_remotenode) {
2971                                i40iw_rem_ref_cm_node(cm_node);
2972                                return ERR_PTR(-ENOMEM);
2973                        }
2974                        cm_core->stats_loopbacks++;
2975                        loopback_remotenode->loopbackpartner = cm_node;
2976                        loopback_remotenode->tcp_cntxt.rcv_wscale =
2977                                I40IW_CM_DEFAULT_RCV_WND_SCALE;
2978                        cm_node->loopbackpartner = loopback_remotenode;
2979                        memcpy(loopback_remotenode->pdata_buf, private_data,
2980                               private_data_len);
2981                        loopback_remotenode->pdata.size = private_data_len;
2982
2983                        if (loopback_remotenode->ord_size > cm_node->ird_size)
2984                                loopback_remotenode->ord_size =
2985                                        cm_node->ird_size;
2986
2987                        cm_node->state = I40IW_CM_STATE_OFFLOADED;
2988                        cm_node->tcp_cntxt.rcv_nxt =
2989                                loopback_remotenode->tcp_cntxt.loc_seq_num;
2990                        loopback_remotenode->tcp_cntxt.rcv_nxt =
2991                                cm_node->tcp_cntxt.loc_seq_num;
2992                        cm_node->tcp_cntxt.max_snd_wnd =
2993                                loopback_remotenode->tcp_cntxt.rcv_wnd;
2994                        loopback_remotenode->tcp_cntxt.max_snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
2995                        cm_node->tcp_cntxt.snd_wnd = loopback_remotenode->tcp_cntxt.rcv_wnd;
2996                        loopback_remotenode->tcp_cntxt.snd_wnd = cm_node->tcp_cntxt.rcv_wnd;
2997                        cm_node->tcp_cntxt.snd_wscale = loopback_remotenode->tcp_cntxt.rcv_wscale;
2998                        loopback_remotenode->tcp_cntxt.snd_wscale = cm_node->tcp_cntxt.rcv_wscale;
2999                }
3000                return cm_node;
3001        }
3002
3003        cm_node->pdata.size = private_data_len;
3004        cm_node->pdata.addr = cm_node->pdata_buf;
3005
3006        memcpy(cm_node->pdata_buf, private_data, private_data_len);
3007
3008        cm_node->state = I40IW_CM_STATE_SYN_SENT;
3009        return cm_node;
3010}
3011
3012/**
3013 * i40iw_cm_reject - reject and teardown a connection
3014 * @cm_node: connection's node
3015 * @pdate: ptr to private data for reject
3016 * @plen: size of private data
3017 */
3018static int i40iw_cm_reject(struct i40iw_cm_node *cm_node, const void *pdata, u8 plen)
3019{
3020        int ret = 0;
3021        int err;
3022        int passive_state;
3023        struct iw_cm_id *cm_id = cm_node->cm_id;
3024        struct i40iw_cm_node *loopback = cm_node->loopbackpartner;
3025
3026        if (cm_node->tcp_cntxt.client)
3027                return ret;
3028        i40iw_cleanup_retrans_entry(cm_node);
3029
3030        if (!loopback) {
3031                passive_state = atomic_add_return(1, &cm_node->passive_state);
3032                if (passive_state == I40IW_SEND_RESET_EVENT) {
3033                        cm_node->state = I40IW_CM_STATE_CLOSED;
3034                        i40iw_rem_ref_cm_node(cm_node);
3035                } else {
3036                        if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3037                                i40iw_rem_ref_cm_node(cm_node);
3038                        } else {
3039                                ret = i40iw_send_mpa_reject(cm_node, pdata, plen);
3040                                if (ret) {
3041                                        cm_node->state = I40IW_CM_STATE_CLOSED;
3042                                        err = i40iw_send_reset(cm_node);
3043                                        if (err)
3044                                                i40iw_pr_err("send reset failed\n");
3045                                } else {
3046                                        cm_id->add_ref(cm_id);
3047                                }
3048                        }
3049                }
3050        } else {
3051                cm_node->cm_id = NULL;
3052                if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3053                        i40iw_rem_ref_cm_node(cm_node);
3054                        i40iw_rem_ref_cm_node(loopback);
3055                } else {
3056                        ret = i40iw_send_cm_event(loopback,
3057                                                  loopback->cm_id,
3058                                                  IW_CM_EVENT_CONNECT_REPLY,
3059                                                  -ECONNREFUSED);
3060                        i40iw_rem_ref_cm_node(cm_node);
3061                        loopback->state = I40IW_CM_STATE_CLOSING;
3062
3063                        cm_id = loopback->cm_id;
3064                        i40iw_rem_ref_cm_node(loopback);
3065                        cm_id->rem_ref(cm_id);
3066                }
3067        }
3068
3069        return ret;
3070}
3071
3072/**
3073 * i40iw_cm_close - close of cm connection
3074 * @cm_node: connection's node
3075 */
3076static int i40iw_cm_close(struct i40iw_cm_node *cm_node)
3077{
3078        int ret = 0;
3079
3080        if (!cm_node)
3081                return -EINVAL;
3082
3083        switch (cm_node->state) {
3084        case I40IW_CM_STATE_SYN_RCVD:
3085        case I40IW_CM_STATE_SYN_SENT:
3086        case I40IW_CM_STATE_ONE_SIDE_ESTABLISHED:
3087        case I40IW_CM_STATE_ESTABLISHED:
3088        case I40IW_CM_STATE_ACCEPTING:
3089        case I40IW_CM_STATE_MPAREQ_SENT:
3090        case I40IW_CM_STATE_MPAREQ_RCVD:
3091                i40iw_cleanup_retrans_entry(cm_node);
3092                i40iw_send_reset(cm_node);
3093                break;
3094        case I40IW_CM_STATE_CLOSE_WAIT:
3095                cm_node->state = I40IW_CM_STATE_LAST_ACK;
3096                i40iw_send_fin(cm_node);
3097                break;
3098        case I40IW_CM_STATE_FIN_WAIT1:
3099        case I40IW_CM_STATE_FIN_WAIT2:
3100        case I40IW_CM_STATE_LAST_ACK:
3101        case I40IW_CM_STATE_TIME_WAIT:
3102        case I40IW_CM_STATE_CLOSING:
3103                ret = -1;
3104                break;
3105        case I40IW_CM_STATE_LISTENING:
3106                i40iw_cleanup_retrans_entry(cm_node);
3107                i40iw_send_reset(cm_node);
3108                break;
3109        case I40IW_CM_STATE_MPAREJ_RCVD:
3110        case I40IW_CM_STATE_UNKNOWN:
3111        case I40IW_CM_STATE_INITED:
3112        case I40IW_CM_STATE_CLOSED:
3113        case I40IW_CM_STATE_LISTENER_DESTROYED:
3114                i40iw_rem_ref_cm_node(cm_node);
3115                break;
3116        case I40IW_CM_STATE_OFFLOADED:
3117                if (cm_node->send_entry)
3118                        i40iw_pr_err("send_entry\n");
3119                i40iw_rem_ref_cm_node(cm_node);
3120                break;
3121        }
3122        return ret;
3123}
3124
3125/**
3126 * i40iw_receive_ilq - recv an ETHERNET packet, and process it
3127 * through CM
3128 * @vsi: pointer to the vsi structure
3129 * @rbuf: receive buffer
3130 */
3131void i40iw_receive_ilq(struct i40iw_sc_vsi *vsi, struct i40iw_puda_buf *rbuf)
3132{
3133        struct i40iw_cm_node *cm_node;
3134        struct i40iw_cm_listener *listener;
3135        struct iphdr *iph;
3136        struct ipv6hdr *ip6h;
3137        struct tcphdr *tcph;
3138        struct i40iw_cm_info cm_info;
3139        struct i40iw_sc_dev *dev = vsi->dev;
3140        struct i40iw_device *iwdev = (struct i40iw_device *)dev->back_dev;
3141        struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3142        struct vlan_ethhdr *ethh;
3143        u16 vtag;
3144
3145        /* if vlan, then maclen = 18 else 14 */
3146        iph = (struct iphdr *)rbuf->iph;
3147        memset(&cm_info, 0, sizeof(cm_info));
3148
3149        i40iw_debug_buf(dev,
3150                        I40IW_DEBUG_ILQ,
3151                        "RECEIVE ILQ BUFFER",
3152                        rbuf->mem.va,
3153                        rbuf->totallen);
3154        ethh = (struct vlan_ethhdr *)rbuf->mem.va;
3155
3156        if (ethh->h_vlan_proto == htons(ETH_P_8021Q)) {
3157                vtag = ntohs(ethh->h_vlan_TCI);
3158                cm_info.user_pri = (vtag & VLAN_PRIO_MASK) >> VLAN_PRIO_SHIFT;
3159                cm_info.vlan_id = vtag & VLAN_VID_MASK;
3160                i40iw_debug(cm_core->dev,
3161                            I40IW_DEBUG_CM,
3162                            "%s vlan_id=%d\n",
3163                            __func__,
3164                            cm_info.vlan_id);
3165        } else {
3166                cm_info.vlan_id = I40IW_NO_VLAN;
3167        }
3168        tcph = (struct tcphdr *)rbuf->tcph;
3169
3170        if (rbuf->ipv4) {
3171                cm_info.loc_addr[0] = ntohl(iph->daddr);
3172                cm_info.rem_addr[0] = ntohl(iph->saddr);
3173                cm_info.ipv4 = true;
3174                cm_info.tos = iph->tos;
3175        } else {
3176                ip6h = (struct ipv6hdr *)rbuf->iph;
3177                i40iw_copy_ip_ntohl(cm_info.loc_addr,
3178                                    ip6h->daddr.in6_u.u6_addr32);
3179                i40iw_copy_ip_ntohl(cm_info.rem_addr,
3180                                    ip6h->saddr.in6_u.u6_addr32);
3181                cm_info.ipv4 = false;
3182                cm_info.tos = (ip6h->priority << 4) | (ip6h->flow_lbl[0] >> 4);
3183        }
3184        cm_info.loc_port = ntohs(tcph->dest);
3185        cm_info.rem_port = ntohs(tcph->source);
3186        cm_node = i40iw_find_node(cm_core,
3187                                  cm_info.rem_port,
3188                                  cm_info.rem_addr,
3189                                  cm_info.loc_port,
3190                                  cm_info.loc_addr,
3191                                  true,
3192                                  false);
3193
3194        if (!cm_node) {
3195                /* Only type of packet accepted are for */
3196                /* the PASSIVE open (syn only) */
3197                if (!tcph->syn || tcph->ack)
3198                        return;
3199                listener =
3200                    i40iw_find_listener(cm_core,
3201                                        cm_info.loc_addr,
3202                                        cm_info.loc_port,
3203                                        cm_info.vlan_id,
3204                                        I40IW_CM_LISTENER_ACTIVE_STATE);
3205                if (!listener) {
3206                        cm_info.cm_id = NULL;
3207                        i40iw_debug(cm_core->dev,
3208                                    I40IW_DEBUG_CM,
3209                                    "%s no listener found\n",
3210                                    __func__);
3211                        return;
3212                }
3213                cm_info.cm_id = listener->cm_id;
3214                cm_node = i40iw_make_cm_node(cm_core, iwdev, &cm_info, listener);
3215                if (!cm_node) {
3216                        i40iw_debug(cm_core->dev,
3217                                    I40IW_DEBUG_CM,
3218                                    "%s allocate node failed\n",
3219                                    __func__);
3220                        atomic_dec(&listener->ref_count);
3221                        return;
3222                }
3223                if (!tcph->rst && !tcph->fin) {
3224                        cm_node->state = I40IW_CM_STATE_LISTENING;
3225                } else {
3226                        i40iw_rem_ref_cm_node(cm_node);
3227                        return;
3228                }
3229                atomic_inc(&cm_node->ref_count);
3230        } else if (cm_node->state == I40IW_CM_STATE_OFFLOADED) {
3231                i40iw_rem_ref_cm_node(cm_node);
3232                return;
3233        }
3234        i40iw_process_packet(cm_node, rbuf);
3235        i40iw_rem_ref_cm_node(cm_node);
3236}
3237
3238/**
3239 * i40iw_setup_cm_core - allocate a top level instance of a cm
3240 * core
3241 * @iwdev: iwarp device structure
3242 */
3243int i40iw_setup_cm_core(struct i40iw_device *iwdev)
3244{
3245        struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3246
3247        cm_core->iwdev = iwdev;
3248        cm_core->dev = &iwdev->sc_dev;
3249
3250        INIT_LIST_HEAD(&cm_core->accelerated_list);
3251        INIT_LIST_HEAD(&cm_core->non_accelerated_list);
3252        INIT_LIST_HEAD(&cm_core->listen_nodes);
3253
3254        timer_setup(&cm_core->tcp_timer, i40iw_cm_timer_tick, 0);
3255
3256        spin_lock_init(&cm_core->ht_lock);
3257        spin_lock_init(&cm_core->listen_list_lock);
3258        spin_lock_init(&cm_core->apbvt_lock);
3259
3260        cm_core->event_wq = alloc_ordered_workqueue("iwewq",
3261                                                    WQ_MEM_RECLAIM);
3262        if (!cm_core->event_wq)
3263                goto error;
3264
3265        cm_core->disconn_wq = alloc_ordered_workqueue("iwdwq",
3266                                                      WQ_MEM_RECLAIM);
3267        if (!cm_core->disconn_wq)
3268                goto error;
3269
3270        return 0;
3271error:
3272        i40iw_cleanup_cm_core(&iwdev->cm_core);
3273
3274        return -ENOMEM;
3275}
3276
3277/**
3278 * i40iw_cleanup_cm_core - deallocate a top level instance of a
3279 * cm core
3280 * @cm_core: cm's core
3281 */
3282void i40iw_cleanup_cm_core(struct i40iw_cm_core *cm_core)
3283{
3284        unsigned long flags;
3285
3286        if (!cm_core)
3287                return;
3288
3289        spin_lock_irqsave(&cm_core->ht_lock, flags);
3290        if (timer_pending(&cm_core->tcp_timer))
3291                del_timer_sync(&cm_core->tcp_timer);
3292        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3293
3294        if (cm_core->event_wq)
3295                destroy_workqueue(cm_core->event_wq);
3296        if (cm_core->disconn_wq)
3297                destroy_workqueue(cm_core->disconn_wq);
3298}
3299
3300/**
3301 * i40iw_init_tcp_ctx - setup qp context
3302 * @cm_node: connection's node
3303 * @tcp_info: offload info for tcp
3304 * @iwqp: associate qp for the connection
3305 */
3306static void i40iw_init_tcp_ctx(struct i40iw_cm_node *cm_node,
3307                               struct i40iw_tcp_offload_info *tcp_info,
3308                               struct i40iw_qp *iwqp)
3309{
3310        tcp_info->ipv4 = cm_node->ipv4;
3311        tcp_info->drop_ooo_seg = true;
3312        tcp_info->wscale = true;
3313        tcp_info->ignore_tcp_opt = true;
3314        tcp_info->ignore_tcp_uns_opt = true;
3315        tcp_info->no_nagle = false;
3316
3317        tcp_info->ttl = I40IW_DEFAULT_TTL;
3318        tcp_info->rtt_var = cpu_to_le32(I40IW_DEFAULT_RTT_VAR);
3319        tcp_info->ss_thresh = cpu_to_le32(I40IW_DEFAULT_SS_THRESH);
3320        tcp_info->rexmit_thresh = I40IW_DEFAULT_REXMIT_THRESH;
3321
3322        tcp_info->tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3323        tcp_info->snd_wscale = cm_node->tcp_cntxt.snd_wscale;
3324        tcp_info->rcv_wscale = cm_node->tcp_cntxt.rcv_wscale;
3325
3326        tcp_info->snd_nxt = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3327        tcp_info->snd_wnd = cpu_to_le32(cm_node->tcp_cntxt.snd_wnd);
3328        tcp_info->rcv_nxt = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3329        tcp_info->snd_max = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3330
3331        tcp_info->snd_una = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3332        tcp_info->cwnd = cpu_to_le32(2 * cm_node->tcp_cntxt.mss);
3333        tcp_info->snd_wl1 = cpu_to_le32(cm_node->tcp_cntxt.rcv_nxt);
3334        tcp_info->snd_wl2 = cpu_to_le32(cm_node->tcp_cntxt.loc_seq_num);
3335        tcp_info->max_snd_window = cpu_to_le32(cm_node->tcp_cntxt.max_snd_wnd);
3336        tcp_info->rcv_wnd = cpu_to_le32(cm_node->tcp_cntxt.rcv_wnd <<
3337                                        cm_node->tcp_cntxt.rcv_wscale);
3338
3339        tcp_info->flow_label = 0;
3340        tcp_info->snd_mss = cpu_to_le32(((u32)cm_node->tcp_cntxt.mss));
3341        if (cm_node->vlan_id <= VLAN_VID_MASK) {
3342                tcp_info->insert_vlan_tag = true;
3343                tcp_info->vlan_tag = cpu_to_le16(((u16)cm_node->user_pri << I40IW_VLAN_PRIO_SHIFT) |
3344                                                  cm_node->vlan_id);
3345        }
3346        if (cm_node->ipv4) {
3347                tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3348                tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3349
3350                tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[0]);
3351                tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[0]);
3352                tcp_info->arp_idx =
3353                        cpu_to_le16((u16)i40iw_arp_table(
3354                                                         iwqp->iwdev,
3355                                                         &tcp_info->dest_ip_addr3,
3356                                                         true,
3357                                                         NULL,
3358                                                         I40IW_ARP_RESOLVE));
3359        } else {
3360                tcp_info->src_port = cpu_to_le16(cm_node->loc_port);
3361                tcp_info->dst_port = cpu_to_le16(cm_node->rem_port);
3362                tcp_info->dest_ip_addr0 = cpu_to_le32(cm_node->rem_addr[0]);
3363                tcp_info->dest_ip_addr1 = cpu_to_le32(cm_node->rem_addr[1]);
3364                tcp_info->dest_ip_addr2 = cpu_to_le32(cm_node->rem_addr[2]);
3365                tcp_info->dest_ip_addr3 = cpu_to_le32(cm_node->rem_addr[3]);
3366                tcp_info->local_ipaddr0 = cpu_to_le32(cm_node->loc_addr[0]);
3367                tcp_info->local_ipaddr1 = cpu_to_le32(cm_node->loc_addr[1]);
3368                tcp_info->local_ipaddr2 = cpu_to_le32(cm_node->loc_addr[2]);
3369                tcp_info->local_ipaddr3 = cpu_to_le32(cm_node->loc_addr[3]);
3370                tcp_info->arp_idx =
3371                        cpu_to_le16((u16)i40iw_arp_table(
3372                                                         iwqp->iwdev,
3373                                                         &tcp_info->dest_ip_addr0,
3374                                                         false,
3375                                                         NULL,
3376                                                         I40IW_ARP_RESOLVE));
3377        }
3378}
3379
3380/**
3381 * i40iw_cm_init_tsa_conn - setup qp for RTS
3382 * @iwqp: associate qp for the connection
3383 * @cm_node: connection's node
3384 */
3385static void i40iw_cm_init_tsa_conn(struct i40iw_qp *iwqp,
3386                                   struct i40iw_cm_node *cm_node)
3387{
3388        struct i40iw_tcp_offload_info tcp_info;
3389        struct i40iwarp_offload_info *iwarp_info;
3390        struct i40iw_qp_host_ctx_info *ctx_info;
3391        struct i40iw_device *iwdev = iwqp->iwdev;
3392        struct i40iw_sc_dev *dev = &iwqp->iwdev->sc_dev;
3393
3394        memset(&tcp_info, 0x00, sizeof(struct i40iw_tcp_offload_info));
3395        iwarp_info = &iwqp->iwarp_info;
3396        ctx_info = &iwqp->ctx_info;
3397
3398        ctx_info->tcp_info = &tcp_info;
3399        ctx_info->send_cq_num = iwqp->iwscq->sc_cq.cq_uk.cq_id;
3400        ctx_info->rcv_cq_num = iwqp->iwrcq->sc_cq.cq_uk.cq_id;
3401
3402        iwarp_info->ord_size = cm_node->ord_size;
3403        iwarp_info->ird_size = i40iw_derive_hw_ird_setting(cm_node->ird_size);
3404
3405        if (iwarp_info->ord_size == 1)
3406                iwarp_info->ord_size = 2;
3407
3408        iwarp_info->rd_enable = true;
3409        iwarp_info->rdmap_ver = 1;
3410        iwarp_info->ddp_ver = 1;
3411
3412        iwarp_info->pd_id = iwqp->iwpd->sc_pd.pd_id;
3413
3414        ctx_info->tcp_info_valid = true;
3415        ctx_info->iwarp_info_valid = true;
3416        ctx_info->add_to_qoslist = true;
3417        ctx_info->user_pri = cm_node->user_pri;
3418
3419        i40iw_init_tcp_ctx(cm_node, &tcp_info, iwqp);
3420        if (cm_node->snd_mark_en) {
3421                iwarp_info->snd_mark_en = true;
3422                iwarp_info->snd_mark_offset = (tcp_info.snd_nxt &
3423                                SNDMARKER_SEQNMASK) + cm_node->lsmm_size;
3424        }
3425
3426        cm_node->state = I40IW_CM_STATE_OFFLOADED;
3427        tcp_info.tcp_state = I40IW_TCP_STATE_ESTABLISHED;
3428        tcp_info.src_mac_addr_idx = iwdev->mac_ip_table_idx;
3429        tcp_info.tos = cm_node->tos;
3430
3431        dev->iw_priv_qp_ops->qp_setctx(&iwqp->sc_qp, (u64 *)(iwqp->host_ctx.va), ctx_info);
3432
3433        /* once tcp_info is set, no need to do it again */
3434        ctx_info->tcp_info_valid = false;
3435        ctx_info->iwarp_info_valid = false;
3436        ctx_info->add_to_qoslist = false;
3437}
3438
3439/**
3440 * i40iw_cm_disconn - when a connection is being closed
3441 * @iwqp: associate qp for the connection
3442 */
3443void i40iw_cm_disconn(struct i40iw_qp *iwqp)
3444{
3445        struct disconn_work *work;
3446        struct i40iw_device *iwdev = iwqp->iwdev;
3447        struct i40iw_cm_core *cm_core = &iwdev->cm_core;
3448        unsigned long flags;
3449
3450        work = kzalloc(sizeof(*work), GFP_ATOMIC);
3451        if (!work)
3452                return; /* Timer will clean up */
3453
3454        spin_lock_irqsave(&iwdev->qptable_lock, flags);
3455        if (!iwdev->qp_table[iwqp->ibqp.qp_num]) {
3456                spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3457                i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM,
3458                            "%s qp_id %d is already freed\n",
3459                             __func__, iwqp->ibqp.qp_num);
3460                kfree(work);
3461                return;
3462        }
3463        i40iw_add_ref(&iwqp->ibqp);
3464        spin_unlock_irqrestore(&iwdev->qptable_lock, flags);
3465
3466        work->iwqp = iwqp;
3467        INIT_WORK(&work->work, i40iw_disconnect_worker);
3468        queue_work(cm_core->disconn_wq, &work->work);
3469        return;
3470}
3471
3472/**
3473 * i40iw_qp_disconnect - free qp and close cm
3474 * @iwqp: associate qp for the connection
3475 */
3476static void i40iw_qp_disconnect(struct i40iw_qp *iwqp)
3477{
3478        struct i40iw_device *iwdev;
3479        struct i40iw_ib_device *iwibdev;
3480
3481        iwdev = to_iwdev(iwqp->ibqp.device);
3482        if (!iwdev) {
3483                i40iw_pr_err("iwdev == NULL\n");
3484                return;
3485        }
3486
3487        iwibdev = iwdev->iwibdev;
3488
3489        if (iwqp->active_conn) {
3490                /* indicate this connection is NOT active */
3491                iwqp->active_conn = 0;
3492        } else {
3493                /* Need to free the Last Streaming Mode Message */
3494                if (iwqp->ietf_mem.va) {
3495                        if (iwqp->lsmm_mr)
3496                                iwibdev->ibdev.ops.dereg_mr(iwqp->lsmm_mr,
3497                                                            NULL);
3498                        i40iw_free_dma_mem(iwdev->sc_dev.hw, &iwqp->ietf_mem);
3499                }
3500        }
3501
3502        /* close the CM node down if it is still active */
3503        if (iwqp->cm_node) {
3504                i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_CM, "%s Call close API\n", __func__);
3505                i40iw_cm_close(iwqp->cm_node);
3506        }
3507}
3508
3509/**
3510 * i40iw_cm_disconn_true - called by worker thread to disconnect qp
3511 * @iwqp: associate qp for the connection
3512 */
3513static void i40iw_cm_disconn_true(struct i40iw_qp *iwqp)
3514{
3515        struct iw_cm_id *cm_id;
3516        struct i40iw_device *iwdev;
3517        struct i40iw_sc_qp *qp = &iwqp->sc_qp;
3518        u16 last_ae;
3519        u8 original_hw_tcp_state;
3520        u8 original_ibqp_state;
3521        int disconn_status = 0;
3522        int issue_disconn = 0;
3523        int issue_close = 0;
3524        int issue_flush = 0;
3525        struct ib_event ibevent;
3526        unsigned long flags;
3527        int ret;
3528
3529        if (!iwqp) {
3530                i40iw_pr_err("iwqp == NULL\n");
3531                return;
3532        }
3533
3534        spin_lock_irqsave(&iwqp->lock, flags);
3535        cm_id = iwqp->cm_id;
3536        /* make sure we havent already closed this connection */
3537        if (!cm_id) {
3538                spin_unlock_irqrestore(&iwqp->lock, flags);
3539                return;
3540        }
3541
3542        iwdev = to_iwdev(iwqp->ibqp.device);
3543
3544        original_hw_tcp_state = iwqp->hw_tcp_state;
3545        original_ibqp_state = iwqp->ibqp_state;
3546        last_ae = iwqp->last_aeq;
3547
3548        if (qp->term_flags) {
3549                issue_disconn = 1;
3550                issue_close = 1;
3551                iwqp->cm_id = NULL;
3552                /*When term timer expires after cm_timer, don't want
3553                 *terminate-handler to issue cm_disconn which can re-free
3554                 *a QP even after its refcnt=0.
3555                 */
3556                i40iw_terminate_del_timer(qp);
3557                if (!iwqp->flush_issued) {
3558                        iwqp->flush_issued = 1;
3559                        issue_flush = 1;
3560                }
3561        } else if ((original_hw_tcp_state == I40IW_TCP_STATE_CLOSE_WAIT) ||
3562                   ((original_ibqp_state == IB_QPS_RTS) &&
3563                    (last_ae == I40IW_AE_LLP_CONNECTION_RESET))) {
3564                issue_disconn = 1;
3565                if (last_ae == I40IW_AE_LLP_CONNECTION_RESET)
3566                        disconn_status = -ECONNRESET;
3567        }
3568
3569        if (((original_hw_tcp_state == I40IW_TCP_STATE_CLOSED) ||
3570             (original_hw_tcp_state == I40IW_TCP_STATE_TIME_WAIT) ||
3571             (last_ae == I40IW_AE_RDMAP_ROE_BAD_LLP_CLOSE) ||
3572             (last_ae == I40IW_AE_LLP_CONNECTION_RESET) ||
3573              iwdev->reset)) {
3574                issue_close = 1;
3575                iwqp->cm_id = NULL;
3576                if (!iwqp->flush_issued) {
3577                        iwqp->flush_issued = 1;
3578                        issue_flush = 1;
3579                }
3580        }
3581
3582        spin_unlock_irqrestore(&iwqp->lock, flags);
3583        if (issue_flush && !iwqp->destroyed) {
3584                /* Flush the queues */
3585                i40iw_flush_wqes(iwdev, iwqp);
3586
3587                if (qp->term_flags && iwqp->ibqp.event_handler) {
3588                        ibevent.device = iwqp->ibqp.device;
3589                        ibevent.event = (qp->eventtype == TERM_EVENT_QP_FATAL) ?
3590                                        IB_EVENT_QP_FATAL : IB_EVENT_QP_ACCESS_ERR;
3591                        ibevent.element.qp = &iwqp->ibqp;
3592                        iwqp->ibqp.event_handler(&ibevent, iwqp->ibqp.qp_context);
3593                }
3594        }
3595
3596        if (cm_id && cm_id->event_handler) {
3597                if (issue_disconn) {
3598                        ret = i40iw_send_cm_event(NULL,
3599                                                  cm_id,
3600                                                  IW_CM_EVENT_DISCONNECT,
3601                                                  disconn_status);
3602
3603                        if (ret)
3604                                i40iw_debug(&iwdev->sc_dev,
3605                                            I40IW_DEBUG_CM,
3606                                            "disconnect event failed %s: - cm_id = %p\n",
3607                                            __func__, cm_id);
3608                }
3609                if (issue_close) {
3610                        i40iw_qp_disconnect(iwqp);
3611                        cm_id->provider_data = iwqp;
3612                        ret = i40iw_send_cm_event(NULL, cm_id, IW_CM_EVENT_CLOSE, 0);
3613                        if (ret)
3614                                i40iw_debug(&iwdev->sc_dev,
3615                                            I40IW_DEBUG_CM,
3616                                            "close event failed %s: - cm_id = %p\n",
3617                                            __func__, cm_id);
3618                        cm_id->rem_ref(cm_id);
3619                }
3620        }
3621}
3622
3623/**
3624 * i40iw_disconnect_worker - worker for connection close
3625 * @work: points or disconn structure
3626 */
3627static void i40iw_disconnect_worker(struct work_struct *work)
3628{
3629        struct disconn_work *dwork = container_of(work, struct disconn_work, work);
3630        struct i40iw_qp *iwqp = dwork->iwqp;
3631
3632        kfree(dwork);
3633        i40iw_cm_disconn_true(iwqp);
3634        i40iw_rem_ref(&iwqp->ibqp);
3635}
3636
3637/**
3638 * i40iw_accept - registered call for connection to be accepted
3639 * @cm_id: cm information for passive connection
3640 * @conn_param: accpet parameters
3641 */
3642int i40iw_accept(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3643{
3644        struct ib_qp *ibqp;
3645        struct i40iw_qp *iwqp;
3646        struct i40iw_device *iwdev;
3647        struct i40iw_sc_dev *dev;
3648        struct i40iw_cm_core *cm_core;
3649        struct i40iw_cm_node *cm_node;
3650        struct ib_qp_attr attr;
3651        int passive_state;
3652        struct ib_mr *ibmr;
3653        struct i40iw_pd *iwpd;
3654        u16 buf_len = 0;
3655        struct i40iw_kmem_info accept;
3656        enum i40iw_status_code status;
3657        u64 tagged_offset;
3658        unsigned long flags;
3659
3660        memset(&attr, 0, sizeof(attr));
3661        ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3662        if (!ibqp)
3663                return -EINVAL;
3664
3665        iwqp = to_iwqp(ibqp);
3666        iwdev = iwqp->iwdev;
3667        dev = &iwdev->sc_dev;
3668        cm_core = &iwdev->cm_core;
3669        cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3670
3671        if (((struct sockaddr_in *)&cm_id->local_addr)->sin_family == AF_INET) {
3672                cm_node->ipv4 = true;
3673                cm_node->vlan_id = i40iw_get_vlan_ipv4(cm_node->loc_addr);
3674        } else {
3675                cm_node->ipv4 = false;
3676                i40iw_netdev_vlan_ipv6(cm_node->loc_addr, &cm_node->vlan_id);
3677        }
3678        i40iw_debug(cm_node->dev,
3679                    I40IW_DEBUG_CM,
3680                    "Accept vlan_id=%d\n",
3681                    cm_node->vlan_id);
3682        if (cm_node->state == I40IW_CM_STATE_LISTENER_DESTROYED) {
3683                if (cm_node->loopbackpartner)
3684                        i40iw_rem_ref_cm_node(cm_node->loopbackpartner);
3685                i40iw_rem_ref_cm_node(cm_node);
3686                return -EINVAL;
3687        }
3688
3689        passive_state = atomic_add_return(1, &cm_node->passive_state);
3690        if (passive_state == I40IW_SEND_RESET_EVENT) {
3691                i40iw_rem_ref_cm_node(cm_node);
3692                return -ECONNRESET;
3693        }
3694
3695        cm_node->cm_core->stats_accepts++;
3696        iwqp->cm_node = (void *)cm_node;
3697        cm_node->iwqp = iwqp;
3698
3699        buf_len = conn_param->private_data_len + I40IW_MAX_IETF_SIZE;
3700
3701        status = i40iw_allocate_dma_mem(dev->hw, &iwqp->ietf_mem, buf_len, 1);
3702
3703        if (status)
3704                return -ENOMEM;
3705        cm_node->pdata.size = conn_param->private_data_len;
3706        accept.addr = iwqp->ietf_mem.va;
3707        accept.size = i40iw_cm_build_mpa_frame(cm_node, &accept, MPA_KEY_REPLY);
3708        memcpy(accept.addr + accept.size, conn_param->private_data,
3709               conn_param->private_data_len);
3710
3711        /* setup our first outgoing iWarp send WQE (the IETF frame response) */
3712        if ((cm_node->ipv4 &&
3713             !i40iw_ipv4_is_loopback(cm_node->loc_addr[0], cm_node->rem_addr[0])) ||
3714            (!cm_node->ipv4 &&
3715             !i40iw_ipv6_is_loopback(cm_node->loc_addr, cm_node->rem_addr))) {
3716                iwpd = iwqp->iwpd;
3717                tagged_offset = (uintptr_t)iwqp->ietf_mem.va;
3718                ibmr = i40iw_reg_phys_mr(&iwpd->ibpd,
3719                                         iwqp->ietf_mem.pa,
3720                                         buf_len,
3721                                         IB_ACCESS_LOCAL_WRITE,
3722                                         &tagged_offset);
3723                if (IS_ERR(ibmr)) {
3724                        i40iw_free_dma_mem(dev->hw, &iwqp->ietf_mem);
3725                        return -ENOMEM;
3726                }
3727
3728                ibmr->pd = &iwpd->ibpd;
3729                ibmr->device = iwpd->ibpd.device;
3730                iwqp->lsmm_mr = ibmr;
3731                if (iwqp->page)
3732                        iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
3733                dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp,
3734                                                        iwqp->ietf_mem.va,
3735                                                        (accept.size + conn_param->private_data_len),
3736                                                        ibmr->lkey);
3737
3738        } else {
3739                if (iwqp->page)
3740                        iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
3741                dev->iw_priv_qp_ops->qp_send_lsmm(&iwqp->sc_qp, NULL, 0, 0);
3742        }
3743
3744        if (iwqp->page)
3745                kunmap(iwqp->page);
3746
3747        iwqp->cm_id = cm_id;
3748        cm_node->cm_id = cm_id;
3749
3750        cm_id->provider_data = (void *)iwqp;
3751        iwqp->active_conn = 0;
3752
3753        cm_node->lsmm_size = accept.size + conn_param->private_data_len;
3754        i40iw_cm_init_tsa_conn(iwqp, cm_node);
3755        cm_id->add_ref(cm_id);
3756        i40iw_add_ref(&iwqp->ibqp);
3757
3758        attr.qp_state = IB_QPS_RTS;
3759        cm_node->qhash_set = false;
3760        i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
3761
3762        cm_node->accelerated = true;
3763        spin_lock_irqsave(&cm_core->ht_lock, flags);
3764        list_move_tail(&cm_node->list, &cm_core->accelerated_list);
3765        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
3766
3767        status =
3768                i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_ESTABLISHED, 0);
3769        if (status)
3770                i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - ESTABLISHED\n");
3771
3772        if (cm_node->loopbackpartner) {
3773                cm_node->loopbackpartner->pdata.size = conn_param->private_data_len;
3774
3775                /* copy entire MPA frame to our cm_node's frame */
3776                memcpy(cm_node->loopbackpartner->pdata_buf,
3777                       conn_param->private_data,
3778                       conn_param->private_data_len);
3779                i40iw_create_event(cm_node->loopbackpartner, I40IW_CM_EVENT_CONNECTED);
3780        }
3781
3782        if (cm_node->accept_pend) {
3783                atomic_dec(&cm_node->listener->pend_accepts_cnt);
3784                cm_node->accept_pend = 0;
3785        }
3786        return 0;
3787}
3788
3789/**
3790 * i40iw_reject - registered call for connection to be rejected
3791 * @cm_id: cm information for passive connection
3792 * @pdata: private data to be sent
3793 * @pdata_len: private data length
3794 */
3795int i40iw_reject(struct iw_cm_id *cm_id, const void *pdata, u8 pdata_len)
3796{
3797        struct i40iw_device *iwdev;
3798        struct i40iw_cm_node *cm_node;
3799        struct i40iw_cm_node *loopback;
3800
3801        cm_node = (struct i40iw_cm_node *)cm_id->provider_data;
3802        loopback = cm_node->loopbackpartner;
3803        cm_node->cm_id = cm_id;
3804        cm_node->pdata.size = pdata_len;
3805
3806        iwdev = to_iwdev(cm_id->device);
3807        if (!iwdev)
3808                return -EINVAL;
3809        cm_node->cm_core->stats_rejects++;
3810
3811        if (pdata_len + sizeof(struct ietf_mpa_v2) > MAX_CM_BUFFER)
3812                return -EINVAL;
3813
3814        if (loopback) {
3815                memcpy(&loopback->pdata_buf, pdata, pdata_len);
3816                loopback->pdata.size = pdata_len;
3817        }
3818
3819        return i40iw_cm_reject(cm_node, pdata, pdata_len);
3820}
3821
3822/**
3823 * i40iw_connect - registered call for connection to be established
3824 * @cm_id: cm information for passive connection
3825 * @conn_param: Information about the connection
3826 */
3827int i40iw_connect(struct iw_cm_id *cm_id, struct iw_cm_conn_param *conn_param)
3828{
3829        struct ib_qp *ibqp;
3830        struct i40iw_qp *iwqp;
3831        struct i40iw_device *iwdev;
3832        struct i40iw_cm_node *cm_node;
3833        struct i40iw_cm_info cm_info;
3834        struct sockaddr_in *laddr;
3835        struct sockaddr_in *raddr;
3836        struct sockaddr_in6 *laddr6;
3837        struct sockaddr_in6 *raddr6;
3838        int ret = 0;
3839
3840        ibqp = i40iw_get_qp(cm_id->device, conn_param->qpn);
3841        if (!ibqp)
3842                return -EINVAL;
3843        iwqp = to_iwqp(ibqp);
3844        if (!iwqp)
3845                return -EINVAL;
3846        iwdev = to_iwdev(iwqp->ibqp.device);
3847        if (!iwdev)
3848                return -EINVAL;
3849
3850        laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3851        raddr = (struct sockaddr_in *)&cm_id->m_remote_addr;
3852        laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3853        raddr6 = (struct sockaddr_in6 *)&cm_id->m_remote_addr;
3854
3855        if (!(laddr->sin_port) || !(raddr->sin_port))
3856                return -EINVAL;
3857
3858        iwqp->active_conn = 1;
3859        iwqp->cm_id = NULL;
3860        cm_id->provider_data = iwqp;
3861
3862        /* set up the connection params for the node */
3863        if (cm_id->remote_addr.ss_family == AF_INET) {
3864                cm_info.ipv4 = true;
3865                memset(cm_info.loc_addr, 0, sizeof(cm_info.loc_addr));
3866                memset(cm_info.rem_addr, 0, sizeof(cm_info.rem_addr));
3867                cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3868                cm_info.rem_addr[0] = ntohl(raddr->sin_addr.s_addr);
3869                cm_info.loc_port = ntohs(laddr->sin_port);
3870                cm_info.rem_port = ntohs(raddr->sin_port);
3871                cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3872        } else {
3873                cm_info.ipv4 = false;
3874                i40iw_copy_ip_ntohl(cm_info.loc_addr,
3875                                    laddr6->sin6_addr.in6_u.u6_addr32);
3876                i40iw_copy_ip_ntohl(cm_info.rem_addr,
3877                                    raddr6->sin6_addr.in6_u.u6_addr32);
3878                cm_info.loc_port = ntohs(laddr6->sin6_port);
3879                cm_info.rem_port = ntohs(raddr6->sin6_port);
3880                i40iw_netdev_vlan_ipv6(cm_info.loc_addr, &cm_info.vlan_id);
3881        }
3882        cm_info.cm_id = cm_id;
3883        cm_info.tos = cm_id->tos;
3884        cm_info.user_pri = rt_tos2priority(cm_id->tos);
3885        i40iw_debug(&iwdev->sc_dev, I40IW_DEBUG_DCB, "%s TOS:[%d] UP:[%d]\n",
3886                    __func__, cm_id->tos, cm_info.user_pri);
3887        cm_id->add_ref(cm_id);
3888        cm_node = i40iw_create_cm_node(&iwdev->cm_core, iwdev,
3889                                       conn_param, &cm_info);
3890
3891        if (IS_ERR(cm_node)) {
3892                ret = PTR_ERR(cm_node);
3893                cm_id->rem_ref(cm_id);
3894                return ret;
3895        }
3896
3897        if ((cm_info.ipv4 && (laddr->sin_addr.s_addr != raddr->sin_addr.s_addr)) ||
3898            (!cm_info.ipv4 && memcmp(laddr6->sin6_addr.in6_u.u6_addr32,
3899                                     raddr6->sin6_addr.in6_u.u6_addr32,
3900                                     sizeof(laddr6->sin6_addr.in6_u.u6_addr32)))) {
3901                if (i40iw_manage_qhash(iwdev, &cm_info, I40IW_QHASH_TYPE_TCP_ESTABLISHED,
3902                                       I40IW_QHASH_MANAGE_TYPE_ADD, NULL, true)) {
3903                        ret = -EINVAL;
3904                        goto err;
3905                }
3906                cm_node->qhash_set = true;
3907        }
3908
3909        if (i40iw_manage_apbvt(iwdev, cm_info.loc_port,
3910                               I40IW_MANAGE_APBVT_ADD)) {
3911                ret =  -EINVAL;
3912                goto err;
3913        }
3914
3915        cm_node->apbvt_set = true;
3916        iwqp->cm_node = cm_node;
3917        cm_node->iwqp = iwqp;
3918        iwqp->cm_id = cm_id;
3919        i40iw_add_ref(&iwqp->ibqp);
3920
3921        if (cm_node->state != I40IW_CM_STATE_OFFLOADED) {
3922                cm_node->state = I40IW_CM_STATE_SYN_SENT;
3923                ret = i40iw_send_syn(cm_node, 0);
3924                if (ret)
3925                        goto err;
3926        }
3927
3928        if (cm_node->loopbackpartner) {
3929                cm_node->loopbackpartner->state = I40IW_CM_STATE_MPAREQ_RCVD;
3930                i40iw_create_event(cm_node->loopbackpartner,
3931                                   I40IW_CM_EVENT_MPA_REQ);
3932        }
3933
3934        i40iw_debug(cm_node->dev,
3935                    I40IW_DEBUG_CM,
3936                    "Api - connect(): port=0x%04x, cm_node=%p, cm_id = %p.\n",
3937                    cm_node->rem_port,
3938                    cm_node,
3939                    cm_node->cm_id);
3940
3941        return 0;
3942
3943err:
3944        if (cm_info.ipv4)
3945                i40iw_debug(&iwdev->sc_dev,
3946                            I40IW_DEBUG_CM,
3947                            "Api - connect() FAILED: dest addr=%pI4",
3948                            cm_info.rem_addr);
3949        else
3950                i40iw_debug(&iwdev->sc_dev,
3951                            I40IW_DEBUG_CM,
3952                            "Api - connect() FAILED: dest addr=%pI6",
3953                            cm_info.rem_addr);
3954
3955        i40iw_rem_ref_cm_node(cm_node);
3956        cm_id->rem_ref(cm_id);
3957        iwdev->cm_core.stats_connect_errs++;
3958        return ret;
3959}
3960
3961/**
3962 * i40iw_create_listen - registered call creating listener
3963 * @cm_id: cm information for passive connection
3964 * @backlog: to max accept pending count
3965 */
3966int i40iw_create_listen(struct iw_cm_id *cm_id, int backlog)
3967{
3968        struct i40iw_device *iwdev;
3969        struct i40iw_cm_listener *cm_listen_node;
3970        struct i40iw_cm_info cm_info;
3971        enum i40iw_status_code ret;
3972        struct sockaddr_in *laddr;
3973        struct sockaddr_in6 *laddr6;
3974        bool wildcard = false;
3975
3976        iwdev = to_iwdev(cm_id->device);
3977        if (!iwdev)
3978                return -EINVAL;
3979
3980        laddr = (struct sockaddr_in *)&cm_id->m_local_addr;
3981        laddr6 = (struct sockaddr_in6 *)&cm_id->m_local_addr;
3982        memset(&cm_info, 0, sizeof(cm_info));
3983        if (laddr->sin_family == AF_INET) {
3984                cm_info.ipv4 = true;
3985                cm_info.loc_addr[0] = ntohl(laddr->sin_addr.s_addr);
3986                cm_info.loc_port = ntohs(laddr->sin_port);
3987
3988                if (laddr->sin_addr.s_addr != INADDR_ANY)
3989                        cm_info.vlan_id = i40iw_get_vlan_ipv4(cm_info.loc_addr);
3990                else
3991                        wildcard = true;
3992
3993        } else {
3994                cm_info.ipv4 = false;
3995                i40iw_copy_ip_ntohl(cm_info.loc_addr,
3996                                    laddr6->sin6_addr.in6_u.u6_addr32);
3997                cm_info.loc_port = ntohs(laddr6->sin6_port);
3998                if (ipv6_addr_type(&laddr6->sin6_addr) != IPV6_ADDR_ANY)
3999                        i40iw_netdev_vlan_ipv6(cm_info.loc_addr,
4000                                               &cm_info.vlan_id);
4001                else
4002                        wildcard = true;
4003        }
4004        cm_info.backlog = backlog;
4005        cm_info.cm_id = cm_id;
4006
4007        cm_listen_node = i40iw_make_listen_node(&iwdev->cm_core, iwdev, &cm_info);
4008        if (!cm_listen_node) {
4009                i40iw_pr_err("cm_listen_node == NULL\n");
4010                return -ENOMEM;
4011        }
4012
4013        cm_id->provider_data = cm_listen_node;
4014
4015        cm_listen_node->tos = cm_id->tos;
4016        cm_listen_node->user_pri = rt_tos2priority(cm_id->tos);
4017        cm_info.user_pri = cm_listen_node->user_pri;
4018
4019        if (!cm_listen_node->reused_node) {
4020                if (wildcard) {
4021                        if (cm_info.ipv4)
4022                                ret = i40iw_add_mqh_4(iwdev,
4023                                                      &cm_info,
4024                                                      cm_listen_node);
4025                        else
4026                                ret = i40iw_add_mqh_6(iwdev,
4027                                                      &cm_info,
4028                                                      cm_listen_node);
4029                        if (ret)
4030                                goto error;
4031
4032                        ret = i40iw_manage_apbvt(iwdev,
4033                                                 cm_info.loc_port,
4034                                                 I40IW_MANAGE_APBVT_ADD);
4035
4036                        if (ret)
4037                                goto error;
4038                } else {
4039                        ret = i40iw_manage_qhash(iwdev,
4040                                                 &cm_info,
4041                                                 I40IW_QHASH_TYPE_TCP_SYN,
4042                                                 I40IW_QHASH_MANAGE_TYPE_ADD,
4043                                                 NULL,
4044                                                 true);
4045                        if (ret)
4046                                goto error;
4047                        cm_listen_node->qhash_set = true;
4048                        ret = i40iw_manage_apbvt(iwdev,
4049                                                 cm_info.loc_port,
4050                                                 I40IW_MANAGE_APBVT_ADD);
4051                        if (ret)
4052                                goto error;
4053                }
4054        }
4055        cm_id->add_ref(cm_id);
4056        cm_listen_node->cm_core->stats_listen_created++;
4057        return 0;
4058 error:
4059        i40iw_cm_del_listen(&iwdev->cm_core, (void *)cm_listen_node, false);
4060        return -EINVAL;
4061}
4062
4063/**
4064 * i40iw_destroy_listen - registered call to destroy listener
4065 * @cm_id: cm information for passive connection
4066 */
4067int i40iw_destroy_listen(struct iw_cm_id *cm_id)
4068{
4069        struct i40iw_device *iwdev;
4070
4071        iwdev = to_iwdev(cm_id->device);
4072        if (cm_id->provider_data)
4073                i40iw_cm_del_listen(&iwdev->cm_core, cm_id->provider_data, true);
4074        else
4075                i40iw_pr_err("cm_id->provider_data was NULL\n");
4076
4077        cm_id->rem_ref(cm_id);
4078
4079        return 0;
4080}
4081
4082/**
4083 * i40iw_cm_event_connected - handle connected active node
4084 * @event: the info for cm_node of connection
4085 */
4086static void i40iw_cm_event_connected(struct i40iw_cm_event *event)
4087{
4088        struct i40iw_qp *iwqp;
4089        struct i40iw_device *iwdev;
4090        struct i40iw_cm_core *cm_core;
4091        struct i40iw_cm_node *cm_node;
4092        struct i40iw_sc_dev *dev;
4093        struct ib_qp_attr attr;
4094        struct iw_cm_id *cm_id;
4095        unsigned long flags;
4096        int status;
4097        bool read0;
4098
4099        cm_node = event->cm_node;
4100        cm_id = cm_node->cm_id;
4101        iwqp = (struct i40iw_qp *)cm_id->provider_data;
4102        iwdev = to_iwdev(iwqp->ibqp.device);
4103        dev = &iwdev->sc_dev;
4104        cm_core = &iwdev->cm_core;
4105
4106        if (iwqp->destroyed) {
4107                status = -ETIMEDOUT;
4108                goto error;
4109        }
4110        i40iw_cm_init_tsa_conn(iwqp, cm_node);
4111        read0 = (cm_node->send_rdma0_op == SEND_RDMA_READ_ZERO);
4112        if (iwqp->page)
4113                iwqp->sc_qp.qp_uk.sq_base = kmap(iwqp->page);
4114        dev->iw_priv_qp_ops->qp_send_rtt(&iwqp->sc_qp, read0);
4115        if (iwqp->page)
4116                kunmap(iwqp->page);
4117
4118        memset(&attr, 0, sizeof(attr));
4119        attr.qp_state = IB_QPS_RTS;
4120        cm_node->qhash_set = false;
4121        i40iw_modify_qp(&iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4122
4123        cm_node->accelerated = true;
4124        spin_lock_irqsave(&cm_core->ht_lock, flags);
4125        list_move_tail(&cm_node->list, &cm_core->accelerated_list);
4126        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4127        status = i40iw_send_cm_event(cm_node, cm_id, IW_CM_EVENT_CONNECT_REPLY,
4128                                     0);
4129        if (status)
4130                i40iw_debug(dev, I40IW_DEBUG_CM, "error sending cm event - CONNECT_REPLY\n");
4131
4132        return;
4133
4134error:
4135        iwqp->cm_id = NULL;
4136        cm_id->provider_data = NULL;
4137        i40iw_send_cm_event(event->cm_node,
4138                            cm_id,
4139                            IW_CM_EVENT_CONNECT_REPLY,
4140                            status);
4141        cm_id->rem_ref(cm_id);
4142        i40iw_rem_ref_cm_node(event->cm_node);
4143}
4144
4145/**
4146 * i40iw_cm_event_reset - handle reset
4147 * @event: the info for cm_node of connection
4148 */
4149static void i40iw_cm_event_reset(struct i40iw_cm_event *event)
4150{
4151        struct i40iw_cm_node *cm_node = event->cm_node;
4152        struct iw_cm_id   *cm_id = cm_node->cm_id;
4153        struct i40iw_qp *iwqp;
4154
4155        if (!cm_id)
4156                return;
4157
4158        iwqp = cm_id->provider_data;
4159        if (!iwqp)
4160                return;
4161
4162        i40iw_debug(cm_node->dev,
4163                    I40IW_DEBUG_CM,
4164                    "reset event %p - cm_id = %p\n",
4165                     event->cm_node, cm_id);
4166        iwqp->cm_id = NULL;
4167
4168        i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_DISCONNECT, -ECONNRESET);
4169        i40iw_send_cm_event(cm_node, cm_node->cm_id, IW_CM_EVENT_CLOSE, 0);
4170}
4171
/**
 * i40iw_cm_event_handler - worker thread callback to send event to cm upper layer
 * @work: pointer of cm event info.
 *
 * Dispatches on the event type, then drops the cm_id and cm_node references
 * and frees the event. CONNECTED is acted on only for a node that has a
 * cm_id and is in the OFFLOADED state; MPA_REJECT and ABORTED only for a
 * node that has a cm_id and is not OFFLOADED.
 */
static void i40iw_cm_event_handler(struct work_struct *work)
{
        struct i40iw_cm_event *event = container_of(work,
                                                    struct i40iw_cm_event,
                                                    event_work);
        struct i40iw_cm_node *cm_node;

        if (!event || !event->cm_node || !event->cm_node->cm_core)
                return;

        cm_node = event->cm_node;

        switch (event->type) {
        case I40IW_CM_EVENT_MPA_REQ:
                i40iw_send_cm_event(cm_node, cm_node->cm_id,
                                    IW_CM_EVENT_CONNECT_REQUEST, 0);
                break;
        case I40IW_CM_EVENT_RESET:
                i40iw_cm_event_reset(event);
                break;
        case I40IW_CM_EVENT_CONNECTED:
                if (cm_node->cm_id &&
                    cm_node->state == I40IW_CM_STATE_OFFLOADED)
                        i40iw_cm_event_connected(event);
                break;
        case I40IW_CM_EVENT_MPA_REJECT:
                if (cm_node->cm_id &&
                    cm_node->state != I40IW_CM_STATE_OFFLOADED)
                        i40iw_send_cm_event(cm_node, cm_node->cm_id,
                                            IW_CM_EVENT_CONNECT_REPLY,
                                            -ECONNREFUSED);
                break;
        case I40IW_CM_EVENT_ABORTED:
                if (cm_node->cm_id &&
                    cm_node->state != I40IW_CM_STATE_OFFLOADED)
                        i40iw_event_connect_error(event);
                break;
        default:
                i40iw_pr_err("event type = %d\n", event->type);
                break;
        }

        /* release what i40iw_cm_post_event() took when the work was queued */
        event->cm_info.cm_id->rem_ref(event->cm_info.cm_id);
        i40iw_rem_ref_cm_node(event->cm_node);
        kfree(event);
}
4228
4229/**
4230 * i40iw_cm_post_event - queue event request for worker thread
4231 * @event: cm node's info for up event call
4232 */
4233static void i40iw_cm_post_event(struct i40iw_cm_event *event)
4234{
4235        atomic_inc(&event->cm_node->ref_count);
4236        event->cm_info.cm_id->add_ref(event->cm_info.cm_id);
4237        INIT_WORK(&event->event_work, i40iw_cm_event_handler);
4238
4239        queue_work(event->cm_node->cm_core->event_wq, &event->event_work);
4240}
4241
4242/**
4243 * i40iw_qhash_ctrl - enable/disable qhash for list
4244 * @iwdev: device pointer
4245 * @parent_listen_node: parent listen node
4246 * @nfo: cm info node
4247 * @ipaddr: Pointer to IPv4 or IPv6 address
4248 * @ipv4: flag indicating IPv4 when true
4249 * @ifup: flag indicating interface up when true
4250 *
4251 * Enables or disables the qhash for the node in the child
4252 * listen list that matches ipaddr. If no matching IP was found
4253 * it will allocate and add a new child listen node to the
4254 * parent listen node. The listen_list_lock is assumed to be
4255 * held when called.
4256 */
4257static void i40iw_qhash_ctrl(struct i40iw_device *iwdev,
4258                             struct i40iw_cm_listener *parent_listen_node,
4259                             struct i40iw_cm_info *nfo,
4260                             u32 *ipaddr, bool ipv4, bool ifup)
4261{
4262        struct list_head *child_listen_list = &parent_listen_node->child_listen_list;
4263        struct i40iw_cm_listener *child_listen_node;
4264        struct list_head *pos, *tpos;
4265        enum i40iw_status_code ret;
4266        bool node_allocated = false;
4267        enum i40iw_quad_hash_manage_type op =
4268                ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4269
4270        list_for_each_safe(pos, tpos, child_listen_list) {
4271                child_listen_node =
4272                        list_entry(pos,
4273                                   struct i40iw_cm_listener,
4274                                   child_listen_list);
4275                if (!memcmp(child_listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16))
4276                        goto set_qhash;
4277        }
4278
4279        /* if not found then add a child listener if interface is going up */
4280        if (!ifup)
4281                return;
4282        child_listen_node = kmemdup(parent_listen_node,
4283                        sizeof(*child_listen_node), GFP_ATOMIC);
4284        if (!child_listen_node)
4285                return;
4286        node_allocated = true;
4287
4288        memcpy(child_listen_node->loc_addr, ipaddr,  ipv4 ? 4 : 16);
4289
4290set_qhash:
4291        memcpy(nfo->loc_addr,
4292               child_listen_node->loc_addr,
4293               sizeof(nfo->loc_addr));
4294        nfo->vlan_id = child_listen_node->vlan_id;
4295        ret = i40iw_manage_qhash(iwdev, nfo,
4296                                 I40IW_QHASH_TYPE_TCP_SYN,
4297                                 op,
4298                                 NULL, false);
4299        if (!ret) {
4300                child_listen_node->qhash_set = ifup;
4301                if (node_allocated)
4302                        list_add(&child_listen_node->child_listen_list,
4303                                 &parent_listen_node->child_listen_list);
4304        } else if (node_allocated) {
4305                kfree(child_listen_node);
4306        }
4307}
4308
4309/**
4310 * i40iw_cm_teardown_connections - teardown QPs
4311 * @iwdev: device pointer
4312 * @ipaddr: Pointer to IPv4 or IPv6 address
4313 * @ipv4: flag indicating IPv4 when true
4314 * @disconnect_all: flag indicating disconnect all QPs
4315 * teardown QPs where source or destination addr matches ip addr
4316 */
4317void i40iw_cm_teardown_connections(struct i40iw_device *iwdev, u32 *ipaddr,
4318                                   struct i40iw_cm_info *nfo,
4319                                   bool disconnect_all)
4320{
4321        struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4322        struct list_head *list_core_temp;
4323        struct list_head *list_node;
4324        struct i40iw_cm_node *cm_node;
4325        unsigned long flags;
4326        struct list_head teardown_list;
4327        struct ib_qp_attr attr;
4328
4329        INIT_LIST_HEAD(&teardown_list);
4330        spin_lock_irqsave(&cm_core->ht_lock, flags);
4331        list_for_each_safe(list_node, list_core_temp,
4332                           &cm_core->accelerated_list) {
4333                cm_node = container_of(list_node, struct i40iw_cm_node, list);
4334                if (disconnect_all ||
4335                    (nfo->vlan_id == cm_node->vlan_id &&
4336                    (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4337                     !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4338                        atomic_inc(&cm_node->ref_count);
4339                        list_add(&cm_node->teardown_entry, &teardown_list);
4340                }
4341        }
4342        list_for_each_safe(list_node, list_core_temp,
4343                           &cm_core->non_accelerated_list) {
4344                cm_node = container_of(list_node, struct i40iw_cm_node, list);
4345                if (disconnect_all ||
4346                    (nfo->vlan_id == cm_node->vlan_id &&
4347                    (!memcmp(cm_node->loc_addr, ipaddr, nfo->ipv4 ? 4 : 16) ||
4348                     !memcmp(cm_node->rem_addr, ipaddr, nfo->ipv4 ? 4 : 16)))) {
4349                        atomic_inc(&cm_node->ref_count);
4350                        list_add(&cm_node->teardown_entry, &teardown_list);
4351                }
4352        }
4353        spin_unlock_irqrestore(&cm_core->ht_lock, flags);
4354
4355        list_for_each_safe(list_node, list_core_temp, &teardown_list) {
4356                cm_node = container_of(list_node, struct i40iw_cm_node,
4357                                       teardown_entry);
4358                attr.qp_state = IB_QPS_ERR;
4359                i40iw_modify_qp(&cm_node->iwqp->ibqp, &attr, IB_QP_STATE, NULL);
4360                if (iwdev->reset)
4361                        i40iw_cm_disconn(cm_node->iwqp);
4362                i40iw_rem_ref_cm_node(cm_node);
4363        }
4364}
4365
4366/**
4367 * i40iw_ifdown_notify - process an ifdown on an interface
4368 * @iwdev: device pointer
4369 * @ipaddr: Pointer to IPv4 or IPv6 address
4370 * @ipv4: flag indicating IPv4 when true
4371 * @ifup: flag indicating interface up when true
4372 */
4373void i40iw_if_notify(struct i40iw_device *iwdev, struct net_device *netdev,
4374                     u32 *ipaddr, bool ipv4, bool ifup)
4375{
4376        struct i40iw_cm_core *cm_core = &iwdev->cm_core;
4377        unsigned long flags;
4378        struct i40iw_cm_listener *listen_node;
4379        static const u32 ip_zero[4] = { 0, 0, 0, 0 };
4380        struct i40iw_cm_info nfo;
4381        u16 vlan_id = rdma_vlan_dev_vlan_id(netdev);
4382        enum i40iw_status_code ret;
4383        enum i40iw_quad_hash_manage_type op =
4384                ifup ? I40IW_QHASH_MANAGE_TYPE_ADD : I40IW_QHASH_MANAGE_TYPE_DELETE;
4385
4386        nfo.vlan_id = vlan_id;
4387        nfo.ipv4 = ipv4;
4388
4389        /* Disable or enable qhash for listeners */
4390        spin_lock_irqsave(&cm_core->listen_list_lock, flags);
4391        list_for_each_entry(listen_node, &cm_core->listen_nodes, list) {
4392                if (vlan_id == listen_node->vlan_id &&
4393                    (!memcmp(listen_node->loc_addr, ipaddr, ipv4 ? 4 : 16) ||
4394                    !memcmp(listen_node->loc_addr, ip_zero, ipv4 ? 4 : 16))) {
4395                        memcpy(nfo.loc_addr, listen_node->loc_addr,
4396                               sizeof(nfo.loc_addr));
4397                        nfo.loc_port = listen_node->loc_port;
4398                        nfo.user_pri = listen_node->user_pri;
4399                        if (!list_empty(&listen_node->child_listen_list)) {
4400                                i40iw_qhash_ctrl(iwdev,
4401                                                 listen_node,
4402                                                 &nfo,
4403                                                 ipaddr, ipv4, ifup);
4404                        } else if (memcmp(listen_node->loc_addr, ip_zero,
4405                                          ipv4 ? 4 : 16)) {
4406                                ret = i40iw_manage_qhash(iwdev,
4407                                                         &nfo,
4408                                                         I40IW_QHASH_TYPE_TCP_SYN,
4409                                                         op,
4410                                                         NULL,
4411                                                         false);
4412                                if (!ret)
4413                                        listen_node->qhash_set = ifup;
4414                        }
4415                }
4416        }
4417        spin_unlock_irqrestore(&cm_core->listen_list_lock, flags);
4418
4419        /* teardown connected qp's on ifdown */
4420        if (!ifup)
4421                i40iw_cm_teardown_connections(iwdev, ipaddr, &nfo, false);
4422}
4423