linux/net/dccp/output.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0-or-later
   2/*
   3 *  net/dccp/output.c
   4 *
   5 *  An implementation of the DCCP protocol
   6 *  Arnaldo Carvalho de Melo <acme@conectiva.com.br>
   7 */
   8
   9#include <linux/dccp.h>
  10#include <linux/kernel.h>
  11#include <linux/skbuff.h>
  12#include <linux/slab.h>
  13#include <linux/sched/signal.h>
  14
  15#include <net/inet_sock.h>
  16#include <net/sock.h>
  17
  18#include "ackvec.h"
  19#include "ccid.h"
  20#include "dccp.h"
  21
  22static inline void dccp_event_ack_sent(struct sock *sk)
  23{
  24        inet_csk_clear_xmit_timer(sk, ICSK_TIME_DACK);
  25}
  26
  27/* enqueue @skb on sk_send_head for retransmission, return clone to send now */
  28static struct sk_buff *dccp_skb_entail(struct sock *sk, struct sk_buff *skb)
  29{
  30        skb_set_owner_w(skb, sk);
  31        WARN_ON(sk->sk_send_head);
  32        sk->sk_send_head = skb;
  33        return skb_clone(sk->sk_send_head, gfp_any());
  34}
  35
  36/*
  37 * All SKB's seen here are completely headerless. It is our
  38 * job to build the DCCP header, and pass the packet down to
  39 * IP so it can do the same plus pass the packet off to the
  40 * device.
  41 */
  42static int dccp_transmit_skb(struct sock *sk, struct sk_buff *skb)
  43{
  44        if (likely(skb != NULL)) {
  45                struct inet_sock *inet = inet_sk(sk);
  46                const struct inet_connection_sock *icsk = inet_csk(sk);
  47                struct dccp_sock *dp = dccp_sk(sk);
  48                struct dccp_skb_cb *dcb = DCCP_SKB_CB(skb);
  49                struct dccp_hdr *dh;
  50                /* XXX For now we're using only 48 bits sequence numbers */
  51                const u32 dccp_header_size = sizeof(*dh) +
  52                                             sizeof(struct dccp_hdr_ext) +
  53                                          dccp_packet_hdr_len(dcb->dccpd_type);
  54                int err, set_ack = 1;
  55                u64 ackno = dp->dccps_gsr;
  56                /*
  57                 * Increment GSS here already in case the option code needs it.
  58                 * Update GSS for real only if option processing below succeeds.
  59                 */
  60                dcb->dccpd_seq = ADD48(dp->dccps_gss, 1);
  61
  62                switch (dcb->dccpd_type) {
  63                case DCCP_PKT_DATA:
  64                        set_ack = 0;
  65                        fallthrough;
  66                case DCCP_PKT_DATAACK:
  67                case DCCP_PKT_RESET:
  68                        break;
  69
  70                case DCCP_PKT_REQUEST:
  71                        set_ack = 0;
  72                        /* Use ISS on the first (non-retransmitted) Request. */
  73                        if (icsk->icsk_retransmits == 0)
  74                                dcb->dccpd_seq = dp->dccps_iss;
  75                        fallthrough;
  76
  77                case DCCP_PKT_SYNC:
  78                case DCCP_PKT_SYNCACK:
  79                        ackno = dcb->dccpd_ack_seq;
  80                        fallthrough;
  81                default:
  82                        /*
  83                         * Set owner/destructor: some skbs are allocated via
  84                         * alloc_skb (e.g. when retransmission may happen).
  85                         * Only Data, DataAck, and Reset packets should come
  86                         * through here with skb->sk set.
  87                         */
  88                        WARN_ON(skb->sk);
  89                        skb_set_owner_w(skb, sk);
  90                        break;
  91                }
  92
  93                if (dccp_insert_options(sk, skb)) {
  94                        kfree_skb(skb);
  95                        return -EPROTO;
  96                }
  97
  98
  99                /* Build DCCP header and checksum it. */
 100                dh = dccp_zeroed_hdr(skb, dccp_header_size);
 101                dh->dccph_type  = dcb->dccpd_type;
 102                dh->dccph_sport = inet->inet_sport;
 103                dh->dccph_dport = inet->inet_dport;
 104                dh->dccph_doff  = (dccp_header_size + dcb->dccpd_opt_len) / 4;
 105                dh->dccph_ccval = dcb->dccpd_ccval;
 106                dh->dccph_cscov = dp->dccps_pcslen;
 107                /* XXX For now we're using only 48 bits sequence numbers */
 108                dh->dccph_x     = 1;
 109
 110                dccp_update_gss(sk, dcb->dccpd_seq);
 111                dccp_hdr_set_seq(dh, dp->dccps_gss);
 112                if (set_ack)
 113                        dccp_hdr_set_ack(dccp_hdr_ack_bits(skb), ackno);
 114
 115                switch (dcb->dccpd_type) {
 116                case DCCP_PKT_REQUEST:
 117                        dccp_hdr_request(skb)->dccph_req_service =
 118                                                        dp->dccps_service;
 119                        /*
 120                         * Limit Ack window to ISS <= P.ackno <= GSS, so that
 121                         * only Responses to Requests we sent are considered.
 122                         */
 123                        dp->dccps_awl = dp->dccps_iss;
 124                        break;
 125                case DCCP_PKT_RESET:
 126                        dccp_hdr_reset(skb)->dccph_reset_code =
 127                                                        dcb->dccpd_reset_code;
 128                        break;
 129                }
 130
 131                icsk->icsk_af_ops->send_check(sk, skb);
 132
 133                if (set_ack)
 134                        dccp_event_ack_sent(sk);
 135
 136                DCCP_INC_STATS(DCCP_MIB_OUTSEGS);
 137
 138                err = icsk->icsk_af_ops->queue_xmit(sk, skb, &inet->cork.fl);
 139                return net_xmit_eval(err);
 140        }
 141        return -ENOBUFS;
 142}
 143
 144/**
 145 * dccp_determine_ccmps  -  Find out about CCID-specific packet-size limits
 146 * @dp: socket to find packet size limits of
 147 *
 148 * We only consider the HC-sender CCID for setting the CCMPS (RFC 4340, 14.),
 149 * since the RX CCID is restricted to feedback packets (Acks), which are small
 150 * in comparison with the data traffic. A value of 0 means "no current CCMPS".
 151 */
 152static u32 dccp_determine_ccmps(const struct dccp_sock *dp)
 153{
 154        const struct ccid *tx_ccid = dp->dccps_hc_tx_ccid;
 155
 156        if (tx_ccid == NULL || tx_ccid->ccid_ops == NULL)
 157                return 0;
 158        return tx_ccid->ccid_ops->ccid_ccmps;
 159}
 160
 161unsigned int dccp_sync_mss(struct sock *sk, u32 pmtu)
 162{
 163        struct inet_connection_sock *icsk = inet_csk(sk);
 164        struct dccp_sock *dp = dccp_sk(sk);
 165        u32 ccmps = dccp_determine_ccmps(dp);
 166        u32 cur_mps = ccmps ? min(pmtu, ccmps) : pmtu;
 167
 168        /* Account for header lengths and IPv4/v6 option overhead */
 169        cur_mps -= (icsk->icsk_af_ops->net_header_len + icsk->icsk_ext_hdr_len +
 170                    sizeof(struct dccp_hdr) + sizeof(struct dccp_hdr_ext));
 171
 172        /*
 173         * Leave enough headroom for common DCCP header options.
 174         * This only considers options which may appear on DCCP-Data packets, as
 175         * per table 3 in RFC 4340, 5.8. When running out of space for other
 176         * options (eg. Ack Vector which can take up to 255 bytes), it is better
 177         * to schedule a separate Ack. Thus we leave headroom for the following:
 178         *  - 1 byte for Slow Receiver (11.6)
 179         *  - 6 bytes for Timestamp (13.1)
 180         *  - 10 bytes for Timestamp Echo (13.3)
 181         *  - 8 bytes for NDP count (7.7, when activated)
 182         *  - 6 bytes for Data Checksum (9.3)
 183         *  - %DCCPAV_MIN_OPTLEN bytes for Ack Vector size (11.4, when enabled)
 184         */
 185        cur_mps -= roundup(1 + 6 + 10 + dp->dccps_send_ndp_count * 8 + 6 +
 186                           (dp->dccps_hc_rx_ackvec ? DCCPAV_MIN_OPTLEN : 0), 4);
 187
 188        /* And store cached results */
 189        icsk->icsk_pmtu_cookie = pmtu;
 190        dp->dccps_mss_cache = cur_mps;
 191
 192        return cur_mps;
 193}
 194
 195EXPORT_SYMBOL_GPL(dccp_sync_mss);
 196
 197void dccp_write_space(struct sock *sk)
 198{
 199        struct socket_wq *wq;
 200
 201        rcu_read_lock();
 202        wq = rcu_dereference(sk->sk_wq);
 203        if (skwq_has_sleeper(wq))
 204                wake_up_interruptible(&wq->wait);
 205        /* Should agree with poll, otherwise some programs break */
 206        if (sock_writeable(sk))
 207                sk_wake_async(sk, SOCK_WAKE_SPACE, POLL_OUT);
 208
 209        rcu_read_unlock();
 210}
 211
 212/**
 213 * dccp_wait_for_ccid  -  Await CCID send permission
 214 * @sk:    socket to wait for
 215 * @delay: timeout in jiffies
 216 *
 217 * This is used by CCIDs which need to delay the send time in process context.
 218 */
 219static int dccp_wait_for_ccid(struct sock *sk, unsigned long delay)
 220{
 221        DEFINE_WAIT(wait);
 222        long remaining;
 223
 224        prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
 225        sk->sk_write_pending++;
 226        release_sock(sk);
 227
 228        remaining = schedule_timeout(delay);
 229
 230        lock_sock(sk);
 231        sk->sk_write_pending--;
 232        finish_wait(sk_sleep(sk), &wait);
 233
 234        if (signal_pending(current) || sk->sk_err)
 235                return -1;
 236        return remaining;
 237}
 238
 239/**
 240 * dccp_xmit_packet  -  Send data packet under control of CCID
 241 * @sk: socket to send data packet on
 242 *
 243 * Transmits next-queued payload and informs CCID to account for the packet.
 244 */
 245static void dccp_xmit_packet(struct sock *sk)
 246{
 247        int err, len;
 248        struct dccp_sock *dp = dccp_sk(sk);
 249        struct sk_buff *skb = dccp_qpolicy_pop(sk);
 250
 251        if (unlikely(skb == NULL))
 252                return;
 253        len = skb->len;
 254
 255        if (sk->sk_state == DCCP_PARTOPEN) {
 256                const u32 cur_mps = dp->dccps_mss_cache - DCCP_FEATNEG_OVERHEAD;
 257                /*
 258                 * See 8.1.5 - Handshake Completion.
 259                 *
 260                 * For robustness we resend Confirm options until the client has
 261                 * entered OPEN. During the initial feature negotiation, the MPS
 262                 * is smaller than usual, reduced by the Change/Confirm options.
 263                 */
 264                if (!list_empty(&dp->dccps_featneg) && len > cur_mps) {
 265                        DCCP_WARN("Payload too large (%d) for featneg.\n", len);
 266                        dccp_send_ack(sk);
 267                        dccp_feat_list_purge(&dp->dccps_featneg);
 268                }
 269
 270                inet_csk_schedule_ack(sk);
 271                inet_csk_reset_xmit_timer(sk, ICSK_TIME_DACK,
 272                                              inet_csk(sk)->icsk_rto,
 273                                              DCCP_RTO_MAX);
 274                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_DATAACK;
 275        } else if (dccp_ack_pending(sk)) {
 276                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_DATAACK;
 277        } else {
 278                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_DATA;
 279        }
 280
 281        err = dccp_transmit_skb(sk, skb);
 282        if (err)
 283                dccp_pr_debug("transmit_skb() returned err=%d\n", err);
 284        /*
 285         * Register this one as sent even if an error occurred. To the remote
 286         * end a local packet drop is indistinguishable from network loss, i.e.
 287         * any local drop will eventually be reported via receiver feedback.
 288         */
 289        ccid_hc_tx_packet_sent(dp->dccps_hc_tx_ccid, sk, len);
 290
 291        /*
 292         * If the CCID needs to transfer additional header options out-of-band
 293         * (e.g. Ack Vectors or feature-negotiation options), it activates this
 294         * flag to schedule a Sync. The Sync will automatically incorporate all
 295         * currently pending header options, thus clearing the backlog.
 296         */
 297        if (dp->dccps_sync_scheduled)
 298                dccp_send_sync(sk, dp->dccps_gsr, DCCP_PKT_SYNC);
 299}
 300
 301/**
 302 * dccp_flush_write_queue  -  Drain queue at end of connection
 303 * @sk: socket to be drained
 304 * @time_budget: time allowed to drain the queue
 305 *
 306 * Since dccp_sendmsg queues packets without waiting for them to be sent, it may
 307 * happen that the TX queue is not empty at the end of a connection. We give the
 308 * HC-sender CCID a grace period of up to @time_budget jiffies. If this function
 309 * returns with a non-empty write queue, it will be purged later.
 310 */
 311void dccp_flush_write_queue(struct sock *sk, long *time_budget)
 312{
 313        struct dccp_sock *dp = dccp_sk(sk);
 314        struct sk_buff *skb;
 315        long delay, rc;
 316
 317        while (*time_budget > 0 && (skb = skb_peek(&sk->sk_write_queue))) {
 318                rc = ccid_hc_tx_send_packet(dp->dccps_hc_tx_ccid, sk, skb);
 319
 320                switch (ccid_packet_dequeue_eval(rc)) {
 321                case CCID_PACKET_WILL_DEQUEUE_LATER:
 322                        /*
 323                         * If the CCID determines when to send, the next sending
 324                         * time is unknown or the CCID may not even send again
 325                         * (e.g. remote host crashes or lost Ack packets).
 326                         */
 327                        DCCP_WARN("CCID did not manage to send all packets\n");
 328                        return;
 329                case CCID_PACKET_DELAY:
 330                        delay = msecs_to_jiffies(rc);
 331                        if (delay > *time_budget)
 332                                return;
 333                        rc = dccp_wait_for_ccid(sk, delay);
 334                        if (rc < 0)
 335                                return;
 336                        *time_budget -= (delay - rc);
 337                        /* check again if we can send now */
 338                        break;
 339                case CCID_PACKET_SEND_AT_ONCE:
 340                        dccp_xmit_packet(sk);
 341                        break;
 342                case CCID_PACKET_ERR:
 343                        skb_dequeue(&sk->sk_write_queue);
 344                        kfree_skb(skb);
 345                        dccp_pr_debug("packet discarded due to err=%ld\n", rc);
 346                }
 347        }
 348}
 349
 350void dccp_write_xmit(struct sock *sk)
 351{
 352        struct dccp_sock *dp = dccp_sk(sk);
 353        struct sk_buff *skb;
 354
 355        while ((skb = dccp_qpolicy_top(sk))) {
 356                int rc = ccid_hc_tx_send_packet(dp->dccps_hc_tx_ccid, sk, skb);
 357
 358                switch (ccid_packet_dequeue_eval(rc)) {
 359                case CCID_PACKET_WILL_DEQUEUE_LATER:
 360                        return;
 361                case CCID_PACKET_DELAY:
 362                        sk_reset_timer(sk, &dp->dccps_xmit_timer,
 363                                       jiffies + msecs_to_jiffies(rc));
 364                        return;
 365                case CCID_PACKET_SEND_AT_ONCE:
 366                        dccp_xmit_packet(sk);
 367                        break;
 368                case CCID_PACKET_ERR:
 369                        dccp_qpolicy_drop(sk, skb);
 370                        dccp_pr_debug("packet discarded due to err=%d\n", rc);
 371                }
 372        }
 373}
 374
 375/**
 376 * dccp_retransmit_skb  -  Retransmit Request, Close, or CloseReq packets
 377 * @sk: socket to perform retransmit on
 378 *
 379 * There are only four retransmittable packet types in DCCP:
 380 * - Request  in client-REQUEST  state (sec. 8.1.1),
 381 * - CloseReq in server-CLOSEREQ state (sec. 8.3),
 382 * - Close    in   node-CLOSING  state (sec. 8.3),
 383 * - Acks in client-PARTOPEN state (sec. 8.1.5, handled by dccp_delack_timer()).
 384 * This function expects sk->sk_send_head to contain the original skb.
 385 */
 386int dccp_retransmit_skb(struct sock *sk)
 387{
 388        WARN_ON(sk->sk_send_head == NULL);
 389
 390        if (inet_csk(sk)->icsk_af_ops->rebuild_header(sk) != 0)
 391                return -EHOSTUNREACH; /* Routing failure or similar. */
 392
 393        /* this count is used to distinguish original and retransmitted skb */
 394        inet_csk(sk)->icsk_retransmits++;
 395
 396        return dccp_transmit_skb(sk, skb_clone(sk->sk_send_head, GFP_ATOMIC));
 397}
 398
 399struct sk_buff *dccp_make_response(const struct sock *sk, struct dst_entry *dst,
 400                                   struct request_sock *req)
 401{
 402        struct dccp_hdr *dh;
 403        struct dccp_request_sock *dreq;
 404        const u32 dccp_header_size = sizeof(struct dccp_hdr) +
 405                                     sizeof(struct dccp_hdr_ext) +
 406                                     sizeof(struct dccp_hdr_response);
 407        struct sk_buff *skb;
 408
 409        /* sk is marked const to clearly express we dont hold socket lock.
 410         * sock_wmalloc() will atomically change sk->sk_wmem_alloc,
 411         * it is safe to promote sk to non const.
 412         */
 413        skb = sock_wmalloc((struct sock *)sk, MAX_DCCP_HEADER, 1,
 414                           GFP_ATOMIC);
 415        if (!skb)
 416                return NULL;
 417
 418        skb_reserve(skb, MAX_DCCP_HEADER);
 419
 420        skb_dst_set(skb, dst_clone(dst));
 421
 422        dreq = dccp_rsk(req);
 423        if (inet_rsk(req)->acked)       /* increase GSS upon retransmission */
 424                dccp_inc_seqno(&dreq->dreq_gss);
 425        DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_RESPONSE;
 426        DCCP_SKB_CB(skb)->dccpd_seq  = dreq->dreq_gss;
 427
 428        /* Resolve feature dependencies resulting from choice of CCID */
 429        if (dccp_feat_server_ccid_dependencies(dreq))
 430                goto response_failed;
 431
 432        if (dccp_insert_options_rsk(dreq, skb))
 433                goto response_failed;
 434
 435        /* Build and checksum header */
 436        dh = dccp_zeroed_hdr(skb, dccp_header_size);
 437
 438        dh->dccph_sport = htons(inet_rsk(req)->ir_num);
 439        dh->dccph_dport = inet_rsk(req)->ir_rmt_port;
 440        dh->dccph_doff  = (dccp_header_size +
 441                           DCCP_SKB_CB(skb)->dccpd_opt_len) / 4;
 442        dh->dccph_type  = DCCP_PKT_RESPONSE;
 443        dh->dccph_x     = 1;
 444        dccp_hdr_set_seq(dh, dreq->dreq_gss);
 445        dccp_hdr_set_ack(dccp_hdr_ack_bits(skb), dreq->dreq_gsr);
 446        dccp_hdr_response(skb)->dccph_resp_service = dreq->dreq_service;
 447
 448        dccp_csum_outgoing(skb);
 449
 450        /* We use `acked' to remember that a Response was already sent. */
 451        inet_rsk(req)->acked = 1;
 452        DCCP_INC_STATS(DCCP_MIB_OUTSEGS);
 453        return skb;
 454response_failed:
 455        kfree_skb(skb);
 456        return NULL;
 457}
 458
 459EXPORT_SYMBOL_GPL(dccp_make_response);
 460
 461/* answer offending packet in @rcv_skb with Reset from control socket @ctl */
 462struct sk_buff *dccp_ctl_make_reset(struct sock *sk, struct sk_buff *rcv_skb)
 463{
 464        struct dccp_hdr *rxdh = dccp_hdr(rcv_skb), *dh;
 465        struct dccp_skb_cb *dcb = DCCP_SKB_CB(rcv_skb);
 466        const u32 dccp_hdr_reset_len = sizeof(struct dccp_hdr) +
 467                                       sizeof(struct dccp_hdr_ext) +
 468                                       sizeof(struct dccp_hdr_reset);
 469        struct dccp_hdr_reset *dhr;
 470        struct sk_buff *skb;
 471
 472        skb = alloc_skb(sk->sk_prot->max_header, GFP_ATOMIC);
 473        if (skb == NULL)
 474                return NULL;
 475
 476        skb_reserve(skb, sk->sk_prot->max_header);
 477
 478        /* Swap the send and the receive. */
 479        dh = dccp_zeroed_hdr(skb, dccp_hdr_reset_len);
 480        dh->dccph_type  = DCCP_PKT_RESET;
 481        dh->dccph_sport = rxdh->dccph_dport;
 482        dh->dccph_dport = rxdh->dccph_sport;
 483        dh->dccph_doff  = dccp_hdr_reset_len / 4;
 484        dh->dccph_x     = 1;
 485
 486        dhr = dccp_hdr_reset(skb);
 487        dhr->dccph_reset_code = dcb->dccpd_reset_code;
 488
 489        switch (dcb->dccpd_reset_code) {
 490        case DCCP_RESET_CODE_PACKET_ERROR:
 491                dhr->dccph_reset_data[0] = rxdh->dccph_type;
 492                break;
 493        case DCCP_RESET_CODE_OPTION_ERROR:
 494        case DCCP_RESET_CODE_MANDATORY_ERROR:
 495                memcpy(dhr->dccph_reset_data, dcb->dccpd_reset_data, 3);
 496                break;
 497        }
 498        /*
 499         * From RFC 4340, 8.3.1:
 500         *   If P.ackno exists, set R.seqno := P.ackno + 1.
 501         *   Else set R.seqno := 0.
 502         */
 503        if (dcb->dccpd_ack_seq != DCCP_PKT_WITHOUT_ACK_SEQ)
 504                dccp_hdr_set_seq(dh, ADD48(dcb->dccpd_ack_seq, 1));
 505        dccp_hdr_set_ack(dccp_hdr_ack_bits(skb), dcb->dccpd_seq);
 506
 507        dccp_csum_outgoing(skb);
 508        return skb;
 509}
 510
 511EXPORT_SYMBOL_GPL(dccp_ctl_make_reset);
 512
 513/* send Reset on established socket, to close or abort the connection */
 514int dccp_send_reset(struct sock *sk, enum dccp_reset_codes code)
 515{
 516        struct sk_buff *skb;
 517        /*
 518         * FIXME: what if rebuild_header fails?
 519         * Should we be doing a rebuild_header here?
 520         */
 521        int err = inet_csk(sk)->icsk_af_ops->rebuild_header(sk);
 522
 523        if (err != 0)
 524                return err;
 525
 526        skb = sock_wmalloc(sk, sk->sk_prot->max_header, 1, GFP_ATOMIC);
 527        if (skb == NULL)
 528                return -ENOBUFS;
 529
 530        /* Reserve space for headers and prepare control bits. */
 531        skb_reserve(skb, sk->sk_prot->max_header);
 532        DCCP_SKB_CB(skb)->dccpd_type       = DCCP_PKT_RESET;
 533        DCCP_SKB_CB(skb)->dccpd_reset_code = code;
 534
 535        return dccp_transmit_skb(sk, skb);
 536}
 537
 538/*
 539 * Do all connect socket setups that can be done AF independent.
 540 */
 541int dccp_connect(struct sock *sk)
 542{
 543        struct sk_buff *skb;
 544        struct dccp_sock *dp = dccp_sk(sk);
 545        struct dst_entry *dst = __sk_dst_get(sk);
 546        struct inet_connection_sock *icsk = inet_csk(sk);
 547
 548        sk->sk_err = 0;
 549        sock_reset_flag(sk, SOCK_DONE);
 550
 551        dccp_sync_mss(sk, dst_mtu(dst));
 552
 553        /* do not connect if feature negotiation setup fails */
 554        if (dccp_feat_finalise_settings(dccp_sk(sk)))
 555                return -EPROTO;
 556
 557        /* Initialise GAR as per 8.5; AWL/AWH are set in dccp_transmit_skb() */
 558        dp->dccps_gar = dp->dccps_iss;
 559
 560        skb = alloc_skb(sk->sk_prot->max_header, sk->sk_allocation);
 561        if (unlikely(skb == NULL))
 562                return -ENOBUFS;
 563
 564        /* Reserve space for headers. */
 565        skb_reserve(skb, sk->sk_prot->max_header);
 566
 567        DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_REQUEST;
 568
 569        dccp_transmit_skb(sk, dccp_skb_entail(sk, skb));
 570        DCCP_INC_STATS(DCCP_MIB_ACTIVEOPENS);
 571
 572        /* Timer for repeating the REQUEST until an answer. */
 573        icsk->icsk_retransmits = 0;
 574        inet_csk_reset_xmit_timer(sk, ICSK_TIME_RETRANS,
 575                                  icsk->icsk_rto, DCCP_RTO_MAX);
 576        return 0;
 577}
 578
 579EXPORT_SYMBOL_GPL(dccp_connect);
 580
 581void dccp_send_ack(struct sock *sk)
 582{
 583        /* If we have been reset, we may not send again. */
 584        if (sk->sk_state != DCCP_CLOSED) {
 585                struct sk_buff *skb = alloc_skb(sk->sk_prot->max_header,
 586                                                GFP_ATOMIC);
 587
 588                if (skb == NULL) {
 589                        inet_csk_schedule_ack(sk);
 590                        inet_csk(sk)->icsk_ack.ato = TCP_ATO_MIN;
 591                        inet_csk_reset_xmit_timer(sk, ICSK_TIME_DACK,
 592                                                  TCP_DELACK_MAX,
 593                                                  DCCP_RTO_MAX);
 594                        return;
 595                }
 596
 597                /* Reserve space for headers */
 598                skb_reserve(skb, sk->sk_prot->max_header);
 599                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_ACK;
 600                dccp_transmit_skb(sk, skb);
 601        }
 602}
 603
 604EXPORT_SYMBOL_GPL(dccp_send_ack);
 605
 606#if 0
 607/* FIXME: Is this still necessary (11.3) - currently nowhere used by DCCP. */
 608void dccp_send_delayed_ack(struct sock *sk)
 609{
 610        struct inet_connection_sock *icsk = inet_csk(sk);
 611        /*
 612         * FIXME: tune this timer. elapsed time fixes the skew, so no problem
 613         * with using 2s, and active senders also piggyback the ACK into a
 614         * DATAACK packet, so this is really for quiescent senders.
 615         */
 616        unsigned long timeout = jiffies + 2 * HZ;
 617
 618        /* Use new timeout only if there wasn't a older one earlier. */
 619        if (icsk->icsk_ack.pending & ICSK_ACK_TIMER) {
 620                /* If delack timer was blocked or is about to expire,
 621                 * send ACK now.
 622                 *
 623                 * FIXME: check the "about to expire" part
 624                 */
 625                if (icsk->icsk_ack.blocked) {
 626                        dccp_send_ack(sk);
 627                        return;
 628                }
 629
 630                if (!time_before(timeout, icsk->icsk_ack.timeout))
 631                        timeout = icsk->icsk_ack.timeout;
 632        }
 633        icsk->icsk_ack.pending |= ICSK_ACK_SCHED | ICSK_ACK_TIMER;
 634        icsk->icsk_ack.timeout = timeout;
 635        sk_reset_timer(sk, &icsk->icsk_delack_timer, timeout);
 636}
 637#endif
 638
 639void dccp_send_sync(struct sock *sk, const u64 ackno,
 640                    const enum dccp_pkt_type pkt_type)
 641{
 642        /*
 643         * We are not putting this on the write queue, so
 644         * dccp_transmit_skb() will set the ownership to this
 645         * sock.
 646         */
 647        struct sk_buff *skb = alloc_skb(sk->sk_prot->max_header, GFP_ATOMIC);
 648
 649        if (skb == NULL) {
 650                /* FIXME: how to make sure the sync is sent? */
 651                DCCP_CRIT("could not send %s", dccp_packet_name(pkt_type));
 652                return;
 653        }
 654
 655        /* Reserve space for headers and prepare control bits. */
 656        skb_reserve(skb, sk->sk_prot->max_header);
 657        DCCP_SKB_CB(skb)->dccpd_type = pkt_type;
 658        DCCP_SKB_CB(skb)->dccpd_ack_seq = ackno;
 659
 660        /*
 661         * Clear the flag in case the Sync was scheduled for out-of-band data,
 662         * such as carrying a long Ack Vector.
 663         */
 664        dccp_sk(sk)->dccps_sync_scheduled = 0;
 665
 666        dccp_transmit_skb(sk, skb);
 667}
 668
 669EXPORT_SYMBOL_GPL(dccp_send_sync);
 670
 671/*
 672 * Send a DCCP_PKT_CLOSE/CLOSEREQ. The caller locks the socket for us. This
 673 * cannot be allowed to fail queueing a DCCP_PKT_CLOSE/CLOSEREQ frame under
 674 * any circumstances.
 675 */
 676void dccp_send_close(struct sock *sk, const int active)
 677{
 678        struct dccp_sock *dp = dccp_sk(sk);
 679        struct sk_buff *skb;
 680        const gfp_t prio = active ? GFP_KERNEL : GFP_ATOMIC;
 681
 682        skb = alloc_skb(sk->sk_prot->max_header, prio);
 683        if (skb == NULL)
 684                return;
 685
 686        /* Reserve space for headers and prepare control bits. */
 687        skb_reserve(skb, sk->sk_prot->max_header);
 688        if (dp->dccps_role == DCCP_ROLE_SERVER && !dp->dccps_server_timewait)
 689                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_CLOSEREQ;
 690        else
 691                DCCP_SKB_CB(skb)->dccpd_type = DCCP_PKT_CLOSE;
 692
 693        if (active) {
 694                skb = dccp_skb_entail(sk, skb);
 695                /*
 696                 * Retransmission timer for active-close: RFC 4340, 8.3 requires
 697                 * to retransmit the Close/CloseReq until the CLOSING/CLOSEREQ
 698                 * state can be left. The initial timeout is 2 RTTs.
 699                 * Since RTT measurement is done by the CCIDs, there is no easy
 700                 * way to get an RTT sample. The fallback RTT from RFC 4340, 3.4
 701                 * is too low (200ms); we use a high value to avoid unnecessary
 702                 * retransmissions when the link RTT is > 0.2 seconds.
 703                 * FIXME: Let main module sample RTTs and use that instead.
 704                 */
 705                inet_csk_reset_xmit_timer(sk, ICSK_TIME_RETRANS,
 706                                          DCCP_TIMEOUT_INIT, DCCP_RTO_MAX);
 707        }
 708        dccp_transmit_skb(sk, skb);
 709}
 710