linux/net/ipv6/exthdrs.c
<<
>>
Prefs
   1/*
   2 *      Extension Header handling for IPv6
   3 *      Linux INET6 implementation
   4 *
   5 *      Authors:
   6 *      Pedro Roque             <roque@di.fc.ul.pt>
   7 *      Andi Kleen              <ak@muc.de>
   8 *      Alexey Kuznetsov        <kuznet@ms2.inr.ac.ru>
   9 *
  10 *      This program is free software; you can redistribute it and/or
  11 *      modify it under the terms of the GNU General Public License
  12 *      as published by the Free Software Foundation; either version
  13 *      2 of the License, or (at your option) any later version.
  14 */
  15
  16/* Changes:
  17 *      yoshfuji                : ensure not to overrun while parsing
  18 *                                tlv options.
  19 *      Mitsuru KANDA @USAGI and: Remove ipv6_parse_exthdrs().
  20 *      YOSHIFUJI Hideaki @USAGI  Register inbound extension header
  21 *                                handlers as inet6_protocol{}.
  22 */
  23
  24#include <linux/errno.h>
  25#include <linux/types.h>
  26#include <linux/socket.h>
  27#include <linux/sockios.h>
  28#include <linux/net.h>
  29#include <linux/netdevice.h>
  30#include <linux/in6.h>
  31#include <linux/icmpv6.h>
  32#include <linux/slab.h>
  33#include <linux/export.h>
  34
  35#include <net/dst.h>
  36#include <net/sock.h>
  37#include <net/snmp.h>
  38
  39#include <net/ipv6.h>
  40#include <net/protocol.h>
  41#include <net/transp_v6.h>
  42#include <net/rawv6.h>
  43#include <net/ndisc.h>
  44#include <net/ip6_route.h>
  45#include <net/addrconf.h>
  46#include <net/calipso.h>
  47#if IS_ENABLED(CONFIG_IPV6_MIP6)
  48#include <net/xfrm.h>
  49#endif
  50#include <linux/seg6.h>
  51#include <net/seg6.h>
  52#ifdef CONFIG_IPV6_SEG6_HMAC
  53#include <net/seg6_hmac.h>
  54#endif
  55
  56#include <linux/uaccess.h>
  57
  58/*
  59 *      Parsing tlv encoded headers.
  60 *
  61 *      Parsing function "func" returns true, if parsing succeed
  62 *      and false, if it failed.
  63 *      It MUST NOT touch skb->h.
  64 */
  65
  66struct tlvtype_proc {
  67        int     type;
  68        bool    (*func)(struct sk_buff *skb, int offset);
  69};
  70
  71/*********************
  72  Generic functions
  73 *********************/
  74
  75/* An unknown option is detected, decide what to do */
  76
  77static bool ip6_tlvopt_unknown(struct sk_buff *skb, int optoff,
  78                               bool disallow_unknowns)
  79{
  80        if (disallow_unknowns) {
  81                /* If unknown TLVs are disallowed by configuration
  82                 * then always silently drop packet. Note this also
  83                 * means no ICMP parameter problem is sent which
  84                 * could be a good property to mitigate a reflection DOS
  85                 * attack.
  86                 */
  87
  88                goto drop;
  89        }
  90
  91        switch ((skb_network_header(skb)[optoff] & 0xC0) >> 6) {
  92        case 0: /* ignore */
  93                return true;
  94
  95        case 1: /* drop packet */
  96                break;
  97
  98        case 3: /* Send ICMP if not a multicast address and drop packet */
  99                /* Actually, it is redundant check. icmp_send
 100                   will recheck in any case.
 101                 */
 102                if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr))
 103                        break;
 104                /* fall through */
 105        case 2: /* send ICMP PARM PROB regardless and drop packet */
 106                icmpv6_param_prob(skb, ICMPV6_UNK_OPTION, optoff);
 107                return false;
 108        }
 109
 110drop:
 111        kfree_skb(skb);
 112        return false;
 113}
 114
 115/* Parse tlv encoded option header (hop-by-hop or destination) */
 116
 117static bool ip6_parse_tlv(const struct tlvtype_proc *procs,
 118                          struct sk_buff *skb,
 119                          int max_count)
 120{
 121        int len = (skb_transport_header(skb)[1] + 1) << 3;
 122        const unsigned char *nh = skb_network_header(skb);
 123        int off = skb_network_header_len(skb);
 124        const struct tlvtype_proc *curr;
 125        bool disallow_unknowns = false;
 126        int tlv_count = 0;
 127        int padlen = 0;
 128
 129        if (unlikely(max_count < 0)) {
 130                disallow_unknowns = true;
 131                max_count = -max_count;
 132        }
 133
 134        if (skb_transport_offset(skb) + len > skb_headlen(skb))
 135                goto bad;
 136
 137        off += 2;
 138        len -= 2;
 139
 140        while (len > 0) {
 141                int optlen = nh[off + 1] + 2;
 142                int i;
 143
 144                switch (nh[off]) {
 145                case IPV6_TLV_PAD1:
 146                        optlen = 1;
 147                        padlen++;
 148                        if (padlen > 7)
 149                                goto bad;
 150                        break;
 151
 152                case IPV6_TLV_PADN:
 153                        /* RFC 2460 states that the purpose of PadN is
 154                         * to align the containing header to multiples
 155                         * of 8. 7 is therefore the highest valid value.
 156                         * See also RFC 4942, Section 2.1.9.5.
 157                         */
 158                        padlen += optlen;
 159                        if (padlen > 7)
 160                                goto bad;
 161                        /* RFC 4942 recommends receiving hosts to
 162                         * actively check PadN payload to contain
 163                         * only zeroes.
 164                         */
 165                        for (i = 2; i < optlen; i++) {
 166                                if (nh[off + i] != 0)
 167                                        goto bad;
 168                        }
 169                        break;
 170
 171                default: /* Other TLV code so scan list */
 172                        if (optlen > len)
 173                                goto bad;
 174
 175                        tlv_count++;
 176                        if (tlv_count > max_count)
 177                                goto bad;
 178
 179                        for (curr = procs; curr->type >= 0; curr++) {
 180                                if (curr->type == nh[off]) {
 181                                        /* type specific length/alignment
 182                                           checks will be performed in the
 183                                           func(). */
 184                                        if (curr->func(skb, off) == false)
 185                                                return false;
 186                                        break;
 187                                }
 188                        }
 189                        if (curr->type < 0 &&
 190                            !ip6_tlvopt_unknown(skb, off, disallow_unknowns))
 191                                return false;
 192
 193                        padlen = 0;
 194                        break;
 195                }
 196                off += optlen;
 197                len -= optlen;
 198        }
 199
 200        if (len == 0)
 201                return true;
 202bad:
 203        kfree_skb(skb);
 204        return false;
 205}
 206
 207/*****************************
 208  Destination options header.
 209 *****************************/
 210
 211#if IS_ENABLED(CONFIG_IPV6_MIP6)
 212static bool ipv6_dest_hao(struct sk_buff *skb, int optoff)
 213{
 214        struct ipv6_destopt_hao *hao;
 215        struct inet6_skb_parm *opt = IP6CB(skb);
 216        struct ipv6hdr *ipv6h = ipv6_hdr(skb);
 217        int ret;
 218
 219        if (opt->dsthao) {
 220                net_dbg_ratelimited("hao duplicated\n");
 221                goto discard;
 222        }
 223        opt->dsthao = opt->dst1;
 224        opt->dst1 = 0;
 225
 226        hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + optoff);
 227
 228        if (hao->length != 16) {
 229                net_dbg_ratelimited("hao invalid option length = %d\n",
 230                                    hao->length);
 231                goto discard;
 232        }
 233
 234        if (!(ipv6_addr_type(&hao->addr) & IPV6_ADDR_UNICAST)) {
 235                net_dbg_ratelimited("hao is not an unicast addr: %pI6\n",
 236                                    &hao->addr);
 237                goto discard;
 238        }
 239
 240        ret = xfrm6_input_addr(skb, (xfrm_address_t *)&ipv6h->daddr,
 241                               (xfrm_address_t *)&hao->addr, IPPROTO_DSTOPTS);
 242        if (unlikely(ret < 0))
 243                goto discard;
 244
 245        if (skb_cloned(skb)) {
 246                if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC))
 247                        goto discard;
 248
 249                /* update all variable using below by copied skbuff */
 250                hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) +
 251                                                  optoff);
 252                ipv6h = ipv6_hdr(skb);
 253        }
 254
 255        if (skb->ip_summed == CHECKSUM_COMPLETE)
 256                skb->ip_summed = CHECKSUM_NONE;
 257
 258        swap(ipv6h->saddr, hao->addr);
 259
 260        if (skb->tstamp == 0)
 261                __net_timestamp(skb);
 262
 263        return true;
 264
 265 discard:
 266        kfree_skb(skb);
 267        return false;
 268}
 269#endif
 270
 271static const struct tlvtype_proc tlvprocdestopt_lst[] = {
 272#if IS_ENABLED(CONFIG_IPV6_MIP6)
 273        {
 274                .type   = IPV6_TLV_HAO,
 275                .func   = ipv6_dest_hao,
 276        },
 277#endif
 278        {-1,                    NULL}
 279};
 280
 281static int ipv6_destopt_rcv(struct sk_buff *skb)
 282{
 283        struct inet6_skb_parm *opt = IP6CB(skb);
 284#if IS_ENABLED(CONFIG_IPV6_MIP6)
 285        __u16 dstbuf;
 286#endif
 287        struct dst_entry *dst = skb_dst(skb);
 288        struct net *net = dev_net(skb->dev);
 289        int extlen;
 290
 291        if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
 292            !pskb_may_pull(skb, (skb_transport_offset(skb) +
 293                                 ((skb_transport_header(skb)[1] + 1) << 3)))) {
 294                __IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst),
 295                                IPSTATS_MIB_INHDRERRORS);
 296fail_and_free:
 297                kfree_skb(skb);
 298                return -1;
 299        }
 300
 301        extlen = (skb_transport_header(skb)[1] + 1) << 3;
 302        if (extlen > net->ipv6.sysctl.max_dst_opts_len)
 303                goto fail_and_free;
 304
 305        opt->lastopt = opt->dst1 = skb_network_header_len(skb);
 306#if IS_ENABLED(CONFIG_IPV6_MIP6)
 307        dstbuf = opt->dst1;
 308#endif
 309
 310        if (ip6_parse_tlv(tlvprocdestopt_lst, skb,
 311                          init_net.ipv6.sysctl.max_dst_opts_cnt)) {
 312                skb->transport_header += extlen;
 313                opt = IP6CB(skb);
 314#if IS_ENABLED(CONFIG_IPV6_MIP6)
 315                opt->nhoff = dstbuf;
 316#else
 317                opt->nhoff = opt->dst1;
 318#endif
 319                return 1;
 320        }
 321
 322        __IP6_INC_STATS(dev_net(dst->dev),
 323                        ip6_dst_idev(dst), IPSTATS_MIB_INHDRERRORS);
 324        return -1;
 325}
 326
 327static void seg6_update_csum(struct sk_buff *skb)
 328{
 329        struct ipv6_sr_hdr *hdr;
 330        struct in6_addr *addr;
 331        __be32 from, to;
 332
 333        /* srh is at transport offset and seg_left is already decremented
 334         * but daddr is not yet updated with next segment
 335         */
 336
 337        hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
 338        addr = hdr->segments + hdr->segments_left;
 339
 340        hdr->segments_left++;
 341        from = *(__be32 *)hdr;
 342
 343        hdr->segments_left--;
 344        to = *(__be32 *)hdr;
 345
 346        /* update skb csum with diff resulting from seg_left decrement */
 347
 348        update_csum_diff4(skb, from, to);
 349
 350        /* compute csum diff between current and next segment and update */
 351
 352        update_csum_diff16(skb, (__be32 *)(&ipv6_hdr(skb)->daddr),
 353                           (__be32 *)addr);
 354}
 355
 356static int ipv6_srh_rcv(struct sk_buff *skb)
 357{
 358        struct inet6_skb_parm *opt = IP6CB(skb);
 359        struct net *net = dev_net(skb->dev);
 360        struct ipv6_sr_hdr *hdr;
 361        struct inet6_dev *idev;
 362        struct in6_addr *addr;
 363        int accept_seg6;
 364
 365        hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
 366
 367        idev = __in6_dev_get(skb->dev);
 368
 369        accept_seg6 = net->ipv6.devconf_all->seg6_enabled;
 370        if (accept_seg6 > idev->cnf.seg6_enabled)
 371                accept_seg6 = idev->cnf.seg6_enabled;
 372
 373        if (!accept_seg6) {
 374                kfree_skb(skb);
 375                return -1;
 376        }
 377
 378#ifdef CONFIG_IPV6_SEG6_HMAC
 379        if (!seg6_hmac_validate_skb(skb)) {
 380                kfree_skb(skb);
 381                return -1;
 382        }
 383#endif
 384
 385looped_back:
 386        if (hdr->segments_left == 0) {
 387                if (hdr->nexthdr == NEXTHDR_IPV6) {
 388                        int offset = (hdr->hdrlen + 1) << 3;
 389
 390                        skb_postpull_rcsum(skb, skb_network_header(skb),
 391                                           skb_network_header_len(skb));
 392
 393                        if (!pskb_pull(skb, offset)) {
 394                                kfree_skb(skb);
 395                                return -1;
 396                        }
 397                        skb_postpull_rcsum(skb, skb_transport_header(skb),
 398                                           offset);
 399
 400                        skb_reset_network_header(skb);
 401                        skb_reset_transport_header(skb);
 402                        skb->encapsulation = 0;
 403
 404                        __skb_tunnel_rx(skb, skb->dev, net);
 405
 406                        netif_rx(skb);
 407                        return -1;
 408                }
 409
 410                opt->srcrt = skb_network_header_len(skb);
 411                opt->lastopt = opt->srcrt;
 412                skb->transport_header += (hdr->hdrlen + 1) << 3;
 413                opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
 414
 415                return 1;
 416        }
 417
 418        if (hdr->segments_left >= (hdr->hdrlen >> 1)) {
 419                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 420                                IPSTATS_MIB_INHDRERRORS);
 421                icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
 422                                  ((&hdr->segments_left) -
 423                                   skb_network_header(skb)));
 424                return -1;
 425        }
 426
 427        if (skb_cloned(skb)) {
 428                if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
 429                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 430                                        IPSTATS_MIB_OUTDISCARDS);
 431                        kfree_skb(skb);
 432                        return -1;
 433                }
 434        }
 435
 436        hdr = (struct ipv6_sr_hdr *)skb_transport_header(skb);
 437
 438        hdr->segments_left--;
 439        addr = hdr->segments + hdr->segments_left;
 440
 441        skb_push(skb, sizeof(struct ipv6hdr));
 442
 443        if (skb->ip_summed == CHECKSUM_COMPLETE)
 444                seg6_update_csum(skb);
 445
 446        ipv6_hdr(skb)->daddr = *addr;
 447
 448        skb_dst_drop(skb);
 449
 450        ip6_route_input(skb);
 451
 452        if (skb_dst(skb)->error) {
 453                dst_input(skb);
 454                return -1;
 455        }
 456
 457        if (skb_dst(skb)->dev->flags & IFF_LOOPBACK) {
 458                if (ipv6_hdr(skb)->hop_limit <= 1) {
 459                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 460                                        IPSTATS_MIB_INHDRERRORS);
 461                        icmpv6_send(skb, ICMPV6_TIME_EXCEED,
 462                                    ICMPV6_EXC_HOPLIMIT, 0);
 463                        kfree_skb(skb);
 464                        return -1;
 465                }
 466                ipv6_hdr(skb)->hop_limit--;
 467
 468                skb_pull(skb, sizeof(struct ipv6hdr));
 469                goto looped_back;
 470        }
 471
 472        dst_input(skb);
 473
 474        return -1;
 475}
 476
 477/********************************
 478  Routing header.
 479 ********************************/
 480
 481/* called with rcu_read_lock() */
 482static int ipv6_rthdr_rcv(struct sk_buff *skb)
 483{
 484        struct inet6_skb_parm *opt = IP6CB(skb);
 485        struct in6_addr *addr = NULL;
 486        struct in6_addr daddr;
 487        struct inet6_dev *idev;
 488        int n, i;
 489        struct ipv6_rt_hdr *hdr;
 490        struct rt0_hdr *rthdr;
 491        struct net *net = dev_net(skb->dev);
 492        int accept_source_route = net->ipv6.devconf_all->accept_source_route;
 493
 494        idev = __in6_dev_get(skb->dev);
 495        if (idev && accept_source_route > idev->cnf.accept_source_route)
 496                accept_source_route = idev->cnf.accept_source_route;
 497
 498        if (!pskb_may_pull(skb, skb_transport_offset(skb) + 8) ||
 499            !pskb_may_pull(skb, (skb_transport_offset(skb) +
 500                                 ((skb_transport_header(skb)[1] + 1) << 3)))) {
 501                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 502                                IPSTATS_MIB_INHDRERRORS);
 503                kfree_skb(skb);
 504                return -1;
 505        }
 506
 507        hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
 508
 509        if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr) ||
 510            skb->pkt_type != PACKET_HOST) {
 511                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 512                                IPSTATS_MIB_INADDRERRORS);
 513                kfree_skb(skb);
 514                return -1;
 515        }
 516
 517        /* segment routing */
 518        if (hdr->type == IPV6_SRCRT_TYPE_4)
 519                return ipv6_srh_rcv(skb);
 520
 521looped_back:
 522        if (hdr->segments_left == 0) {
 523                switch (hdr->type) {
 524#if IS_ENABLED(CONFIG_IPV6_MIP6)
 525                case IPV6_SRCRT_TYPE_2:
 526                        /* Silently discard type 2 header unless it was
 527                         * processed by own
 528                         */
 529                        if (!addr) {
 530                                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 531                                                IPSTATS_MIB_INADDRERRORS);
 532                                kfree_skb(skb);
 533                                return -1;
 534                        }
 535                        break;
 536#endif
 537                default:
 538                        break;
 539                }
 540
 541                opt->lastopt = opt->srcrt = skb_network_header_len(skb);
 542                skb->transport_header += (hdr->hdrlen + 1) << 3;
 543                opt->dst0 = opt->dst1;
 544                opt->dst1 = 0;
 545                opt->nhoff = (&hdr->nexthdr) - skb_network_header(skb);
 546                return 1;
 547        }
 548
 549        switch (hdr->type) {
 550#if IS_ENABLED(CONFIG_IPV6_MIP6)
 551        case IPV6_SRCRT_TYPE_2:
 552                if (accept_source_route < 0)
 553                        goto unknown_rh;
 554                /* Silently discard invalid RTH type 2 */
 555                if (hdr->hdrlen != 2 || hdr->segments_left != 1) {
 556                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 557                                        IPSTATS_MIB_INHDRERRORS);
 558                        kfree_skb(skb);
 559                        return -1;
 560                }
 561                break;
 562#endif
 563        default:
 564                goto unknown_rh;
 565        }
 566
 567        /*
 568         *      This is the routing header forwarding algorithm from
 569         *      RFC 2460, page 16.
 570         */
 571
 572        n = hdr->hdrlen >> 1;
 573
 574        if (hdr->segments_left > n) {
 575                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 576                                IPSTATS_MIB_INHDRERRORS);
 577                icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
 578                                  ((&hdr->segments_left) -
 579                                   skb_network_header(skb)));
 580                return -1;
 581        }
 582
 583        /* We are about to mangle packet header. Be careful!
 584           Do not damage packets queued somewhere.
 585         */
 586        if (skb_cloned(skb)) {
 587                /* the copy is a forwarded packet */
 588                if (pskb_expand_head(skb, 0, 0, GFP_ATOMIC)) {
 589                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 590                                        IPSTATS_MIB_OUTDISCARDS);
 591                        kfree_skb(skb);
 592                        return -1;
 593                }
 594                hdr = (struct ipv6_rt_hdr *)skb_transport_header(skb);
 595        }
 596
 597        if (skb->ip_summed == CHECKSUM_COMPLETE)
 598                skb->ip_summed = CHECKSUM_NONE;
 599
 600        i = n - --hdr->segments_left;
 601
 602        rthdr = (struct rt0_hdr *) hdr;
 603        addr = rthdr->addr;
 604        addr += i - 1;
 605
 606        switch (hdr->type) {
 607#if IS_ENABLED(CONFIG_IPV6_MIP6)
 608        case IPV6_SRCRT_TYPE_2:
 609                if (xfrm6_input_addr(skb, (xfrm_address_t *)addr,
 610                                     (xfrm_address_t *)&ipv6_hdr(skb)->saddr,
 611                                     IPPROTO_ROUTING) < 0) {
 612                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 613                                        IPSTATS_MIB_INADDRERRORS);
 614                        kfree_skb(skb);
 615                        return -1;
 616                }
 617                if (!ipv6_chk_home_addr(dev_net(skb_dst(skb)->dev), addr)) {
 618                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 619                                        IPSTATS_MIB_INADDRERRORS);
 620                        kfree_skb(skb);
 621                        return -1;
 622                }
 623                break;
 624#endif
 625        default:
 626                break;
 627        }
 628
 629        if (ipv6_addr_is_multicast(addr)) {
 630                __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 631                                IPSTATS_MIB_INADDRERRORS);
 632                kfree_skb(skb);
 633                return -1;
 634        }
 635
 636        daddr = *addr;
 637        *addr = ipv6_hdr(skb)->daddr;
 638        ipv6_hdr(skb)->daddr = daddr;
 639
 640        skb_dst_drop(skb);
 641        ip6_route_input(skb);
 642        if (skb_dst(skb)->error) {
 643                skb_push(skb, skb->data - skb_network_header(skb));
 644                dst_input(skb);
 645                return -1;
 646        }
 647
 648        if (skb_dst(skb)->dev->flags&IFF_LOOPBACK) {
 649                if (ipv6_hdr(skb)->hop_limit <= 1) {
 650                        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)),
 651                                        IPSTATS_MIB_INHDRERRORS);
 652                        icmpv6_send(skb, ICMPV6_TIME_EXCEED, ICMPV6_EXC_HOPLIMIT,
 653                                    0);
 654                        kfree_skb(skb);
 655                        return -1;
 656                }
 657                ipv6_hdr(skb)->hop_limit--;
 658                goto looped_back;
 659        }
 660
 661        skb_push(skb, skb->data - skb_network_header(skb));
 662        dst_input(skb);
 663        return -1;
 664
 665unknown_rh:
 666        __IP6_INC_STATS(net, ip6_dst_idev(skb_dst(skb)), IPSTATS_MIB_INHDRERRORS);
 667        icmpv6_param_prob(skb, ICMPV6_HDR_FIELD,
 668                          (&hdr->type) - skb_network_header(skb));
 669        return -1;
 670}
 671
 672static const struct inet6_protocol rthdr_protocol = {
 673        .handler        =       ipv6_rthdr_rcv,
 674        .flags          =       INET6_PROTO_NOPOLICY,
 675};
 676
 677static const struct inet6_protocol destopt_protocol = {
 678        .handler        =       ipv6_destopt_rcv,
 679        .flags          =       INET6_PROTO_NOPOLICY,
 680};
 681
 682static const struct inet6_protocol nodata_protocol = {
 683        .handler        =       dst_discard,
 684        .flags          =       INET6_PROTO_NOPOLICY,
 685};
 686
 687int __init ipv6_exthdrs_init(void)
 688{
 689        int ret;
 690
 691        ret = inet6_add_protocol(&rthdr_protocol, IPPROTO_ROUTING);
 692        if (ret)
 693                goto out;
 694
 695        ret = inet6_add_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
 696        if (ret)
 697                goto out_rthdr;
 698
 699        ret = inet6_add_protocol(&nodata_protocol, IPPROTO_NONE);
 700        if (ret)
 701                goto out_destopt;
 702
 703out:
 704        return ret;
 705out_destopt:
 706        inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
 707out_rthdr:
 708        inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
 709        goto out;
 710};
 711
 712void ipv6_exthdrs_exit(void)
 713{
 714        inet6_del_protocol(&nodata_protocol, IPPROTO_NONE);
 715        inet6_del_protocol(&destopt_protocol, IPPROTO_DSTOPTS);
 716        inet6_del_protocol(&rthdr_protocol, IPPROTO_ROUTING);
 717}
 718
 719/**********************************
 720  Hop-by-hop options.
 721 **********************************/
 722
 723/*
 724 * Note: we cannot rely on skb_dst(skb) before we assign it in ip6_route_input().
 725 */
 726static inline struct inet6_dev *ipv6_skb_idev(struct sk_buff *skb)
 727{
 728        return skb_dst(skb) ? ip6_dst_idev(skb_dst(skb)) : __in6_dev_get(skb->dev);
 729}
 730
 731static inline struct net *ipv6_skb_net(struct sk_buff *skb)
 732{
 733        return skb_dst(skb) ? dev_net(skb_dst(skb)->dev) : dev_net(skb->dev);
 734}
 735
 736/* Router Alert as of RFC 2711 */
 737
 738static bool ipv6_hop_ra(struct sk_buff *skb, int optoff)
 739{
 740        const unsigned char *nh = skb_network_header(skb);
 741
 742        if (nh[optoff + 1] == 2) {
 743                IP6CB(skb)->flags |= IP6SKB_ROUTERALERT;
 744                memcpy(&IP6CB(skb)->ra, nh + optoff + 2, sizeof(IP6CB(skb)->ra));
 745                return true;
 746        }
 747        net_dbg_ratelimited("ipv6_hop_ra: wrong RA length %d\n",
 748                            nh[optoff + 1]);
 749        kfree_skb(skb);
 750        return false;
 751}
 752
 753/* Jumbo payload */
 754
 755static bool ipv6_hop_jumbo(struct sk_buff *skb, int optoff)
 756{
 757        const unsigned char *nh = skb_network_header(skb);
 758        struct net *net = ipv6_skb_net(skb);
 759        u32 pkt_len;
 760
 761        if (nh[optoff + 1] != 4 || (optoff & 3) != 2) {
 762                net_dbg_ratelimited("ipv6_hop_jumbo: wrong jumbo opt length/alignment %d\n",
 763                                    nh[optoff+1]);
 764                __IP6_INC_STATS(net, ipv6_skb_idev(skb),
 765                                IPSTATS_MIB_INHDRERRORS);
 766                goto drop;
 767        }
 768
 769        pkt_len = ntohl(*(__be32 *)(nh + optoff + 2));
 770        if (pkt_len <= IPV6_MAXPLEN) {
 771                __IP6_INC_STATS(net, ipv6_skb_idev(skb),
 772                                IPSTATS_MIB_INHDRERRORS);
 773                icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff+2);
 774                return false;
 775        }
 776        if (ipv6_hdr(skb)->payload_len) {
 777                __IP6_INC_STATS(net, ipv6_skb_idev(skb),
 778                                IPSTATS_MIB_INHDRERRORS);
 779                icmpv6_param_prob(skb, ICMPV6_HDR_FIELD, optoff);
 780                return false;
 781        }
 782
 783        if (pkt_len > skb->len - sizeof(struct ipv6hdr)) {
 784                __IP6_INC_STATS(net, ipv6_skb_idev(skb),
 785                                IPSTATS_MIB_INTRUNCATEDPKTS);
 786                goto drop;
 787        }
 788
 789        if (pskb_trim_rcsum(skb, pkt_len + sizeof(struct ipv6hdr)))
 790                goto drop;
 791
 792        IP6CB(skb)->flags |= IP6SKB_JUMBOGRAM;
 793        return true;
 794
 795drop:
 796        kfree_skb(skb);
 797        return false;
 798}
 799
 800/* CALIPSO RFC 5570 */
 801
 802static bool ipv6_hop_calipso(struct sk_buff *skb, int optoff)
 803{
 804        const unsigned char *nh = skb_network_header(skb);
 805
 806        if (nh[optoff + 1] < 8)
 807                goto drop;
 808
 809        if (nh[optoff + 6] * 4 + 8 > nh[optoff + 1])
 810                goto drop;
 811
 812        if (!calipso_validate(skb, nh + optoff))
 813                goto drop;
 814
 815        return true;
 816
 817drop:
 818        kfree_skb(skb);
 819        return false;
 820}
 821
 822static const struct tlvtype_proc tlvprochopopt_lst[] = {
 823        {
 824                .type   = IPV6_TLV_ROUTERALERT,
 825                .func   = ipv6_hop_ra,
 826        },
 827        {
 828                .type   = IPV6_TLV_JUMBO,
 829                .func   = ipv6_hop_jumbo,
 830        },
 831        {
 832                .type   = IPV6_TLV_CALIPSO,
 833                .func   = ipv6_hop_calipso,
 834        },
 835        { -1, }
 836};
 837
 838int ipv6_parse_hopopts(struct sk_buff *skb)
 839{
 840        struct inet6_skb_parm *opt = IP6CB(skb);
 841        struct net *net = dev_net(skb->dev);
 842        int extlen;
 843
 844        /*
 845         * skb_network_header(skb) is equal to skb->data, and
 846         * skb_network_header_len(skb) is always equal to
 847         * sizeof(struct ipv6hdr) by definition of
 848         * hop-by-hop options.
 849         */
 850        if (!pskb_may_pull(skb, sizeof(struct ipv6hdr) + 8) ||
 851            !pskb_may_pull(skb, (sizeof(struct ipv6hdr) +
 852                                 ((skb_transport_header(skb)[1] + 1) << 3)))) {
 853fail_and_free:
 854                kfree_skb(skb);
 855                return -1;
 856        }
 857
 858        extlen = (skb_transport_header(skb)[1] + 1) << 3;
 859        if (extlen > net->ipv6.sysctl.max_hbh_opts_len)
 860                goto fail_and_free;
 861
 862        opt->flags |= IP6SKB_HOPBYHOP;
 863        if (ip6_parse_tlv(tlvprochopopt_lst, skb,
 864                          init_net.ipv6.sysctl.max_hbh_opts_cnt)) {
 865                skb->transport_header += extlen;
 866                opt = IP6CB(skb);
 867                opt->nhoff = sizeof(struct ipv6hdr);
 868                return 1;
 869        }
 870        return -1;
 871}
 872
 873/*
 874 *      Creating outbound headers.
 875 *
 876 *      "build" functions work when skb is filled from head to tail (datagram)
 877 *      "push"  functions work when headers are added from tail to head (tcp)
 878 *
 879 *      In both cases we assume, that caller reserved enough room
 880 *      for headers.
 881 */
 882
 883static void ipv6_push_rthdr0(struct sk_buff *skb, u8 *proto,
 884                             struct ipv6_rt_hdr *opt,
 885                             struct in6_addr **addr_p, struct in6_addr *saddr)
 886{
 887        struct rt0_hdr *phdr, *ihdr;
 888        int hops;
 889
 890        ihdr = (struct rt0_hdr *) opt;
 891
 892        phdr = skb_push(skb, (ihdr->rt_hdr.hdrlen + 1) << 3);
 893        memcpy(phdr, ihdr, sizeof(struct rt0_hdr));
 894
 895        hops = ihdr->rt_hdr.hdrlen >> 1;
 896
 897        if (hops > 1)
 898                memcpy(phdr->addr, ihdr->addr + 1,
 899                       (hops - 1) * sizeof(struct in6_addr));
 900
 901        phdr->addr[hops - 1] = **addr_p;
 902        *addr_p = ihdr->addr;
 903
 904        phdr->rt_hdr.nexthdr = *proto;
 905        *proto = NEXTHDR_ROUTING;
 906}
 907
 908static void ipv6_push_rthdr4(struct sk_buff *skb, u8 *proto,
 909                             struct ipv6_rt_hdr *opt,
 910                             struct in6_addr **addr_p, struct in6_addr *saddr)
 911{
 912        struct ipv6_sr_hdr *sr_phdr, *sr_ihdr;
 913        int plen, hops;
 914
 915        sr_ihdr = (struct ipv6_sr_hdr *)opt;
 916        plen = (sr_ihdr->hdrlen + 1) << 3;
 917
 918        sr_phdr = skb_push(skb, plen);
 919        memcpy(sr_phdr, sr_ihdr, sizeof(struct ipv6_sr_hdr));
 920
 921        hops = sr_ihdr->first_segment + 1;
 922        memcpy(sr_phdr->segments + 1, sr_ihdr->segments + 1,
 923               (hops - 1) * sizeof(struct in6_addr));
 924
 925        sr_phdr->segments[0] = **addr_p;
 926        *addr_p = &sr_ihdr->segments[sr_ihdr->segments_left];
 927
 928        if (sr_ihdr->hdrlen > hops * 2) {
 929                int tlvs_offset, tlvs_length;
 930
 931                tlvs_offset = (1 + hops * 2) << 3;
 932                tlvs_length = (sr_ihdr->hdrlen - hops * 2) << 3;
 933                memcpy((char *)sr_phdr + tlvs_offset,
 934                       (char *)sr_ihdr + tlvs_offset, tlvs_length);
 935        }
 936
 937#ifdef CONFIG_IPV6_SEG6_HMAC
 938        if (sr_has_hmac(sr_phdr)) {
 939                struct net *net = NULL;
 940
 941                if (skb->dev)
 942                        net = dev_net(skb->dev);
 943                else if (skb->sk)
 944                        net = sock_net(skb->sk);
 945
 946                WARN_ON(!net);
 947
 948                if (net)
 949                        seg6_push_hmac(net, saddr, sr_phdr);
 950        }
 951#endif
 952
 953        sr_phdr->nexthdr = *proto;
 954        *proto = NEXTHDR_ROUTING;
 955}
 956
 957static void ipv6_push_rthdr(struct sk_buff *skb, u8 *proto,
 958                            struct ipv6_rt_hdr *opt,
 959                            struct in6_addr **addr_p, struct in6_addr *saddr)
 960{
 961        switch (opt->type) {
 962        case IPV6_SRCRT_TYPE_0:
 963        case IPV6_SRCRT_STRICT:
 964        case IPV6_SRCRT_TYPE_2:
 965                ipv6_push_rthdr0(skb, proto, opt, addr_p, saddr);
 966                break;
 967        case IPV6_SRCRT_TYPE_4:
 968                ipv6_push_rthdr4(skb, proto, opt, addr_p, saddr);
 969                break;
 970        default:
 971                break;
 972        }
 973}
 974
 975static void ipv6_push_exthdr(struct sk_buff *skb, u8 *proto, u8 type, struct ipv6_opt_hdr *opt)
 976{
 977        struct ipv6_opt_hdr *h = skb_push(skb, ipv6_optlen(opt));
 978
 979        memcpy(h, opt, ipv6_optlen(opt));
 980        h->nexthdr = *proto;
 981        *proto = type;
 982}
 983
 984void ipv6_push_nfrag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt,
 985                          u8 *proto,
 986                          struct in6_addr **daddr, struct in6_addr *saddr)
 987{
 988        if (opt->srcrt) {
 989                ipv6_push_rthdr(skb, proto, opt->srcrt, daddr, saddr);
 990                /*
 991                 * IPV6_RTHDRDSTOPTS is ignored
 992                 * unless IPV6_RTHDR is set (RFC3542).
 993                 */
 994                if (opt->dst0opt)
 995                        ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst0opt);
 996        }
 997        if (opt->hopopt)
 998                ipv6_push_exthdr(skb, proto, NEXTHDR_HOP, opt->hopopt);
 999}
1000
1001void ipv6_push_frag_opts(struct sk_buff *skb, struct ipv6_txoptions *opt, u8 *proto)
1002{
1003        if (opt->dst1opt)
1004                ipv6_push_exthdr(skb, proto, NEXTHDR_DEST, opt->dst1opt);
1005}
1006EXPORT_SYMBOL(ipv6_push_frag_opts);
1007
1008struct ipv6_txoptions *
1009ipv6_dup_options(struct sock *sk, struct ipv6_txoptions *opt)
1010{
1011        struct ipv6_txoptions *opt2;
1012
1013        opt2 = sock_kmalloc(sk, opt->tot_len, GFP_ATOMIC);
1014        if (opt2) {
1015                long dif = (char *)opt2 - (char *)opt;
1016                memcpy(opt2, opt, opt->tot_len);
1017                if (opt2->hopopt)
1018                        *((char **)&opt2->hopopt) += dif;
1019                if (opt2->dst0opt)
1020                        *((char **)&opt2->dst0opt) += dif;
1021                if (opt2->dst1opt)
1022                        *((char **)&opt2->dst1opt) += dif;
1023                if (opt2->srcrt)
1024                        *((char **)&opt2->srcrt) += dif;
1025                refcount_set(&opt2->refcnt, 1);
1026        }
1027        return opt2;
1028}
1029EXPORT_SYMBOL_GPL(ipv6_dup_options);
1030
1031static int ipv6_renew_option(void *ohdr,
1032                             struct ipv6_opt_hdr __user *newopt, int newoptlen,
1033                             int inherit,
1034                             struct ipv6_opt_hdr **hdr,
1035                             char **p)
1036{
1037        if (inherit) {
1038                if (ohdr) {
1039                        memcpy(*p, ohdr, ipv6_optlen((struct ipv6_opt_hdr *)ohdr));
1040                        *hdr = (struct ipv6_opt_hdr *)*p;
1041                        *p += CMSG_ALIGN(ipv6_optlen(*hdr));
1042                }
1043        } else {
1044                if (newopt) {
1045                        if (copy_from_user(*p, newopt, newoptlen))
1046                                return -EFAULT;
1047                        *hdr = (struct ipv6_opt_hdr *)*p;
1048                        if (ipv6_optlen(*hdr) > newoptlen)
1049                                return -EINVAL;
1050                        *p += CMSG_ALIGN(newoptlen);
1051                }
1052        }
1053        return 0;
1054}
1055
1056/**
1057 * ipv6_renew_options - replace a specific ext hdr with a new one.
1058 *
1059 * @sk: sock from which to allocate memory
1060 * @opt: original options
1061 * @newtype: option type to replace in @opt
1062 * @newopt: new option of type @newtype to replace (user-mem)
1063 * @newoptlen: length of @newopt
1064 *
1065 * Returns a new set of options which is a copy of @opt with the
1066 * option type @newtype replaced with @newopt.
1067 *
1068 * @opt may be NULL, in which case a new set of options is returned
1069 * containing just @newopt.
1070 *
1071 * @newopt may be NULL, in which case the specified option type is
1072 * not copied into the new set of options.
1073 *
1074 * The new set of options is allocated from the socket option memory
1075 * buffer of @sk.
1076 */
1077struct ipv6_txoptions *
1078ipv6_renew_options(struct sock *sk, struct ipv6_txoptions *opt,
1079                   int newtype,
1080                   struct ipv6_opt_hdr __user *newopt, int newoptlen)
1081{
1082        int tot_len = 0;
1083        char *p;
1084        struct ipv6_txoptions *opt2;
1085        int err;
1086
1087        if (opt) {
1088                if (newtype != IPV6_HOPOPTS && opt->hopopt)
1089                        tot_len += CMSG_ALIGN(ipv6_optlen(opt->hopopt));
1090                if (newtype != IPV6_RTHDRDSTOPTS && opt->dst0opt)
1091                        tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst0opt));
1092                if (newtype != IPV6_RTHDR && opt->srcrt)
1093                        tot_len += CMSG_ALIGN(ipv6_optlen(opt->srcrt));
1094                if (newtype != IPV6_DSTOPTS && opt->dst1opt)
1095                        tot_len += CMSG_ALIGN(ipv6_optlen(opt->dst1opt));
1096        }
1097
1098        if (newopt && newoptlen)
1099                tot_len += CMSG_ALIGN(newoptlen);
1100
1101        if (!tot_len)
1102                return NULL;
1103
1104        tot_len += sizeof(*opt2);
1105        opt2 = sock_kmalloc(sk, tot_len, GFP_ATOMIC);
1106        if (!opt2)
1107                return ERR_PTR(-ENOBUFS);
1108
1109        memset(opt2, 0, tot_len);
1110        refcount_set(&opt2->refcnt, 1);
1111        opt2->tot_len = tot_len;
1112        p = (char *)(opt2 + 1);
1113
1114        err = ipv6_renew_option(opt ? opt->hopopt : NULL, newopt, newoptlen,
1115                                newtype != IPV6_HOPOPTS,
1116                                &opt2->hopopt, &p);
1117        if (err)
1118                goto out;
1119
1120        err = ipv6_renew_option(opt ? opt->dst0opt : NULL, newopt, newoptlen,
1121                                newtype != IPV6_RTHDRDSTOPTS,
1122                                &opt2->dst0opt, &p);
1123        if (err)
1124                goto out;
1125
1126        err = ipv6_renew_option(opt ? opt->srcrt : NULL, newopt, newoptlen,
1127                                newtype != IPV6_RTHDR,
1128                                (struct ipv6_opt_hdr **)&opt2->srcrt, &p);
1129        if (err)
1130                goto out;
1131
1132        err = ipv6_renew_option(opt ? opt->dst1opt : NULL, newopt, newoptlen,
1133                                newtype != IPV6_DSTOPTS,
1134                                &opt2->dst1opt, &p);
1135        if (err)
1136                goto out;
1137
1138        opt2->opt_nflen = (opt2->hopopt ? ipv6_optlen(opt2->hopopt) : 0) +
1139                          (opt2->dst0opt ? ipv6_optlen(opt2->dst0opt) : 0) +
1140                          (opt2->srcrt ? ipv6_optlen(opt2->srcrt) : 0);
1141        opt2->opt_flen = (opt2->dst1opt ? ipv6_optlen(opt2->dst1opt) : 0);
1142
1143        return opt2;
1144out:
1145        sock_kfree_s(sk, opt2, opt2->tot_len);
1146        return ERR_PTR(err);
1147}
1148
1149/**
1150 * ipv6_renew_options_kern - replace a specific ext hdr with a new one.
1151 *
1152 * @sk: sock from which to allocate memory
1153 * @opt: original options
1154 * @newtype: option type to replace in @opt
1155 * @newopt: new option of type @newtype to replace (kernel-mem)
1156 * @newoptlen: length of @newopt
1157 *
1158 * See ipv6_renew_options().  The difference is that @newopt is
1159 * kernel memory, rather than user memory.
1160 */
1161struct ipv6_txoptions *
1162ipv6_renew_options_kern(struct sock *sk, struct ipv6_txoptions *opt,
1163                        int newtype, struct ipv6_opt_hdr *newopt,
1164                        int newoptlen)
1165{
1166        struct ipv6_txoptions *ret_val;
1167        const mm_segment_t old_fs = get_fs();
1168
1169        set_fs(KERNEL_DS);
1170        ret_val = ipv6_renew_options(sk, opt, newtype,
1171                                     (struct ipv6_opt_hdr __user *)newopt,
1172                                     newoptlen);
1173        set_fs(old_fs);
1174        return ret_val;
1175}
1176
1177struct ipv6_txoptions *ipv6_fixup_options(struct ipv6_txoptions *opt_space,
1178                                          struct ipv6_txoptions *opt)
1179{
1180        /*
1181         * ignore the dest before srcrt unless srcrt is being included.
1182         * --yoshfuji
1183         */
1184        if (opt && opt->dst0opt && !opt->srcrt) {
1185                if (opt_space != opt) {
1186                        memcpy(opt_space, opt, sizeof(*opt_space));
1187                        opt = opt_space;
1188                }
1189                opt->opt_nflen -= ipv6_optlen(opt->dst0opt);
1190                opt->dst0opt = NULL;
1191        }
1192
1193        return opt;
1194}
1195EXPORT_SYMBOL_GPL(ipv6_fixup_options);
1196
1197/**
1198 * fl6_update_dst - update flowi destination address with info given
1199 *                  by srcrt option, if any.
1200 *
1201 * @fl6: flowi6 for which daddr is to be updated
1202 * @opt: struct ipv6_txoptions in which to look for srcrt opt
1203 * @orig: copy of original daddr address if modified
1204 *
1205 * Returns NULL if no txoptions or no srcrt, otherwise returns orig
1206 * and initial value of fl6->daddr set in orig
1207 */
1208struct in6_addr *fl6_update_dst(struct flowi6 *fl6,
1209                                const struct ipv6_txoptions *opt,
1210                                struct in6_addr *orig)
1211{
1212        if (!opt || !opt->srcrt)
1213                return NULL;
1214
1215        *orig = fl6->daddr;
1216
1217        switch (opt->srcrt->type) {
1218        case IPV6_SRCRT_TYPE_0:
1219        case IPV6_SRCRT_STRICT:
1220        case IPV6_SRCRT_TYPE_2:
1221                fl6->daddr = *((struct rt0_hdr *)opt->srcrt)->addr;
1222                break;
1223        case IPV6_SRCRT_TYPE_4:
1224        {
1225                struct ipv6_sr_hdr *srh = (struct ipv6_sr_hdr *)opt->srcrt;
1226
1227                fl6->daddr = srh->segments[srh->segments_left];
1228                break;
1229        }
1230        default:
1231                return NULL;
1232        }
1233
1234        return orig;
1235}
1236EXPORT_SYMBOL_GPL(fl6_update_dst);
1237