linux/tools/testing/selftests/net/ip_defrag.c
<<
>>
Prefs
   1// SPDX-License-Identifier: GPL-2.0
   2
   3#define _GNU_SOURCE
   4
   5#include <arpa/inet.h>
   6#include <errno.h>
   7#include <error.h>
   8#include <linux/in.h>
   9#include <netinet/ip.h>
  10#include <netinet/ip6.h>
  11#include <netinet/udp.h>
  12#include <stdbool.h>
  13#include <stdio.h>
  14#include <stdlib.h>
  15#include <string.h>
  16#include <time.h>
  17#include <unistd.h>
  18
  19static bool             cfg_do_ipv4;
  20static bool             cfg_do_ipv6;
  21static bool             cfg_verbose;
  22static bool             cfg_overlap;
  23static bool             cfg_permissive;
  24static unsigned short   cfg_port = 9000;
  25
  26const struct in_addr addr4 = { .s_addr = __constant_htonl(INADDR_LOOPBACK + 2) };
  27const struct in6_addr addr6 = IN6ADDR_LOOPBACK_INIT;
  28
  29#define IP4_HLEN        (sizeof(struct iphdr))
  30#define IP6_HLEN        (sizeof(struct ip6_hdr))
  31#define UDP_HLEN        (sizeof(struct udphdr))
  32
  33/* IPv6 fragment header lenth. */
  34#define FRAG_HLEN       8
  35
  36static int payload_len;
  37static int max_frag_len;
  38
  39#define MSG_LEN_MAX     10000   /* Max UDP payload length. */
  40
  41#define IP4_MF          (1u << 13)  /* IPv4 MF flag. */
  42#define IP6_MF          (1)  /* IPv6 MF flag. */
  43
  44#define CSUM_MANGLED_0 (0xffff)
  45
  46static uint8_t udp_payload[MSG_LEN_MAX];
  47static uint8_t ip_frame[IP_MAXPACKET];
  48static uint32_t ip_id = 0xabcd;
  49static int msg_counter;
  50static int frag_counter;
  51static unsigned int seed;
  52
  53/* Receive a UDP packet. Validate it matches udp_payload. */
  54static void recv_validate_udp(int fd_udp)
  55{
  56        ssize_t ret;
  57        static uint8_t recv_buff[MSG_LEN_MAX];
  58
  59        ret = recv(fd_udp, recv_buff, payload_len, 0);
  60        msg_counter++;
  61
  62        if (cfg_overlap) {
  63                if (ret == -1 && (errno == ETIMEDOUT || errno == EAGAIN))
  64                        return;  /* OK */
  65                if (!cfg_permissive) {
  66                        if (ret != -1)
  67                                error(1, 0, "recv: expected timeout; got %d",
  68                                        (int)ret);
  69                        error(1, errno, "recv: expected timeout: %d", errno);
  70                }
  71        }
  72
  73        if (ret == -1)
  74                error(1, errno, "recv: payload_len = %d max_frag_len = %d",
  75                        payload_len, max_frag_len);
  76        if (ret != payload_len)
  77                error(1, 0, "recv: wrong size: %d vs %d", (int)ret, payload_len);
  78        if (memcmp(udp_payload, recv_buff, payload_len))
  79                error(1, 0, "recv: wrong data");
  80}
  81
  82static uint32_t raw_checksum(uint8_t *buf, int len, uint32_t sum)
  83{
  84        int i;
  85
  86        for (i = 0; i < (len & ~1U); i += 2) {
  87                sum += (u_int16_t)ntohs(*((u_int16_t *)(buf + i)));
  88                if (sum > 0xffff)
  89                        sum -= 0xffff;
  90        }
  91
  92        if (i < len) {
  93                sum += buf[i] << 8;
  94                if (sum > 0xffff)
  95                        sum -= 0xffff;
  96        }
  97
  98        return sum;
  99}
 100
 101static uint16_t udp_checksum(struct ip *iphdr, struct udphdr *udphdr)
 102{
 103        uint32_t sum = 0;
 104        uint16_t res;
 105
 106        sum = raw_checksum((uint8_t *)&iphdr->ip_src, 2 * sizeof(iphdr->ip_src),
 107                                IPPROTO_UDP + (uint32_t)(UDP_HLEN + payload_len));
 108        sum = raw_checksum((uint8_t *)udphdr, UDP_HLEN, sum);
 109        sum = raw_checksum((uint8_t *)udp_payload, payload_len, sum);
 110        res = 0xffff & ~sum;
 111        if (res)
 112                return htons(res);
 113        else
 114                return CSUM_MANGLED_0;
 115}
 116
 117static uint16_t udp6_checksum(struct ip6_hdr *iphdr, struct udphdr *udphdr)
 118{
 119        uint32_t sum = 0;
 120        uint16_t res;
 121
 122        sum = raw_checksum((uint8_t *)&iphdr->ip6_src, 2 * sizeof(iphdr->ip6_src),
 123                                IPPROTO_UDP);
 124        sum = raw_checksum((uint8_t *)&udphdr->len, sizeof(udphdr->len), sum);
 125        sum = raw_checksum((uint8_t *)udphdr, UDP_HLEN, sum);
 126        sum = raw_checksum((uint8_t *)udp_payload, payload_len, sum);
 127        res = 0xffff & ~sum;
 128        if (res)
 129                return htons(res);
 130        else
 131                return CSUM_MANGLED_0;
 132}
 133
 134static void send_fragment(int fd_raw, struct sockaddr *addr, socklen_t alen,
 135                                int offset, bool ipv6)
 136{
 137        int frag_len;
 138        int res;
 139        int payload_offset = offset > 0 ? offset - UDP_HLEN : 0;
 140        uint8_t *frag_start = ipv6 ? ip_frame + IP6_HLEN + FRAG_HLEN :
 141                                        ip_frame + IP4_HLEN;
 142
 143        if (offset == 0) {
 144                struct udphdr udphdr;
 145                udphdr.source = htons(cfg_port + 1);
 146                udphdr.dest = htons(cfg_port);
 147                udphdr.len = htons(UDP_HLEN + payload_len);
 148                udphdr.check = 0;
 149                if (ipv6)
 150                        udphdr.check = udp6_checksum((struct ip6_hdr *)ip_frame, &udphdr);
 151                else
 152                        udphdr.check = udp_checksum((struct ip *)ip_frame, &udphdr);
 153                memcpy(frag_start, &udphdr, UDP_HLEN);
 154        }
 155
 156        if (ipv6) {
 157                struct ip6_hdr *ip6hdr = (struct ip6_hdr *)ip_frame;
 158                struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
 159                if (payload_len - payload_offset <= max_frag_len && offset > 0) {
 160                        /* This is the last fragment. */
 161                        frag_len = FRAG_HLEN + payload_len - payload_offset;
 162                        fraghdr->ip6f_offlg = htons(offset);
 163                } else {
 164                        frag_len = FRAG_HLEN + max_frag_len;
 165                        fraghdr->ip6f_offlg = htons(offset | IP6_MF);
 166                }
 167                ip6hdr->ip6_plen = htons(frag_len);
 168                if (offset == 0)
 169                        memcpy(frag_start + UDP_HLEN, udp_payload,
 170                                frag_len - FRAG_HLEN - UDP_HLEN);
 171                else
 172                        memcpy(frag_start, udp_payload + payload_offset,
 173                                frag_len - FRAG_HLEN);
 174                frag_len += IP6_HLEN;
 175        } else {
 176                struct ip *iphdr = (struct ip *)ip_frame;
 177                if (payload_len - payload_offset <= max_frag_len && offset > 0) {
 178                        /* This is the last fragment. */
 179                        frag_len = IP4_HLEN + payload_len - payload_offset;
 180                        iphdr->ip_off = htons(offset / 8);
 181                } else {
 182                        frag_len = IP4_HLEN + max_frag_len;
 183                        iphdr->ip_off = htons(offset / 8 | IP4_MF);
 184                }
 185                iphdr->ip_len = htons(frag_len);
 186                if (offset == 0)
 187                        memcpy(frag_start + UDP_HLEN, udp_payload,
 188                                frag_len - IP4_HLEN - UDP_HLEN);
 189                else
 190                        memcpy(frag_start, udp_payload + payload_offset,
 191                                frag_len - IP4_HLEN);
 192        }
 193
 194        res = sendto(fd_raw, ip_frame, frag_len, 0, addr, alen);
 195        if (res < 0 && errno != EPERM)
 196                error(1, errno, "send_fragment");
 197        if (res >= 0 && res != frag_len)
 198                error(1, 0, "send_fragment: %d vs %d", res, frag_len);
 199
 200        frag_counter++;
 201}
 202
 203static void send_udp_frags(int fd_raw, struct sockaddr *addr,
 204                                socklen_t alen, bool ipv6)
 205{
 206        struct ip *iphdr = (struct ip *)ip_frame;
 207        struct ip6_hdr *ip6hdr = (struct ip6_hdr *)ip_frame;
 208        int res;
 209        int offset;
 210        int frag_len;
 211
 212        /* Send the UDP datagram using raw IP fragments: the 0th fragment
 213         * has the UDP header; other fragments are pieces of udp_payload
 214         * split in chunks of frag_len size.
 215         *
 216         * Odd fragments (1st, 3rd, 5th, etc.) are sent out first, then
 217         * even fragments (0th, 2nd, etc.) are sent out.
 218         */
 219        if (ipv6) {
 220                struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
 221                ((struct sockaddr_in6 *)addr)->sin6_port = 0;
 222                memset(ip6hdr, 0, sizeof(*ip6hdr));
 223                ip6hdr->ip6_flow = htonl(6<<28);  /* Version. */
 224                ip6hdr->ip6_nxt = IPPROTO_FRAGMENT;
 225                ip6hdr->ip6_hops = 255;
 226                ip6hdr->ip6_src = addr6;
 227                ip6hdr->ip6_dst = addr6;
 228                fraghdr->ip6f_nxt = IPPROTO_UDP;
 229                fraghdr->ip6f_reserved = 0;
 230                fraghdr->ip6f_ident = htonl(ip_id++);
 231        } else {
 232                memset(iphdr, 0, sizeof(*iphdr));
 233                iphdr->ip_hl = 5;
 234                iphdr->ip_v = 4;
 235                iphdr->ip_tos = 0;
 236                iphdr->ip_id = htons(ip_id++);
 237                iphdr->ip_ttl = 0x40;
 238                iphdr->ip_p = IPPROTO_UDP;
 239                iphdr->ip_src.s_addr = htonl(INADDR_LOOPBACK);
 240                iphdr->ip_dst = addr4;
 241                iphdr->ip_sum = 0;
 242        }
 243
 244        /* Occasionally test in-order fragments. */
 245        if (!cfg_overlap && (rand() % 100 < 15)) {
 246                offset = 0;
 247                while (offset < (UDP_HLEN + payload_len)) {
 248                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 249                        offset += max_frag_len;
 250                }
 251                return;
 252        }
 253
 254        /* Occasionally test IPv4 "runs" (see net/ipv4/ip_fragment.c) */
 255        if (!cfg_overlap && (rand() % 100 < 20) &&
 256                        (payload_len > 9 * max_frag_len)) {
 257                offset = 6 * max_frag_len;
 258                while (offset < (UDP_HLEN + payload_len)) {
 259                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 260                        offset += max_frag_len;
 261                }
 262                offset = 3 * max_frag_len;
 263                while (offset < 6 * max_frag_len) {
 264                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 265                        offset += max_frag_len;
 266                }
 267                offset = 0;
 268                while (offset < 3 * max_frag_len) {
 269                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 270                        offset += max_frag_len;
 271                }
 272                return;
 273        }
 274
 275        /* Odd fragments. */
 276        offset = max_frag_len;
 277        while (offset < (UDP_HLEN + payload_len)) {
 278                send_fragment(fd_raw, addr, alen, offset, ipv6);
 279                /* IPv4 ignores duplicates, so randomly send a duplicate. */
 280                if (rand() % 100 == 1)
 281                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 282                offset += 2 * max_frag_len;
 283        }
 284
 285        if (cfg_overlap) {
 286                /* Send an extra random fragment.
 287                 *
 288                 * Duplicates and some fragments completely inside
 289                 * previously sent fragments are dropped/ignored. So
 290                 * random offset and frag_len can result in a dropped
 291                 * fragment instead of a dropped queue/packet. Thus we
 292                 * hard-code offset and frag_len.
 293                 */
 294                if (max_frag_len * 4 < payload_len || max_frag_len < 16) {
 295                        /* not enough payload for random offset and frag_len. */
 296                        offset = 8;
 297                        frag_len = UDP_HLEN + max_frag_len;
 298                } else {
 299                        offset = rand() % (payload_len / 2);
 300                        frag_len = 2 * max_frag_len + 1 + rand() % 256;
 301                }
 302                if (ipv6) {
 303                        struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
 304                        /* sendto() returns EINVAL if offset + frag_len is too small. */
 305                        /* In IPv6 if !!(frag_len % 8), the fragment is dropped. */
 306                        frag_len &= ~0x7;
 307                        fraghdr->ip6f_offlg = htons(offset / 8 | IP6_MF);
 308                        ip6hdr->ip6_plen = htons(frag_len);
 309                        frag_len += IP6_HLEN;
 310                } else {
 311                        frag_len += IP4_HLEN;
 312                        iphdr->ip_off = htons(offset / 8 | IP4_MF);
 313                        iphdr->ip_len = htons(frag_len);
 314                }
 315                res = sendto(fd_raw, ip_frame, frag_len, 0, addr, alen);
 316                if (res < 0 && errno != EPERM)
 317                        error(1, errno, "sendto overlap: %d", frag_len);
 318                if (res >= 0 && res != frag_len)
 319                        error(1, 0, "sendto overlap: %d vs %d", (int)res, frag_len);
 320                frag_counter++;
 321        }
 322
 323        /* Event fragments. */
 324        offset = 0;
 325        while (offset < (UDP_HLEN + payload_len)) {
 326                send_fragment(fd_raw, addr, alen, offset, ipv6);
 327                /* IPv4 ignores duplicates, so randomly send a duplicate. */
 328                if (rand() % 100 == 1)
 329                        send_fragment(fd_raw, addr, alen, offset, ipv6);
 330                offset += 2 * max_frag_len;
 331        }
 332}
 333
 334static void run_test(struct sockaddr *addr, socklen_t alen, bool ipv6)
 335{
 336        int fd_tx_raw, fd_rx_udp;
 337        /* Frag queue timeout is set to one second in the calling script;
 338         * socket timeout should be just a bit longer to avoid tests interfering
 339         * with each other.
 340         */
 341        struct timeval tv = { .tv_sec = 1, .tv_usec = 10 };
 342        int idx;
 343        int min_frag_len = 8;
 344
 345        /* Initialize the payload. */
 346        for (idx = 0; idx < MSG_LEN_MAX; ++idx)
 347                udp_payload[idx] = idx % 256;
 348
 349        /* Open sockets. */
 350        fd_tx_raw = socket(addr->sa_family, SOCK_RAW, IPPROTO_RAW);
 351        if (fd_tx_raw == -1)
 352                error(1, errno, "socket tx_raw");
 353
 354        fd_rx_udp = socket(addr->sa_family, SOCK_DGRAM, 0);
 355        if (fd_rx_udp == -1)
 356                error(1, errno, "socket rx_udp");
 357        if (bind(fd_rx_udp, addr, alen))
 358                error(1, errno, "bind");
 359        /* Fail fast. */
 360        if (setsockopt(fd_rx_udp, SOL_SOCKET, SO_RCVTIMEO, &tv, sizeof(tv)))
 361                error(1, errno, "setsockopt rcv timeout");
 362
 363        for (payload_len = min_frag_len; payload_len < MSG_LEN_MAX;
 364                        payload_len += (rand() % 4096)) {
 365                if (cfg_verbose)
 366                        printf("payload_len: %d\n", payload_len);
 367
 368                if (cfg_overlap) {
 369                        /* With overlaps, one send/receive pair below takes
 370                         * at least one second (== timeout) to run, so there
 371                         * is not enough test time to run a nested loop:
 372                         * the full overlap test takes 20-30 seconds.
 373                         */
 374                        max_frag_len = min_frag_len +
 375                                rand() % (1500 - FRAG_HLEN - min_frag_len);
 376                        send_udp_frags(fd_tx_raw, addr, alen, ipv6);
 377                        recv_validate_udp(fd_rx_udp);
 378                } else {
 379                        /* Without overlaps, each packet reassembly (== one
 380                         * send/receive pair below) takes very little time to
 381                         * run, so we can easily afford more thourough testing
 382                         * with a nested loop: the full non-overlap test takes
 383                         * less than one second).
 384                         */
 385                        max_frag_len = min_frag_len;
 386                        do {
 387                                send_udp_frags(fd_tx_raw, addr, alen, ipv6);
 388                                recv_validate_udp(fd_rx_udp);
 389                                max_frag_len += 8 * (rand() % 8);
 390                        } while (max_frag_len < (1500 - FRAG_HLEN) &&
 391                                 max_frag_len <= payload_len);
 392                }
 393        }
 394
 395        /* Cleanup. */
 396        if (close(fd_tx_raw))
 397                error(1, errno, "close tx_raw");
 398        if (close(fd_rx_udp))
 399                error(1, errno, "close rx_udp");
 400
 401        if (cfg_verbose)
 402                printf("processed %d messages, %d fragments\n",
 403                        msg_counter, frag_counter);
 404
 405        fprintf(stderr, "PASS\n");
 406}
 407
 408
 409static void run_test_v4(void)
 410{
 411        struct sockaddr_in addr = {0};
 412
 413        addr.sin_family = AF_INET;
 414        addr.sin_port = htons(cfg_port);
 415        addr.sin_addr = addr4;
 416
 417        run_test((void *)&addr, sizeof(addr), false /* !ipv6 */);
 418}
 419
 420static void run_test_v6(void)
 421{
 422        struct sockaddr_in6 addr = {0};
 423
 424        addr.sin6_family = AF_INET6;
 425        addr.sin6_port = htons(cfg_port);
 426        addr.sin6_addr = addr6;
 427
 428        run_test((void *)&addr, sizeof(addr), true /* ipv6 */);
 429}
 430
 431static void parse_opts(int argc, char **argv)
 432{
 433        int c;
 434
 435        while ((c = getopt(argc, argv, "46opv")) != -1) {
 436                switch (c) {
 437                case '4':
 438                        cfg_do_ipv4 = true;
 439                        break;
 440                case '6':
 441                        cfg_do_ipv6 = true;
 442                        break;
 443                case 'o':
 444                        cfg_overlap = true;
 445                        break;
 446                case 'p':
 447                        cfg_permissive = true;
 448                        break;
 449                case 'v':
 450                        cfg_verbose = true;
 451                        break;
 452                default:
 453                        error(1, 0, "%s: parse error", argv[0]);
 454                }
 455        }
 456}
 457
 458int main(int argc, char **argv)
 459{
 460        parse_opts(argc, argv);
 461        seed = time(NULL);
 462        srand(seed);
 463        /* Print the seed to track/reproduce potential failures. */
 464        printf("seed = %d\n", seed);
 465
 466        if (cfg_do_ipv4)
 467                run_test_v4();
 468        if (cfg_do_ipv6)
 469                run_test_v6();
 470
 471        return 0;
 472}
 473