1// SPDX-License-Identifier: GPL-2.0
2
3#define _GNU_SOURCE
4
5#include <arpa/inet.h>
6#include <errno.h>
7#include <error.h>
8#include <linux/in.h>
9#include <netinet/ip.h>
10#include <netinet/ip6.h>
11#include <netinet/udp.h>
12#include <stdbool.h>
13#include <stdio.h>
14#include <stdlib.h>
15#include <string.h>
16#include <time.h>
17#include <unistd.h>
18
19static bool cfg_do_ipv4;
20static bool cfg_do_ipv6;
21static bool cfg_verbose;
22static bool cfg_overlap;
23static bool cfg_permissive;
24static unsigned short cfg_port = 9000;
25
26const struct in_addr addr4 = { .s_addr = __constant_htonl(INADDR_LOOPBACK + 2) };
27const struct in6_addr addr6 = IN6ADDR_LOOPBACK_INIT;
28
29#define IP4_HLEN (sizeof(struct iphdr))
30#define IP6_HLEN (sizeof(struct ip6_hdr))
31#define UDP_HLEN (sizeof(struct udphdr))
32
33/* IPv6 fragment header lenth. */
34#define FRAG_HLEN 8
35
36static int payload_len;
37static int max_frag_len;
38
39#define MSG_LEN_MAX 10000 /* Max UDP payload length. */
40
41#define IP4_MF (1u << 13) /* IPv4 MF flag. */
42#define IP6_MF (1) /* IPv6 MF flag. */
43
44#define CSUM_MANGLED_0 (0xffff)
45
46static uint8_t udp_payload[MSG_LEN_MAX];
47static uint8_t ip_frame[IP_MAXPACKET];
48static uint32_t ip_id = 0xabcd;
49static int msg_counter;
50static int frag_counter;
51static unsigned int seed;
52
53/* Receive a UDP packet. Validate it matches udp_payload. */
54static void recv_validate_udp(int fd_udp)
55{
56 ssize_t ret;
57 static uint8_t recv_buff[MSG_LEN_MAX];
58
59 ret = recv(fd_udp, recv_buff, payload_len, 0);
60 msg_counter++;
61
62 if (cfg_overlap) {
63 if (ret == -1 && (errno == ETIMEDOUT || errno == EAGAIN))
64 return; /* OK */
65 if (!cfg_permissive) {
66 if (ret != -1)
67 error(1, 0, "recv: expected timeout; got %d",
68 (int)ret);
69 error(1, errno, "recv: expected timeout: %d", errno);
70 }
71 }
72
73 if (ret == -1)
74 error(1, errno, "recv: payload_len = %d max_frag_len = %d",
75 payload_len, max_frag_len);
76 if (ret != payload_len)
77 error(1, 0, "recv: wrong size: %d vs %d", (int)ret, payload_len);
78 if (memcmp(p: udp_payload, q: recv_buff, size: payload_len))
79 error(1, 0, "recv: wrong data");
80}
81
82static uint32_t raw_checksum(uint8_t *buf, int len, uint32_t sum)
83{
84 int i;
85
86 for (i = 0; i < (len & ~1U); i += 2) {
87 sum += (u_int16_t)ntohs(*((u_int16_t *)(buf + i)));
88 if (sum > 0xffff)
89 sum -= 0xffff;
90 }
91
92 if (i < len) {
93 sum += buf[i] << 8;
94 if (sum > 0xffff)
95 sum -= 0xffff;
96 }
97
98 return sum;
99}
100
101static uint16_t udp_checksum(struct ip *iphdr, struct udphdr *udphdr)
102{
103 uint32_t sum = 0;
104 uint16_t res;
105
106 sum = raw_checksum((uint8_t *)&iphdr->ip_src, 2 * sizeof(iphdr->ip_src),
107 IPPROTO_UDP + (uint32_t)(UDP_HLEN + payload_len));
108 sum = raw_checksum((uint8_t *)udphdr, UDP_HLEN, sum);
109 sum = raw_checksum(buf: (uint8_t *)udp_payload, len: payload_len, sum);
110 res = 0xffff & ~sum;
111 if (res)
112 return htons(res);
113 else
114 return CSUM_MANGLED_0;
115}
116
117static uint16_t udp6_checksum(struct ip6_hdr *iphdr, struct udphdr *udphdr)
118{
119 uint32_t sum = 0;
120 uint16_t res;
121
122 sum = raw_checksum(buf: (uint8_t *)&iphdr->ip6_src, len: 2 * sizeof(iphdr->ip6_src),
123 IPPROTO_UDP);
124 sum = raw_checksum(buf: (uint8_t *)&udphdr->len, len: sizeof(udphdr->len), sum);
125 sum = raw_checksum((uint8_t *)udphdr, UDP_HLEN, sum);
126 sum = raw_checksum(buf: (uint8_t *)udp_payload, len: payload_len, sum);
127 res = 0xffff & ~sum;
128 if (res)
129 return htons(res);
130 else
131 return CSUM_MANGLED_0;
132}
133
134static void send_fragment(int fd_raw, struct sockaddr *addr, socklen_t alen,
135 int offset, bool ipv6)
136{
137 int frag_len;
138 int res;
139 int payload_offset = offset > 0 ? offset - UDP_HLEN : 0;
140 uint8_t *frag_start = ipv6 ? ip_frame + IP6_HLEN + FRAG_HLEN :
141 ip_frame + IP4_HLEN;
142
143 if (offset == 0) {
144 struct udphdr udphdr;
145 udphdr.source = htons(cfg_port + 1);
146 udphdr.dest = htons(cfg_port);
147 udphdr.len = htons(UDP_HLEN + payload_len);
148 udphdr.check = 0;
149 if (ipv6)
150 udphdr.check = udp6_checksum(iphdr: (struct ip6_hdr *)ip_frame, udphdr: &udphdr);
151 else
152 udphdr.check = udp_checksum(iphdr: (struct ip *)ip_frame, udphdr: &udphdr);
153 memcpy(frag_start, &udphdr, UDP_HLEN);
154 }
155
156 if (ipv6) {
157 struct ip6_hdr *ip6hdr = (struct ip6_hdr *)ip_frame;
158 struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
159 if (payload_len - payload_offset <= max_frag_len && offset > 0) {
160 /* This is the last fragment. */
161 frag_len = FRAG_HLEN + payload_len - payload_offset;
162 fraghdr->ip6f_offlg = htons(offset);
163 } else {
164 frag_len = FRAG_HLEN + max_frag_len;
165 fraghdr->ip6f_offlg = htons(offset | IP6_MF);
166 }
167 ip6hdr->ip6_plen = htons(frag_len);
168 if (offset == 0)
169 memcpy(frag_start + UDP_HLEN, udp_payload,
170 frag_len - FRAG_HLEN - UDP_HLEN);
171 else
172 memcpy(frag_start, udp_payload + payload_offset,
173 frag_len - FRAG_HLEN);
174 frag_len += IP6_HLEN;
175 } else {
176 struct ip *iphdr = (struct ip *)ip_frame;
177 if (payload_len - payload_offset <= max_frag_len && offset > 0) {
178 /* This is the last fragment. */
179 frag_len = IP4_HLEN + payload_len - payload_offset;
180 iphdr->ip_off = htons(offset / 8);
181 } else {
182 frag_len = IP4_HLEN + max_frag_len;
183 iphdr->ip_off = htons(offset / 8 | IP4_MF);
184 }
185 iphdr->ip_len = htons(frag_len);
186 if (offset == 0)
187 memcpy(frag_start + UDP_HLEN, udp_payload,
188 frag_len - IP4_HLEN - UDP_HLEN);
189 else
190 memcpy(frag_start, udp_payload + payload_offset,
191 frag_len - IP4_HLEN);
192 }
193
194 res = sendto(fd_raw, ip_frame, frag_len, 0, addr, alen);
195 if (res < 0 && errno != EPERM)
196 error(1, errno, "send_fragment");
197 if (res >= 0 && res != frag_len)
198 error(1, 0, "send_fragment: %d vs %d", res, frag_len);
199
200 frag_counter++;
201}
202
203static void send_udp_frags(int fd_raw, struct sockaddr *addr,
204 socklen_t alen, bool ipv6)
205{
206 struct ip *iphdr = (struct ip *)ip_frame;
207 struct ip6_hdr *ip6hdr = (struct ip6_hdr *)ip_frame;
208 int res;
209 int offset;
210 int frag_len;
211
212 /* Send the UDP datagram using raw IP fragments: the 0th fragment
213 * has the UDP header; other fragments are pieces of udp_payload
214 * split in chunks of frag_len size.
215 *
216 * Odd fragments (1st, 3rd, 5th, etc.) are sent out first, then
217 * even fragments (0th, 2nd, etc.) are sent out.
218 */
219 if (ipv6) {
220 struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
221 ((struct sockaddr_in6 *)addr)->sin6_port = 0;
222 memset(ip6hdr, 0, sizeof(*ip6hdr));
223 ip6hdr->ip6_flow = htonl(6<<28); /* Version. */
224 ip6hdr->ip6_nxt = IPPROTO_FRAGMENT;
225 ip6hdr->ip6_hops = 255;
226 ip6hdr->ip6_src = addr6;
227 ip6hdr->ip6_dst = addr6;
228 fraghdr->ip6f_nxt = IPPROTO_UDP;
229 fraghdr->ip6f_reserved = 0;
230 fraghdr->ip6f_ident = htonl(ip_id++);
231 } else {
232 memset(iphdr, 0, sizeof(*iphdr));
233 iphdr->ip_hl = 5;
234 iphdr->ip_v = 4;
235 iphdr->ip_tos = 0;
236 iphdr->ip_id = htons(ip_id++);
237 iphdr->ip_ttl = 0x40;
238 iphdr->ip_p = IPPROTO_UDP;
239 iphdr->ip_src.s_addr = htonl(INADDR_LOOPBACK);
240 iphdr->ip_dst = addr4;
241 iphdr->ip_sum = 0;
242 }
243
244 /* Occasionally test in-order fragments. */
245 if (!cfg_overlap && (rand() % 100 < 15)) {
246 offset = 0;
247 while (offset < (UDP_HLEN + payload_len)) {
248 send_fragment(fd_raw, addr, alen, offset, ipv6);
249 offset += max_frag_len;
250 }
251 return;
252 }
253
254 /* Occasionally test IPv4 "runs" (see net/ipv4/ip_fragment.c) */
255 if (!cfg_overlap && (rand() % 100 < 20) &&
256 (payload_len > 9 * max_frag_len)) {
257 offset = 6 * max_frag_len;
258 while (offset < (UDP_HLEN + payload_len)) {
259 send_fragment(fd_raw, addr, alen, offset, ipv6);
260 offset += max_frag_len;
261 }
262 offset = 3 * max_frag_len;
263 while (offset < 6 * max_frag_len) {
264 send_fragment(fd_raw, addr, alen, offset, ipv6);
265 offset += max_frag_len;
266 }
267 offset = 0;
268 while (offset < 3 * max_frag_len) {
269 send_fragment(fd_raw, addr, alen, offset, ipv6);
270 offset += max_frag_len;
271 }
272 return;
273 }
274
275 /* Odd fragments. */
276 offset = max_frag_len;
277 while (offset < (UDP_HLEN + payload_len)) {
278 send_fragment(fd_raw, addr, alen, offset, ipv6);
279 /* IPv4 ignores duplicates, so randomly send a duplicate. */
280 if (rand() % 100 == 1)
281 send_fragment(fd_raw, addr, alen, offset, ipv6);
282 offset += 2 * max_frag_len;
283 }
284
285 if (cfg_overlap) {
286 /* Send an extra random fragment.
287 *
288 * Duplicates and some fragments completely inside
289 * previously sent fragments are dropped/ignored. So
290 * random offset and frag_len can result in a dropped
291 * fragment instead of a dropped queue/packet. Thus we
292 * hard-code offset and frag_len.
293 */
294 if (max_frag_len * 4 < payload_len || max_frag_len < 16) {
295 /* not enough payload for random offset and frag_len. */
296 offset = 8;
297 frag_len = UDP_HLEN + max_frag_len;
298 } else {
299 offset = rand() % (payload_len / 2);
300 frag_len = 2 * max_frag_len + 1 + rand() % 256;
301 }
302 if (ipv6) {
303 struct ip6_frag *fraghdr = (struct ip6_frag *)(ip_frame + IP6_HLEN);
304 /* sendto() returns EINVAL if offset + frag_len is too small. */
305 /* In IPv6 if !!(frag_len % 8), the fragment is dropped. */
306 frag_len &= ~0x7;
307 fraghdr->ip6f_offlg = htons(offset / 8 | IP6_MF);
308 ip6hdr->ip6_plen = htons(frag_len);
309 frag_len += IP6_HLEN;
310 } else {
311 frag_len += IP4_HLEN;
312 iphdr->ip_off = htons(offset / 8 | IP4_MF);
313 iphdr->ip_len = htons(frag_len);
314 }
315 res = sendto(fd_raw, ip_frame, frag_len, 0, addr, alen);
316 if (res < 0 && errno != EPERM)
317 error(1, errno, "sendto overlap: %d", frag_len);
318 if (res >= 0 && res != frag_len)
319 error(1, 0, "sendto overlap: %d vs %d", (int)res, frag_len);
320 frag_counter++;
321 }
322
323 /* Event fragments. */
324 offset = 0;
325 while (offset < (UDP_HLEN + payload_len)) {
326 send_fragment(fd_raw, addr, alen, offset, ipv6);
327 /* IPv4 ignores duplicates, so randomly send a duplicate. */
328 if (rand() % 100 == 1)
329 send_fragment(fd_raw, addr, alen, offset, ipv6);
330 offset += 2 * max_frag_len;
331 }
332}
333
334static void run_test(struct sockaddr *addr, socklen_t alen, bool ipv6)
335{
336 int fd_tx_raw, fd_rx_udp;
337 /* Frag queue timeout is set to one second in the calling script;
338 * socket timeout should be just a bit longer to avoid tests interfering
339 * with each other.
340 */
341 struct timeval tv = { .tv_sec = 1, .tv_usec = 10 };
342 int idx;
343 int min_frag_len = 8;
344
345 /* Initialize the payload. */
346 for (idx = 0; idx < MSG_LEN_MAX; ++idx)
347 udp_payload[idx] = idx % 256;
348
349 /* Open sockets. */
350 fd_tx_raw = socket(addr->sa_family, SOCK_RAW, IPPROTO_RAW);
351 if (fd_tx_raw == -1)
352 error(1, errno, "socket tx_raw");
353
354 fd_rx_udp = socket(addr->sa_family, SOCK_DGRAM, 0);
355 if (fd_rx_udp == -1)
356 error(1, errno, "socket rx_udp");
357 if (bind(fd_rx_udp, addr, alen))
358 error(1, errno, "bind");
359 /* Fail fast. */
360 if (setsockopt(fd_rx_udp, SOL_SOCKET, SO_RCVTIMEO, &tv, sizeof(tv)))
361 error(1, errno, "setsockopt rcv timeout");
362
363 for (payload_len = min_frag_len; payload_len < MSG_LEN_MAX;
364 payload_len += (rand() % 4096)) {
365 if (cfg_verbose)
366 printf("payload_len: %d\n", payload_len);
367
368 if (cfg_overlap) {
369 /* With overlaps, one send/receive pair below takes
370 * at least one second (== timeout) to run, so there
371 * is not enough test time to run a nested loop:
372 * the full overlap test takes 20-30 seconds.
373 */
374 max_frag_len = min_frag_len +
375 rand() % (1500 - FRAG_HLEN - min_frag_len);
376 send_udp_frags(fd_tx_raw, addr, alen, ipv6);
377 recv_validate_udp(fd_udp: fd_rx_udp);
378 } else {
379 /* Without overlaps, each packet reassembly (== one
380 * send/receive pair below) takes very little time to
381 * run, so we can easily afford more thourough testing
382 * with a nested loop: the full non-overlap test takes
383 * less than one second).
384 */
385 max_frag_len = min_frag_len;
386 do {
387 send_udp_frags(fd_tx_raw, addr, alen, ipv6);
388 recv_validate_udp(fd_udp: fd_rx_udp);
389 max_frag_len += 8 * (rand() % 8);
390 } while (max_frag_len < (1500 - FRAG_HLEN) &&
391 max_frag_len <= payload_len);
392 }
393 }
394
395 /* Cleanup. */
396 if (close(fd_tx_raw))
397 error(1, errno, "close tx_raw");
398 if (close(fd_rx_udp))
399 error(1, errno, "close rx_udp");
400
401 if (cfg_verbose)
402 printf("processed %d messages, %d fragments\n",
403 msg_counter, frag_counter);
404
405 fprintf(stderr, "PASS\n");
406}
407
408
409static void run_test_v4(void)
410{
411 struct sockaddr_in addr = {0};
412
413 addr.sin_family = AF_INET;
414 addr.sin_port = htons(cfg_port);
415 addr.sin_addr = addr4;
416
417 run_test((void *)&addr, sizeof(addr), false /* !ipv6 */);
418}
419
420static void run_test_v6(void)
421{
422 struct sockaddr_in6 addr = {0};
423
424 addr.sin6_family = AF_INET6;
425 addr.sin6_port = htons(cfg_port);
426 addr.sin6_addr = addr6;
427
428 run_test((void *)&addr, sizeof(addr), true /* ipv6 */);
429}
430
431static void parse_opts(int argc, char **argv)
432{
433 int c;
434
435 while ((c = getopt(argc, argv, "46opv")) != -1) {
436 switch (c) {
437 case '4':
438 cfg_do_ipv4 = true;
439 break;
440 case '6':
441 cfg_do_ipv6 = true;
442 break;
443 case 'o':
444 cfg_overlap = true;
445 break;
446 case 'p':
447 cfg_permissive = true;
448 break;
449 case 'v':
450 cfg_verbose = true;
451 break;
452 default:
453 error(1, 0, "%s: parse error", argv[0]);
454 }
455 }
456}
457
458int main(int argc, char **argv)
459{
460 parse_opts(argc, argv);
461 seed = time(NULL);
462 srand(seed);
463 /* Print the seed to track/reproduce potential failures. */
464 printf("seed = %d\n", seed);
465
466 if (cfg_do_ipv4)
467 run_test_v4();
468 if (cfg_do_ipv6)
469 run_test_v6();
470
471 return 0;
472}
473

source code of linux/tools/testing/selftests/net/ip_defrag.c