1 // SPDX-License-Identifier: GPL-2.0
20 #include <sys/socket.h>
21 #include <sys/types.h>
25 #include <netinet/in.h>
27 #include <linux/tcp.h>
/* Address family copied into hints.ai_family before each getaddrinfo() lookup; starts out as IPv4. */
29 static int pf = AF_INET;
/* Protocol value handed to socket() when the MPTCP listener and client sockets are created. */
32 #define IPPROTO_MPTCP 262
/*
 * Members of a structure whose opening line is not part of this listing
 * (presumably struct mptcp_info -- TODO confirm).
 * mptcpi_write_seq is the member the MPTCP_INFO check compares against the
 * number of bytes written so far.
 */
41 __u8 mptcpi_add_addr_signal;
42 __u8 mptcpi_add_addr_accepted;
43 __u8 mptcpi_subflows_max;
44 __u8 mptcpi_add_addr_signal_max;
45 __u8 mptcpi_add_addr_accepted_max;
48 __u64 mptcpi_write_seq;
51 __u8 mptcpi_local_addr_used;
52 __u8 mptcpi_local_addr_max;
53 __u8 mptcpi_csum_enabled;
/*
 * Header placed in front of the per-subflow array exchanged through
 * getsockopt(SOL_MPTCP, MPTCP_TCPINFO / MPTCP_SUBFLOW_ADDRS).
 * The caller fills size_subflow_data and size_user and leaves the other two
 * members at zero; the tests in this file expect the call to fail when
 * num_subflows or size_kernel is non-zero on input.
 */
56 struct mptcp_subflow_data {
57 __u32 size_subflow_data; /* size of this structure in userspace */
58 __u32 num_subflows; /* must be 0, set by kernel */
59 __u32 size_kernel; /* must be 0, set by kernel */
60 __u32 size_user; /* size of one element in data[] */
61 } __attribute__((aligned(8)));
/*
 * One element of the MPTCP_SUBFLOW_ADDRS result: the local and the remote
 * address of a subflow.
 * The lines that group these members are not part of this listing; the
 * *_local and *_remote members look like alternative views of one address
 * each (presumably unions -- TODO confirm).
 * The tests read sa_family and compare ss_local / ss_remote with the results
 * of getsockname() / getpeername().
 */
63 struct mptcp_subflow_addrs {
65 __kernel_sa_family_t sa_family;
66 struct sockaddr sa_local;
67 struct sockaddr_in sin_local;
68 struct sockaddr_in6 sin6_local;
69 struct __kernel_sockaddr_storage ss_local;
72 struct sockaddr sa_remote;
73 struct sockaddr_in sin_remote;
74 struct sockaddr_in6 sin6_remote;
75 struct __kernel_sockaddr_storage ss_remote;
/* Option names used with getsockopt(fd, SOL_MPTCP, ...) to fetch per-subflow tcp_info and per-subflow addresses. */
80 #define MPTCP_TCPINFO 2
81 #define MPTCP_SUBFLOW_ADDRS 3
/*
 * Members of struct so_state (its opening line is not part of this listing).
 * mptcpi_rcv_delta: difference between the current and the saved
 *                   mptcpi_rcv_nxt, stored by the MPTCP_INFO check.
 * tcpi_rcv_delta:   tcpi_bytes_received of the first subflow, stored by the
 *                   MPTCP_TCPINFO check when data arrived although none was
 *                   expected yet.
 */
86 uint64_t mptcpi_rcv_delta;
87 uint64_t tcpi_rcv_delta;
/* Smaller of two values. Each argument may be evaluated twice, so pass side-effect-free expressions only. */
91 #define MIN(a, b) ((a) < (b) ? (a) : (b))
/*
 * Fatal-error helper taking the name of the failing call; only the signature
 * is part of this listing. Call sites invoke it right after a system call
 * failed (listen, connect, accept, ...), so it presumably prints msg together
 * with the errno text and exits -- TODO confirm against the body.
 */
94 static void die_perror(const char *msg)
/*
 * Print the command-line synopsis to stderr; -6 is the only option it
 * advertises. r is presumably the exit status -- TODO confirm, the rest of
 * the body is not shown.
 */
100 static void die_usage(int r)
102 fprintf(stderr, "Usage: mptcp_sockopt [-6]\n");
/*
 * printf-style error reporter: formats fmt and the variadic arguments to
 * stderr with vfprintf(). Callers use it for conditions the test cannot
 * recover from; whether it terminates the process is not visible in this
 * listing -- TODO confirm.
 */
106 static void xerror(const char *fmt, ...)
111 vfprintf(stderr, fmt, ap);
/*
 * Translate a getaddrinfo() error code into a message.
 * EAI_SYSTEM means the real cause is in errno, so strerror(errno) is used;
 * every other code goes through gai_strerror().
 */
117 static const char *getxinfo_strerr(int err)
119 if (err == EAI_SYSTEM)
120 return strerror(errno);
122 return gai_strerror(err);
/*
 * getaddrinfo() wrapper with built-in error reporting.
 * Arguments are forwarded unchanged. On the error path the failure is
 * written to stderr as "Fatal: getaddrinfo(node:service): reason", with a
 * NULL node or service printed as an empty string. The guard around the
 * report and whatever follows it are not part of this listing.
 */
125 static void xgetaddrinfo(const char *node, const char *service,
126 const struct addrinfo *hints,
127 struct addrinfo **res)
129 int err = getaddrinfo(node, service, hints, res);
132 const char *errstr = getxinfo_strerr(err);
134 fprintf(stderr, "Fatal: getaddrinfo(%s:%s): %s\n",
135 node ? node : "", service ? service : "", errstr);
/*
 * Create a listening MPTCP socket on listenaddr:port.
 *
 * The address is resolved as a numeric, passive stream address of family pf.
 * For each result an IPPROTO_MPTCP socket is created, SO_REUSEADDR is
 * requested (a failure there is only reported with perror()) and bind() is
 * attempted. The chosen socket is put into listening state with a backlog
 * of 20; a listen() failure is fatal.
 */
140 static int sock_listen_mptcp(const char * const listenaddr,
141 const char * const port)
144 struct addrinfo hints = {
145 .ai_protocol = IPPROTO_TCP,
146 .ai_socktype = SOCK_STREAM,
147 .ai_flags = AI_PASSIVE | AI_NUMERICHOST
150 hints.ai_family = pf;
152 struct addrinfo *a, *addr;
155 xgetaddrinfo(listenaddr, port, &hints, &addr);
/* NOTE(review): repeats the store made before the lookup; looks redundant -- confirm and drop. */
156 hints.ai_family = pf;
158 for (a = addr; a; a = a->ai_next) {
159 sock = socket(a->ai_family, a->ai_socktype, IPPROTO_MPTCP);
163 if (-1 == setsockopt(sock, SOL_SOCKET, SO_REUSEADDR, &one,
165 perror("setsockopt");
167 if (bind(sock, a->ai_addr, a->ai_addrlen) == 0)
178 xerror("could not create listen socket");
180 if (listen(sock, 20))
181 die_perror("listen");
/*
 * Connect a stream socket of protocol proto to remoteaddr:port.
 *
 * The address is resolved for family pf; each result is tried in turn with
 * socket() followed by connect(). A connect() failure is reported through
 * die_perror(), and xerror() reports the case where no socket could be set
 * up (the exact conditions are on lines not shown here).
 */
186 static int sock_connect_mptcp(const char * const remoteaddr,
187 const char * const port, int proto)
189 struct addrinfo hints = {
190 .ai_protocol = IPPROTO_TCP,
191 .ai_socktype = SOCK_STREAM,
193 struct addrinfo *a, *addr;
196 hints.ai_family = pf;
198 xgetaddrinfo(remoteaddr, port, &hints, &addr);
199 for (a = addr; a; a = a->ai_next) {
200 sock = socket(a->ai_family, a->ai_socktype, proto);
204 if (connect(sock, a->ai_addr, a->ai_addrlen) == 0)
207 die_perror("connect");
211 xerror("could not create connect socket");
/*
 * Command-line parsing: getopt() accepts the flags -h and -6. What each flag
 * does is handled on lines that are not part of this listing.
 */
217 static void parse_opts(int argc, char **argv)
221 while ((c = getopt(argc, argv, "h6")) != -1) {
/*
 * Negative and compatibility checks for the struct mptcp_subflow_data header
 * handling of getsockopt(SOL_MPTCP, optname).
 *
 * fd:      socket under test
 * optname: option to query; callers pass MPTCP_TCPINFO or MPTCP_SUBFLOW_ADDRS
 *
 * Every expectation is enforced with assert(). Several statements that
 * prepare bd between the calls are not part of this listing, so the inline
 * notes below only describe what the visible lines establish.
 */
236 static void do_getsockopt_bogus_sf_data(int fd, int optname)
238 struct mptcp_subflow_data good_data;
240 struct mptcp_subflow_data d;
243 socklen_t olen, _olen;
246 memset(&bd, 0, sizeof(bd));
247 memset(&good_data, 0, sizeof(good_data));
249 olen = sizeof(good_data);
250 good_data.size_subflow_data = olen;
/* bd is still all zeroes, i.e. it announces a header size of 0: must be refused, olen untouched */
252 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
253 assert(ret < 0); /* 0 size_subflow_data */
254 assert(olen == sizeof(good_data));
/* header-only query: one subflow reported, kernel element size filled in, size_user left at 0 */
258 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
260 assert(olen == sizeof(good_data));
261 assert(bd.d.num_subflows == 1);
262 assert(bd.d.size_kernel > 0);
263 assert(bd.d.size_user == 0);
/* a random length shorter than the header must be refused without modifying it */
266 _olen = rand() % olen;
268 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
269 assert(ret < 0); /* bogus olen */
270 assert(olen == _olen); /* must be unchanged */
/* members reserved for the kernel must be zero on input */
273 olen = sizeof(good_data);
274 bd.d.size_kernel = 1;
275 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
276 assert(ret < 0); /* size_kernel not 0 */
279 olen = sizeof(good_data);
280 bd.d.num_subflows = 1;
281 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
282 assert(ret < 0); /* num_subflows not 0 */
284 /* forward compat check: larger struct mptcp_subflow_data on 'old' kernel */
287 bd.d.size_subflow_data = sizeof(bd);
289 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &olen);
292 /* olen must be truncated to real data size filled by kernel: */
293 assert(olen == sizeof(good_data));
/* the size announced by userspace is not rewritten by the kernel */
295 assert(bd.d.size_subflow_data == sizeof(bd));
/* announce a header one byte larger and offer one more byte of room after it */
298 bd.d.size_subflow_data += 1;
300 olen = bd.d.size_subflow_data + 1;
303 ret = getsockopt(fd, SOL_MPTCP, optname, &bd, &_olen);
306 /* no truncation, kernel should have filled 1 byte of optname payload in buf[1]: */
307 assert(olen == _olen);
309 assert(bd.d.size_subflow_data == sizeof(good_data) + 1);
/* the extra header byte itself must still be zero */
310 assert(bd.buf[0] == 0);
/*
 * Fetch MPTCP_INFO for fd and validate it against the saved state.
 *
 * s:  per-connection state; s->mi holds an earlier snapshot and
 *     s->mptcpi_rcv_delta receives the rcv_nxt advance since that snapshot
 * fd: socket under test
 * w:  number of bytes written since the snapshot
 *
 * A getsockopt() failure is fatal. The returned length must equal the size
 * of the local info structure, and the write sequence must have advanced by
 * exactly w. The statement guarded by the "write_seq == 0" test is not part
 * of this listing (presumably it stores the first snapshot -- TODO confirm).
 */
313 static void do_getsockopt_mptcp_info(struct so_state *s, int fd, size_t w)
320 ret = getsockopt(fd, SOL_MPTCP, MPTCP_INFO, &i, &olen);
323 die_perror("getsockopt MPTCP_INFO");
325 assert(olen == sizeof(i));
327 if (s->mi.mptcpi_write_seq == 0)
330 assert(s->mi.mptcpi_write_seq + w == i.mptcpi_write_seq);
332 s->mptcpi_rcv_delta = i.mptcpi_rcv_nxt - s->mi.mptcpi_rcv_nxt;
/*
 * Fetch MPTCP_TCPINFO for fd and check the byte counters of the first subflow.
 *
 * s:  per-connection state; s->tcpi_rcv_delta is set when bytes were received
 *     although r is 0
 * fd: socket under test
 * r:  number of bytes expected in tcpi_bytes_received
 * w:  number of bytes expected in tcpi_bytes_sent
 *
 * The query is repeated while `tries` lasts because transmission may still be
 * in progress. Each round checks the header returned by the kernel: exactly
 * one subflow, size_user clamped to MIN(size_kernel, sizeof(struct tcp_info)),
 * and a returned length of header plus one element. If the counters never
 * match, xerror() reports the last values seen.
 */
335 static void do_getsockopt_tcp_info(struct so_state *s, int fd, size_t r, size_t w)
338 struct mptcp_subflow_data d;
339 struct tcp_info ti[2];
345 memset(&ti, 0, sizeof(ti));
347 ti.d.size_subflow_data = sizeof(struct mptcp_subflow_data);
348 ti.d.size_user = sizeof(struct tcp_info);
351 ret = getsockopt(fd, SOL_MPTCP, MPTCP_TCPINFO, &ti, &olen);
/* the %d conversion needs its argument: report the remaining retry budget */
353 xerror("getsockopt MPTCP_TCPINFO (tries %d, %m)", tries);
355 assert(olen <= sizeof(ti));
356 assert(ti.d.size_kernel > 0);
357 assert(ti.d.size_user ==
358 MIN(ti.d.size_kernel, sizeof(struct tcp_info)));
359 assert(ti.d.num_subflows == 1);
/* what remains after the header must be exactly one element */
361 assert(olen > (socklen_t)sizeof(struct mptcp_subflow_data));
362 olen -= sizeof(struct mptcp_subflow_data);
363 assert(olen == ti.d.size_user);
365 if (ti.ti[0].tcpi_bytes_sent == w &&
366 ti.ti[0].tcpi_bytes_received == r)
/* nothing expected on the receive side yet, but data already arrived: remember how much */
369 if (r == 0 && ti.ti[0].tcpi_bytes_sent == w &&
370 ti.ti[0].tcpi_bytes_received) {
371 s->tcpi_rcv_delta = ti.ti[0].tcpi_bytes_received;
375 /* wait and repeat, might be that tx is still ongoing */
377 } while (tries-- > 0);
379 xerror("tcpi_bytes_sent %" PRIu64 ", want %zu. tcpi_bytes_received %" PRIu64 ", want %zu",
380 ti.ti[0].tcpi_bytes_sent, w, ti.ti[0].tcpi_bytes_received, r);
383 do_getsockopt_bogus_sf_data(fd, MPTCP_TCPINFO);
/*
 * Validate MPTCP_SUBFLOW_ADDRS for fd.
 *
 * First query: room for full struct mptcp_subflow_addrs elements. The header
 * must report one subflow and a size_user clamped to
 * MIN(size_kernel, sizeof(struct mptcp_subflow_addrs)); the returned local and
 * remote addresses must match getsockname() / getpeername() byte for byte.
 *
 * Second query: size_user is limited to sizeof(sa_family_t), so only the
 * address family may be written. The family must equal pf and the local
 * family, while the full address comparison must now differ.
 *
 * Finishes with the malformed-header checks for this option.
 */
386 static void do_getsockopt_subflow_addrs(int fd)
388 struct sockaddr_storage remote, local;
389 socklen_t olen, rlen, llen;
392 struct mptcp_subflow_data d;
393 struct mptcp_subflow_addrs addr[2];
396 memset(&addrs, 0, sizeof(addrs));
397 memset(&local, 0, sizeof(local));
398 memset(&remote, 0, sizeof(remote));
400 addrs.d.size_subflow_data = sizeof(struct mptcp_subflow_data);
401 addrs.d.size_user = sizeof(struct mptcp_subflow_addrs);
402 olen = sizeof(addrs);
404 ret = getsockopt(fd, SOL_MPTCP, MPTCP_SUBFLOW_ADDRS, &addrs, &olen);
406 die_perror("getsockopt MPTCP_SUBFLOW_ADDRS");
408 assert(olen <= sizeof(addrs));
409 assert(addrs.d.size_kernel > 0);
410 assert(addrs.d.size_user ==
411 MIN(addrs.d.size_kernel, sizeof(struct mptcp_subflow_addrs)));
412 assert(addrs.d.num_subflows == 1);
/* what remains after the header must be exactly one element */
414 assert(olen > (socklen_t)sizeof(struct mptcp_subflow_data));
415 olen -= sizeof(struct mptcp_subflow_data);
416 assert(olen == addrs.d.size_user);
418 llen = sizeof(local);
419 ret = getsockname(fd, (struct sockaddr *)&local, &llen);
421 die_perror("getsockname");
422 rlen = sizeof(remote);
423 ret = getpeername(fd, (struct sockaddr *)&remote, &rlen);
425 die_perror("getpeername");
428 assert(rlen == llen);
430 assert(remote.ss_family == local.ss_family);
/* local and remote were zeroed beforehand, so a whole-storage comparison is meaningful */
432 assert(memcmp(&local, &addrs.addr[0].ss_local, sizeof(local)) == 0);
433 assert(memcmp(&remote, &addrs.addr[0].ss_remote, sizeof(remote)) == 0);
435 memset(&addrs, 0, sizeof(addrs));
/* second round: offer room for the address family only */
437 addrs.d.size_subflow_data = sizeof(struct mptcp_subflow_data);
438 addrs.d.size_user = sizeof(sa_family_t);
439 olen = sizeof(addrs.d) + sizeof(sa_family_t);
441 ret = getsockopt(fd, SOL_MPTCP, MPTCP_SUBFLOW_ADDRS, &addrs, &olen);
443 assert(olen == sizeof(addrs.d) + sizeof(sa_family_t));
445 assert(addrs.addr[0].sa_family == pf);
446 assert(addrs.addr[0].sa_family == local.ss_family);
/* nothing beyond the family may have been copied */
448 assert(memcmp(&local, &addrs.addr[0].ss_local, sizeof(local)) != 0);
449 assert(memcmp(&remote, &addrs.addr[0].ss_remote, sizeof(remote)) != 0);
451 do_getsockopt_bogus_sf_data(fd, MPTCP_SUBFLOW_ADDRS);
/*
 * Run all getsockopt checks on fd: MPTCP_INFO (expects w bytes written),
 * MPTCP_TCPINFO (expects r bytes received and w bytes sent) and
 * MPTCP_SUBFLOW_ADDRS. s carries state between successive invocations.
 */
454 static void do_getsockopts(struct so_state *s, int fd, size_t r, size_t w)
456 do_getsockopt_mptcp_info(s, fd, w);
458 do_getsockopt_tcp_info(s, fd, r, w);
460 do_getsockopt_subflow_addrs(fd);
/*
 * Client half of the data exchange.
 *
 * fd:     connected socket
 * pipefd: pipe on which the peer process announces "xmit"
 *
 * Steps visible in this listing: build a random payload of fewer than
 * sizeof(buf) - 1 bytes, run the sockopt checks with no traffic expected,
 * wait for the "xmit" token, write the payload, read the reply into buf2
 * until at least len bytes arrived, verify it matches what was sent, and run
 * the sockopt checks again. The final receive-sequence delta must equal the
 * number of bytes read plus one for the FIN.
 */
463 static void connect_one_server(int fd, int pipefd)
465 char buf[4096], buf2[4096];
466 size_t len, i, total;
471 memset(&s, 0, sizeof(s));
473 len = rand() % (sizeof(buf) - 1);
478 for (i = 0; i < len ; i++) {
479 buf[i] = rand() % 26;
485 do_getsockopts(&s, fd, 0, 0);
487 /* un-block server */
488 ret = read(pipefd, buf2, 4);
492 assert(strncmp(buf2, "xmit", 4) == 0);
494 ret = write(fd, buf, len);
498 if (ret != (ssize_t)len)
499 xerror("short write");
503 ret = read(fd, buf2 + total, sizeof(buf2) - total);
512 } while (total < len);
/* total and len are size_t: %zu is the matching conversion on every ABI */
515 xerror("total %zu, len %zu eof %d\n", total, len, eof);
517 if (memcmp(buf, buf2, len))
518 xerror("data corruption");
520 if (s.tcpi_rcv_delta)
521 assert(s.tcpi_rcv_delta <= total);
523 do_getsockopts(&s, fd, ret, ret);
526 total += 1; /* sequence advances due to FIN */
528 assert(s.mptcpi_rcv_delta == (uint64_t)total);
/*
 * Server half of the data exchange.
 *
 * fd:     accepted connection
 * pipefd: pipe used to tell the client to start transmitting
 *
 * Steps visible in this listing: run the sockopt checks with no traffic
 * expected, send "xmit" on the pipe, read the client's data, echo it back,
 * wait for the client to hang up, then run the sockopt checks with the byte
 * counts seen. The receive-sequence delta must be the number of bytes read
 * plus one.
 */
532 static void process_one_client(int fd, int pipefd)
534 ssize_t ret, ret2, ret3;
538 memset(&s, 0, sizeof(s));
539 do_getsockopts(&s, fd, 0, 0);
541 ret = write(pipefd, "xmit", 4);
544 ret = read(fd, buf, sizeof(buf));
548 assert(s.mptcpi_rcv_delta <= (uint64_t)ret);
550 if (s.tcpi_rcv_delta)
551 assert(s.tcpi_rcv_delta == (uint64_t)ret);
553 ret2 = write(fd, buf, ret);
557 /* wait for hangup */
558 ret3 = read(fd, buf, 1);
/* ret3 is a signed ssize_t: print it with %zd */
560 xerror("expected EOF, got %zd", ret3);
562 do_getsockopts(&s, fd, ret, ret2);
563 if (s.mptcpi_rcv_delta != (uint64_t)ret + 1)
/* exactly one argument per conversion, each of the 64-bit unsigned type PRIu64 expects */
564 xerror("mptcpi_rcv_delta %" PRIu64 ", expect %" PRIu64, s.mptcpi_rcv_delta, (uint64_t)ret + 1);
/*
 * accept() wrapper: takes the next connection from listening socket s
 * without asking for the peer address and treats a failure as fatal.
 */
568 static int xaccept(int s)
570 int fd = accept(s, NULL, 0);
573 die_perror("accept");
/*
 * Server process body.
 *
 * Listens on port 15432 of the loopback address (127.0.0.1 or ::1; an
 * unexpected pf is reported with xerror()), announces readiness by writing
 * "conn" to pipefd and then serves one client. The selection logic between
 * the two addresses and the accept step are on lines not shown here.
 */
578 static int server(int pipefd)
584 fd = sock_listen_mptcp("127.0.0.1", "15432");
587 fd = sock_listen_mptcp("::1", "15432");
590 xerror("Unknown pf %d\n", pf);
594 r = write(pipefd, "conn", 4);
600 process_one_client(r, pipefd);
/*
 * Check IP_TOS handling on fd.
 *
 * 1. Set a random TOS value (two low bits cleared) and read it back: the
 *    value must round-trip and, per the error text, be one byte long.
 * 2. Query again expecting success and a resulting option length of 0.
 * 3. Query once more expecting the call to be refused with EINVAL and the
 *    length to stay at -1.
 *
 * The statements that set the option length before each query are not part
 * of this listing; the expectations above are taken from the error messages.
 */
605 static void test_ip_tos_sockopt(int fd)
607 uint8_t tos_in, tos_out;
611 tos_in = rand() & 0xfc;
/* size of the object actually passed in */
612 r = setsockopt(fd, SOL_IP, IP_TOS, &tos_in, sizeof(tos_in));
614 die_perror("setsockopt IP_TOS");
618 r = getsockopt(fd, SOL_IP, IP_TOS, &tos_out, &s);
620 die_perror("getsockopt IP_TOS");
622 if (tos_in != tos_out)
623 xerror("tos %x != %x socklen_t %d\n", tos_in, tos_out, s);
626 xerror("tos should be 1 byte");
629 r = getsockopt(fd, SOL_IP, IP_TOS, &tos_out, &s);
631 die_perror("getsockopt IP_TOS 0");
633 xerror("expect socklen_t == 0");
636 r = getsockopt(fd, SOL_IP, IP_TOS, &tos_out, &s);
/* the call must fail AND the reason must be EINVAL; errno is only consulted when r == -1 */
637 if (r != -1 || errno != EINVAL)
638 die_perror("getsockopt IP_TOS did not indicate -EINVAL");
640 xerror("expect socklen_t == -1");
/*
 * Client process body.
 *
 * Connects an MPTCP socket to port 15432 on the loopback address (127.0.0.1
 * or ::1; an unexpected pf is reported with xerror()), runs the IP_TOS checks
 * on it and then performs the data exchange with the server. pipefd is passed
 * on to the exchange.
 */
643 static int client(int pipefd)
651 fd = sock_connect_mptcp("127.0.0.1", "15432", IPPROTO_MPTCP);
654 fd = sock_connect_mptcp("::1", "15432", IPPROTO_MPTCP);
657 xerror("Unknown pf %d\n", pf);
660 test_ip_tos_sockopt(fd);
662 connect_one_server(fd, pipefd);
/* Only the signature is part of this listing; presumably a fork() wrapper that treats failure as fatal -- TODO confirm. */
667 static pid_t xfork(void)
/*
 * Interpret a waitpid() status for the child named by what.
 *
 * A normal exit with a non-zero status is logged to stderr and that status is
 * returned. Termination or stop by a signal is reported through xerror().
 * The return values for the remaining paths are on lines not shown here.
 */
677 static int rcheck(int wstatus, const char *what)
679 if (WIFEXITED(wstatus)) {
680 if (WEXITSTATUS(wstatus) == 0)
682 fprintf(stderr, "%s exited, status=%d\n", what, WEXITSTATUS(wstatus));
683 return WEXITSTATUS(wstatus);
684 } else if (WIFSIGNALED(wstatus)) {
685 xerror("%s killed by signal %d\n", what, WTERMSIG(wstatus));
686 } else if (WIFSTOPPED(wstatus)) {
687 xerror("%s stopped by signal %d\n", what, WSTOPSIG(wstatus));
/*
 * Read sizeof(foo) bytes from /dev/urandom into foo and assert that the read
 * was complete. The use made of foo is not part of this listing (presumably
 * it seeds rand() -- TODO confirm).
 */
693 static void init_rng(void)
695 int fd = open("/dev/urandom", O_RDONLY);
702 ret = read(fd, &foo, sizeof(foo));
703 assert(ret == sizeof(foo));
/*
 * Test driver: parses the options, runs server() and client() on opposite
 * ends of a pipe (the process creation itself is on lines not shown here),
 * waits for both children and evaluates their exit status with rcheck().
 * The client is only started after the server has written to the pipe.
 */
712 int main(int argc, char *argv[])
718 parse_opts(argc, argv);
728 return server(pipefds[1]);
/*
 * NOTE(review): e1 is used both as the 4-byte read buffer and as the holder
 * of read()'s return value, so the received bytes are overwritten at once.
 * This only works while sizeof(e1) >= 4; a separate buffer would be clearer.
 */
732 /* wait until server bound a socket */
733 e1 = read(pipefds[0], &e1, 4);
738 return client(pipefds[0]);
742 ret = waitpid(s, &wstatus, 0);
744 die_perror("waitpid");
745 e1 = rcheck(wstatus, "server");
746 ret = waitpid(c, &wstatus, 0);
748 die_perror("waitpid");
749 e2 = rcheck(wstatus, "client");