// SPDX-License-Identifier: GPL-2.0 /* Copyright (c) 2020, Tessares SA. */ /* Copyright (c) 2022, SUSE. */ #include #include #include #include #include "cgroup_helpers.h" #include "network_helpers.h" #include "mptcp_sock.skel.h" #include "mptcpify.skel.h" #include "mptcp_subflow.skel.h" #define NS_TEST "mptcp_ns" #define ADDR_1 "10.0.1.1" #define ADDR_2 "10.0.1.2" #define PORT_1 10001 #ifndef IPPROTO_MPTCP #define IPPROTO_MPTCP 262 #endif #ifndef SOL_MPTCP #define SOL_MPTCP 284 #endif #ifndef MPTCP_INFO #define MPTCP_INFO 1 #endif #ifndef MPTCP_INFO_FLAG_FALLBACK #define MPTCP_INFO_FLAG_FALLBACK _BITUL(0) #endif #ifndef MPTCP_INFO_FLAG_REMOTE_KEY_RECEIVED #define MPTCP_INFO_FLAG_REMOTE_KEY_RECEIVED _BITUL(1) #endif #ifndef TCP_CA_NAME_MAX #define TCP_CA_NAME_MAX 16 #endif struct __mptcp_info { __u8 mptcpi_subflows; __u8 mptcpi_add_addr_signal; __u8 mptcpi_add_addr_accepted; __u8 mptcpi_subflows_max; __u8 mptcpi_add_addr_signal_max; __u8 mptcpi_add_addr_accepted_max; __u32 mptcpi_flags; __u32 mptcpi_token; __u64 mptcpi_write_seq; __u64 mptcpi_snd_una; __u64 mptcpi_rcv_nxt; __u8 mptcpi_local_addr_used; __u8 mptcpi_local_addr_max; __u8 mptcpi_csum_enabled; __u32 mptcpi_retransmits; __u64 mptcpi_bytes_retrans; __u64 mptcpi_bytes_sent; __u64 mptcpi_bytes_received; __u64 mptcpi_bytes_acked; }; struct mptcp_storage { __u32 invoked; __u32 is_mptcp; struct sock *sk; __u32 token; struct sock *first; char ca_name[TCP_CA_NAME_MAX]; }; static int start_mptcp_server(int family, const char *addr_str, __u16 port, int timeout_ms) { struct network_helper_opts opts = { .timeout_ms = timeout_ms, .proto = IPPROTO_MPTCP, }; return start_server_str(family, SOCK_STREAM, addr_str, port, &opts); } static int verify_tsk(int map_fd, int client_fd) { int err, cfd = client_fd; struct mptcp_storage val; err = bpf_map_lookup_elem(map_fd, &cfd, &val); if (!ASSERT_OK(err, "bpf_map_lookup_elem")) return err; if (!ASSERT_EQ(val.invoked, 1, "unexpected invoked count")) err++; if (!ASSERT_EQ(val.is_mptcp, 0, "unexpected is_mptcp")) err++; return err; } static void get_msk_ca_name(char ca_name[]) { size_t len; int fd; fd = open("/proc/sys/net/ipv4/tcp_congestion_control", O_RDONLY); if (!ASSERT_GE(fd, 0, "failed to open tcp_congestion_control")) return; len = read(fd, ca_name, TCP_CA_NAME_MAX); if (!ASSERT_GT(len, 0, "failed to read ca_name")) goto err; if (len > 0 && ca_name[len - 1] == '\n') ca_name[len - 1] = '\0'; err: close(fd); } static int verify_msk(int map_fd, int client_fd, __u32 token) { char ca_name[TCP_CA_NAME_MAX]; int err, cfd = client_fd; struct mptcp_storage val; if (!ASSERT_GT(token, 0, "invalid token")) return -1; get_msk_ca_name(ca_name); err = bpf_map_lookup_elem(map_fd, &cfd, &val); if (!ASSERT_OK(err, "bpf_map_lookup_elem")) return err; if (!ASSERT_EQ(val.invoked, 1, "unexpected invoked count")) err++; if (!ASSERT_EQ(val.is_mptcp, 1, "unexpected is_mptcp")) err++; if (!ASSERT_EQ(val.token, token, "unexpected token")) err++; if (!ASSERT_EQ(val.first, val.sk, "unexpected first")) err++; if (!ASSERT_STRNEQ(val.ca_name, ca_name, TCP_CA_NAME_MAX, "unexpected ca_name")) err++; return err; } static int run_test(int cgroup_fd, int server_fd, bool is_mptcp) { int client_fd, prog_fd, map_fd, err; struct mptcp_sock *sock_skel; sock_skel = mptcp_sock__open_and_load(); if (!ASSERT_OK_PTR(sock_skel, "skel_open_load")) return libbpf_get_error(sock_skel); err = mptcp_sock__attach(sock_skel); if (!ASSERT_OK(err, "skel_attach")) goto out; prog_fd = bpf_program__fd(sock_skel->progs._sockops); map_fd = bpf_map__fd(sock_skel->maps.socket_storage_map); err = bpf_prog_attach(prog_fd, cgroup_fd, BPF_CGROUP_SOCK_OPS, 0); if (!ASSERT_OK(err, "bpf_prog_attach")) goto out; client_fd = connect_to_fd(server_fd, 0); if (!ASSERT_GE(client_fd, 0, "connect to fd")) { err = -EIO; goto out; } err += is_mptcp ? verify_msk(map_fd, client_fd, sock_skel->bss->token) : verify_tsk(map_fd, client_fd); close(client_fd); out: mptcp_sock__destroy(sock_skel); return err; } static void test_base(void) { struct netns_obj *netns = NULL; int server_fd, cgroup_fd; cgroup_fd = test__join_cgroup("/mptcp"); if (!ASSERT_GE(cgroup_fd, 0, "test__join_cgroup")) return; netns = netns_new(NS_TEST, true); if (!ASSERT_OK_PTR(netns, "netns_new")) goto fail; /* without MPTCP */ server_fd = start_server(AF_INET, SOCK_STREAM, NULL, 0, 0); if (!ASSERT_GE(server_fd, 0, "start_server")) goto with_mptcp; ASSERT_OK(run_test(cgroup_fd, server_fd, false), "run_test tcp"); close(server_fd); with_mptcp: /* with MPTCP */ server_fd = start_mptcp_server(AF_INET, NULL, 0, 0); if (!ASSERT_GE(server_fd, 0, "start_mptcp_server")) goto fail; ASSERT_OK(run_test(cgroup_fd, server_fd, true), "run_test mptcp"); close(server_fd); fail: netns_free(netns); close(cgroup_fd); } static void send_byte(int fd) { char b = 0x55; ASSERT_EQ(write(fd, &b, sizeof(b)), 1, "send single byte"); } static int verify_mptcpify(int server_fd, int client_fd) { struct __mptcp_info info; socklen_t optlen; int protocol; int err = 0; optlen = sizeof(protocol); if (!ASSERT_OK(getsockopt(server_fd, SOL_SOCKET, SO_PROTOCOL, &protocol, &optlen), "getsockopt(SOL_PROTOCOL)")) return -1; if (!ASSERT_EQ(protocol, IPPROTO_MPTCP, "protocol isn't MPTCP")) err++; optlen = sizeof(info); if (!ASSERT_OK(getsockopt(client_fd, SOL_MPTCP, MPTCP_INFO, &info, &optlen), "getsockopt(MPTCP_INFO)")) return -1; if (!ASSERT_GE(info.mptcpi_flags, 0, "unexpected mptcpi_flags")) err++; if (!ASSERT_FALSE(info.mptcpi_flags & MPTCP_INFO_FLAG_FALLBACK, "MPTCP fallback")) err++; if (!ASSERT_TRUE(info.mptcpi_flags & MPTCP_INFO_FLAG_REMOTE_KEY_RECEIVED, "no remote key received")) err++; return err; } static int run_mptcpify(int cgroup_fd) { int server_fd, client_fd, err = 0; struct mptcpify *mptcpify_skel; mptcpify_skel = mptcpify__open_and_load(); if (!ASSERT_OK_PTR(mptcpify_skel, "skel_open_load")) return libbpf_get_error(mptcpify_skel); mptcpify_skel->bss->pid = getpid(); err = mptcpify__attach(mptcpify_skel); if (!ASSERT_OK(err, "skel_attach")) goto out; /* without MPTCP */ server_fd = start_server(AF_INET, SOCK_STREAM, NULL, 0, 0); if (!ASSERT_GE(server_fd, 0, "start_server")) { err = -EIO; goto out; } client_fd = connect_to_fd(server_fd, 0); if (!ASSERT_GE(client_fd, 0, "connect to fd")) { err = -EIO; goto close_server; } send_byte(client_fd); err = verify_mptcpify(server_fd, client_fd); close(client_fd); close_server: close(server_fd); out: mptcpify__destroy(mptcpify_skel); return err; } static void test_mptcpify(void) { struct netns_obj *netns = NULL; int cgroup_fd; cgroup_fd = test__join_cgroup("/mptcpify"); if (!ASSERT_GE(cgroup_fd, 0, "test__join_cgroup")) return; netns = netns_new(NS_TEST, true); if (!ASSERT_OK_PTR(netns, "netns_new")) goto fail; ASSERT_OK(run_mptcpify(cgroup_fd), "run_mptcpify"); fail: netns_free(netns); close(cgroup_fd); } static int endpoint_init(char *flags) { SYS(fail, "ip -net %s link add veth1 type veth peer name veth2", NS_TEST); SYS(fail, "ip -net %s addr add %s/24 dev veth1", NS_TEST, ADDR_1); SYS(fail, "ip -net %s link set dev veth1 up", NS_TEST); SYS(fail, "ip -net %s addr add %s/24 dev veth2", NS_TEST, ADDR_2); SYS(fail, "ip -net %s link set dev veth2 up", NS_TEST); if (SYS_NOFAIL("ip -net %s mptcp endpoint add %s %s", NS_TEST, ADDR_2, flags)) { printf("'ip mptcp' not supported, skip this test.\n"); test__skip(); goto fail; } return 0; fail: return -1; } static void wait_for_new_subflows(int fd) { socklen_t len; u8 subflows; int err, i; len = sizeof(subflows); /* Wait max 5 sec for new subflows to be created */ for (i = 0; i < 50; i++) { err = getsockopt(fd, SOL_MPTCP, MPTCP_INFO, &subflows, &len); if (!err && subflows > 0) break; usleep(100000); /* 0.1s */ } } static void run_subflow(void) { int server_fd, client_fd, err; char new[TCP_CA_NAME_MAX]; char cc[TCP_CA_NAME_MAX]; unsigned int mark; socklen_t len; server_fd = start_mptcp_server(AF_INET, ADDR_1, PORT_1, 0); if (!ASSERT_OK_FD(server_fd, "start_mptcp_server")) return; client_fd = connect_to_fd(server_fd, 0); if (!ASSERT_OK_FD(client_fd, "connect_to_fd")) goto close_server; send_byte(client_fd); wait_for_new_subflows(client_fd); len = sizeof(mark); err = getsockopt(client_fd, SOL_SOCKET, SO_MARK, &mark, &len); if (ASSERT_OK(err, "getsockopt(client_fd, SO_MARK)")) ASSERT_EQ(mark, 0, "mark"); len = sizeof(new); err = getsockopt(client_fd, SOL_TCP, TCP_CONGESTION, new, &len); if (ASSERT_OK(err, "getsockopt(client_fd, TCP_CONGESTION)")) { get_msk_ca_name(cc); ASSERT_STREQ(new, cc, "cc"); } close(client_fd); close_server: close(server_fd); } static void test_subflow(void) { struct mptcp_subflow *skel; struct netns_obj *netns; int cgroup_fd; cgroup_fd = test__join_cgroup("/mptcp_subflow"); if (!ASSERT_OK_FD(cgroup_fd, "join_cgroup: mptcp_subflow")) return; skel = mptcp_subflow__open_and_load(); if (!ASSERT_OK_PTR(skel, "skel_open_load: mptcp_subflow")) goto close_cgroup; skel->bss->pid = getpid(); skel->links.mptcp_subflow = bpf_program__attach_cgroup(skel->progs.mptcp_subflow, cgroup_fd); if (!ASSERT_OK_PTR(skel->links.mptcp_subflow, "attach mptcp_subflow")) goto skel_destroy; skel->links._getsockopt_subflow = bpf_program__attach_cgroup(skel->progs._getsockopt_subflow, cgroup_fd); if (!ASSERT_OK_PTR(skel->links._getsockopt_subflow, "attach _getsockopt_subflow")) goto skel_destroy; netns = netns_new(NS_TEST, true); if (!ASSERT_OK_PTR(netns, "netns_new: mptcp_subflow")) goto skel_destroy; if (endpoint_init("subflow") < 0) goto close_netns; run_subflow(); close_netns: netns_free(netns); skel_destroy: mptcp_subflow__destroy(skel); close_cgroup: close(cgroup_fd); } void test_mptcp(void) { if (test__start_subtest("base")) test_base(); if (test__start_subtest("mptcpify")) test_mptcpify(); if (test__start_subtest("subflow")) test_subflow(); }