xref: /openbmc/linux/tools/testing/selftests/net/reuseport_bpf.c (revision 4f2c0a4acffbec01079c28f839422e64ddeff004)
/*
 * Test functionality of BPF filters for SO_REUSEPORT.  The tests below will use
 * a BPF program (both classic and extended) to read the first word from an
 * incoming packet (expected to be in network byte-order), calculate a modulus
 * of that number, and then dispatch the packet to the Nth socket using the
 * result.  These tests are run for each supported address family and protocol.
 * Additionally, a few edge cases in the implementation are tested.
 */
93ca8e402SCraig Gallek 
103ca8e402SCraig Gallek #include <errno.h>
113ca8e402SCraig Gallek #include <error.h>
124b2a6aedSCraig Gallek #include <fcntl.h>
133ca8e402SCraig Gallek #include <linux/bpf.h>
143ca8e402SCraig Gallek #include <linux/filter.h>
153ca8e402SCraig Gallek #include <linux/unistd.h>
163ca8e402SCraig Gallek #include <netinet/in.h>
174b2a6aedSCraig Gallek #include <netinet/tcp.h>
183ca8e402SCraig Gallek #include <stdio.h>
193ca8e402SCraig Gallek #include <stdlib.h>
203ca8e402SCraig Gallek #include <string.h>
213ca8e402SCraig Gallek #include <sys/epoll.h>
223ca8e402SCraig Gallek #include <sys/types.h>
233ca8e402SCraig Gallek #include <sys/socket.h>
24941ff6f1SDaniel Borkmann #include <sys/resource.h>
253ca8e402SCraig Gallek #include <unistd.h>
263ca8e402SCraig Gallek 
271329e40eSShuah Khan #include "../kselftest.h"
283ca8e402SCraig Gallek 
/*
 * Parameters describing one test run.  Fields that a given test does not
 * read may be left zero-initialized by the caller.
 */
struct test_params {
	/* Address family used to create and bind the receiving sockets. */
	int recv_family;
	/* Address family used to create and bind the sending sockets. */
	int send_family;
	/* Passed as the socket type to socket(): SOCK_DGRAM or SOCK_STREAM. */
	int protocol;
	/* Number of receiving sockets in the reuseport group. */
	size_t recv_socks;
	/* Port every receiving socket binds to. */
	uint16_t recv_port;
	/* First source port used by senders; later packets count up from it. */
	uint16_t send_port_min;
};
373ca8e402SCraig Gallek 
/*
 * Length passed to bind()/sendto() for every address in this file.  All
 * addresses are allocated as a full struct sockaddr_storage, so that size is
 * used regardless of the address family.
 */
static size_t sockaddr_size(void)
{
	const size_t storage_len = sizeof(struct sockaddr_storage);

	return storage_len;
}
423ca8e402SCraig Gallek 
/*
 * Allocate a zeroed sockaddr_storage holding the wildcard ("any") address of
 * the given family with the given port (host byte order in, network byte
 * order stored).
 *
 * Exits the program via error() if the allocation fails or if family is
 * neither AF_INET nor AF_INET6.  The caller owns the result and must free()
 * it.
 */
static struct sockaddr *new_any_sockaddr(int family, uint16_t port)
{
	struct sockaddr_storage *addr;
	struct sockaddr_in *addr4;
	struct sockaddr_in6 *addr6;

	/* calloc() zero-fills, so unused parts of the storage stay zero. */
	addr = calloc(1, sizeof(*addr));
	if (!addr)
		error(1, errno, "failed to allocate sockaddr");

	switch (family) {
	case AF_INET:
		addr4 = (struct sockaddr_in *)addr;
		addr4->sin_family = AF_INET;
		addr4->sin_addr.s_addr = htonl(INADDR_ANY);
		addr4->sin_port = htons(port);
		break;
	case AF_INET6:
		addr6 = (struct sockaddr_in6 *)addr;
		addr6->sin6_family = AF_INET6;
		addr6->sin6_addr = in6addr_any;
		addr6->sin6_port = htons(port);
		break;
	default:
		error(1, 0, "Unsupported family %d", family);
	}
	return (struct sockaddr *)addr;
}
703ca8e402SCraig Gallek 
/*
 * Same as new_any_sockaddr(), but the address is replaced with the loopback
 * address of the requested family.  The caller must free() the result.
 */
static struct sockaddr *new_loopback_sockaddr(int family, uint16_t port)
{
	struct sockaddr *sa = new_any_sockaddr(family, port);

	if (family == AF_INET) {
		struct sockaddr_in *in4 = (struct sockaddr_in *)sa;

		in4->sin_addr.s_addr = htonl(INADDR_LOOPBACK);
	} else if (family == AF_INET6) {
		struct sockaddr_in6 *in6 = (struct sockaddr_in6 *)sa;

		in6->sin6_addr = in6addr_loopback;
	} else {
		error(1, 0, "Unsupported family %d", family);
	}

	return sa;
}
913ca8e402SCraig Gallek 
attach_ebpf(int fd,uint16_t mod)923ca8e402SCraig Gallek static void attach_ebpf(int fd, uint16_t mod)
933ca8e402SCraig Gallek {
943ca8e402SCraig Gallek 	static char bpf_log_buf[65536];
953ca8e402SCraig Gallek 	static const char bpf_license[] = "GPL";
963ca8e402SCraig Gallek 
973ca8e402SCraig Gallek 	int bpf_fd;
983ca8e402SCraig Gallek 	const struct bpf_insn prog[] = {
993ca8e402SCraig Gallek 		/* BPF_MOV64_REG(BPF_REG_6, BPF_REG_1) */
1003ca8e402SCraig Gallek 		{ BPF_ALU64 | BPF_MOV | BPF_X, BPF_REG_6, BPF_REG_1, 0, 0 },
1013ca8e402SCraig Gallek 		/* BPF_LD_ABS(BPF_W, 0) R0 = (uint32_t)skb[0] */
1023ca8e402SCraig Gallek 		{ BPF_LD | BPF_ABS | BPF_W, 0, 0, 0, 0 },
1033ca8e402SCraig Gallek 		/* BPF_ALU64_IMM(BPF_MOD, BPF_REG_0, mod) */
1043ca8e402SCraig Gallek 		{ BPF_ALU64 | BPF_MOD | BPF_K, BPF_REG_0, 0, 0, mod },
1053ca8e402SCraig Gallek 		/* BPF_EXIT_INSN() */
1063ca8e402SCraig Gallek 		{ BPF_JMP | BPF_EXIT, 0, 0, 0, 0 }
1073ca8e402SCraig Gallek 	};
1083ca8e402SCraig Gallek 	union bpf_attr attr;
1093ca8e402SCraig Gallek 
1103ca8e402SCraig Gallek 	memset(&attr, 0, sizeof(attr));
1113ca8e402SCraig Gallek 	attr.prog_type = BPF_PROG_TYPE_SOCKET_FILTER;
1123ca8e402SCraig Gallek 	attr.insn_cnt = ARRAY_SIZE(prog);
113fc100a7fSHelge Deller 	attr.insns = (unsigned long) &prog;
114fc100a7fSHelge Deller 	attr.license = (unsigned long) &bpf_license;
115fc100a7fSHelge Deller 	attr.log_buf = (unsigned long) &bpf_log_buf;
1163ca8e402SCraig Gallek 	attr.log_size = sizeof(bpf_log_buf);
1173ca8e402SCraig Gallek 	attr.log_level = 1;
1183ca8e402SCraig Gallek 	attr.kern_version = 0;
1193ca8e402SCraig Gallek 
1203ca8e402SCraig Gallek 	bpf_fd = syscall(__NR_bpf, BPF_PROG_LOAD, &attr, sizeof(attr));
1213ca8e402SCraig Gallek 	if (bpf_fd < 0)
1223ca8e402SCraig Gallek 		error(1, errno, "ebpf error. log:\n%s\n", bpf_log_buf);
1233ca8e402SCraig Gallek 
1243ca8e402SCraig Gallek 	if (setsockopt(fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_EBPF, &bpf_fd,
1253ca8e402SCraig Gallek 			sizeof(bpf_fd)))
1263ca8e402SCraig Gallek 		error(1, errno, "failed to set SO_ATTACH_REUSEPORT_EBPF");
1271134158bSCraig Gallek 
1281134158bSCraig Gallek 	close(bpf_fd);
1293ca8e402SCraig Gallek }
1303ca8e402SCraig Gallek 
attach_cbpf(int fd,uint16_t mod)1313ca8e402SCraig Gallek static void attach_cbpf(int fd, uint16_t mod)
1323ca8e402SCraig Gallek {
1333ca8e402SCraig Gallek 	struct sock_filter code[] = {
1343ca8e402SCraig Gallek 		/* A = (uint32_t)skb[0] */
1353ca8e402SCraig Gallek 		{ BPF_LD  | BPF_W | BPF_ABS, 0, 0, 0 },
1363ca8e402SCraig Gallek 		/* A = A % mod */
1373ca8e402SCraig Gallek 		{ BPF_ALU | BPF_MOD, 0, 0, mod },
1383ca8e402SCraig Gallek 		/* return A */
1393ca8e402SCraig Gallek 		{ BPF_RET | BPF_A, 0, 0, 0 },
1403ca8e402SCraig Gallek 	};
1413ca8e402SCraig Gallek 	struct sock_fprog p = {
1423ca8e402SCraig Gallek 		.len = ARRAY_SIZE(code),
1433ca8e402SCraig Gallek 		.filter = code,
1443ca8e402SCraig Gallek 	};
1453ca8e402SCraig Gallek 
1463ca8e402SCraig Gallek 	if (setsockopt(fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_CBPF, &p, sizeof(p)))
1473ca8e402SCraig Gallek 		error(1, errno, "failed to set SO_ATTACH_REUSEPORT_CBPF");
1483ca8e402SCraig Gallek }
1493ca8e402SCraig Gallek 
build_recv_group(const struct test_params p,int fd[],uint16_t mod,void (* attach_bpf)(int,uint16_t))1503ca8e402SCraig Gallek static void build_recv_group(const struct test_params p, int fd[], uint16_t mod,
1513ca8e402SCraig Gallek 			     void (*attach_bpf)(int, uint16_t))
1523ca8e402SCraig Gallek {
1533ca8e402SCraig Gallek 	struct sockaddr * const addr =
1543ca8e402SCraig Gallek 		new_any_sockaddr(p.recv_family, p.recv_port);
1553ca8e402SCraig Gallek 	int i, opt;
1563ca8e402SCraig Gallek 
1573ca8e402SCraig Gallek 	for (i = 0; i < p.recv_socks; ++i) {
1583ca8e402SCraig Gallek 		fd[i] = socket(p.recv_family, p.protocol, 0);
1593ca8e402SCraig Gallek 		if (fd[i] < 0)
1603ca8e402SCraig Gallek 			error(1, errno, "failed to create recv %d", i);
1613ca8e402SCraig Gallek 
1623ca8e402SCraig Gallek 		opt = 1;
1633ca8e402SCraig Gallek 		if (setsockopt(fd[i], SOL_SOCKET, SO_REUSEPORT, &opt,
1643ca8e402SCraig Gallek 			       sizeof(opt)))
1653ca8e402SCraig Gallek 			error(1, errno, "failed to set SO_REUSEPORT on %d", i);
1663ca8e402SCraig Gallek 
1673ca8e402SCraig Gallek 		if (i == 0)
1683ca8e402SCraig Gallek 			attach_bpf(fd[i], mod);
1693ca8e402SCraig Gallek 
1703ca8e402SCraig Gallek 		if (bind(fd[i], addr, sockaddr_size()))
1713ca8e402SCraig Gallek 			error(1, errno, "failed to bind recv socket %d", i);
1723ca8e402SCraig Gallek 
1734b2a6aedSCraig Gallek 		if (p.protocol == SOCK_STREAM) {
1744b2a6aedSCraig Gallek 			opt = 4;
1754b2a6aedSCraig Gallek 			if (setsockopt(fd[i], SOL_TCP, TCP_FASTOPEN, &opt,
1764b2a6aedSCraig Gallek 				       sizeof(opt)))
1774b2a6aedSCraig Gallek 				error(1, errno,
1784b2a6aedSCraig Gallek 				      "failed to set TCP_FASTOPEN on %d", i);
1793ca8e402SCraig Gallek 			if (listen(fd[i], p.recv_socks * 10))
1803ca8e402SCraig Gallek 				error(1, errno, "failed to listen on socket");
1813ca8e402SCraig Gallek 		}
1824b2a6aedSCraig Gallek 	}
1833ca8e402SCraig Gallek 	free(addr);
1843ca8e402SCraig Gallek }
1853ca8e402SCraig Gallek 
/*
 * Send len bytes of buf from local port sport to the loopback address on
 * p.recv_port, using a fresh socket of family p.send_family and type
 * p.protocol.
 *
 * The socket is bound to the wildcard address with SO_REUSEADDR set, the
 * data is sent with a single sendto(..., MSG_FASTOPEN, ...) call, and the
 * socket is closed again.  Any failure exits via error().
 */
static void send_from(struct test_params p, uint16_t sport, char *buf,
		      size_t len)
{
	struct sockaddr * const src = new_any_sockaddr(p.send_family, sport);
	struct sockaddr * const dst =
		new_loopback_sockaddr(p.send_family, p.recv_port);
	const int reuse_on = 1;
	const int sk = socket(p.send_family, p.protocol, 0);
	ssize_t sent;

	if (sk < 0)
		error(1, errno, "failed to create send socket");

	if (setsockopt(sk, SOL_SOCKET, SO_REUSEADDR, &reuse_on,
		       sizeof(reuse_on)))
		error(1, errno, "failed to set reuseaddr");

	if (bind(sk, src, sockaddr_size()))
		error(1, errno, "failed to bind send socket");

	sent = sendto(sk, buf, len, MSG_FASTOPEN, dst, sockaddr_size());
	if (sent < 0)
		error(1, errno, "failed to send message");

	close(sk);
	free(src);
	free(dst);
}
2103ca8e402SCraig Gallek 
/*
 * Send p.recv_socks * 2 packets and check that each one is delivered to the
 * receiving socket selected by the attached BPF program.
 *
 * Packet number `data` carries htonl(data) as its payload and is sent from
 * source port p.send_port_min + data.  After each send, epoll is used to
 * find the socket that became readable (for SOCK_STREAM the connection is
 * accepted first), the 4-byte payload is read, and the index of that socket
 * in fd[] must equal sport % mod.
 *
 * Any failure or mismatch exits via error().  The epoll instance is closed
 * before returning, so repeated calls do not accumulate descriptors.
 */
static void test_recv_order(const struct test_params p, int fd[], int mod)
{
	char recv_buf[8], send_buf[8];
	struct msghdr msg;
	struct iovec recv_io = { recv_buf, 8 };
	struct epoll_event ev;
	int epfd, conn, i, sport, expected;
	uint32_t data, ndata;

	epfd = epoll_create(1);
	if (epfd < 0)
		error(1, errno, "failed to create epoll");
	for (i = 0; i < p.recv_socks; ++i) {
		ev.events = EPOLLIN;
		ev.data.fd = fd[i];
		if (epoll_ctl(epfd, EPOLL_CTL_ADD, fd[i], &ev))
			error(1, errno, "failed to register sock %d epoll", i);
	}

	memset(&msg, 0, sizeof(msg));
	msg.msg_iov = &recv_io;
	msg.msg_iovlen = 1;

	for (data = 0; data < p.recv_socks * 2; ++data) {
		sport = p.send_port_min + data;
		ndata = htonl(data);
		memcpy(send_buf, &ndata, sizeof(ndata));
		send_from(p, sport, send_buf, sizeof(ndata));

		/* Block until one of the receivers has something to read. */
		i = epoll_wait(epfd, &ev, 1, -1);
		if (i < 0)
			error(1, errno, "epoll wait failed");

		if (p.protocol == SOCK_STREAM) {
			conn = accept(ev.data.fd, NULL, NULL);
			if (conn < 0)
				error(1, errno, "error accepting");
			i = recvmsg(conn, &msg, 0);
			close(conn);
		} else {
			i = recvmsg(ev.data.fd, &msg, 0);
		}
		if (i < 0)
			error(1, errno, "recvmsg error");
		if (i != sizeof(ndata))
			error(1, 0, "expected size %zu got %d",
			      sizeof(ndata), i);

		/*
		 * Map the ready descriptor back to its index in fd[].  If it
		 * is not found, i ends up equal to p.recv_socks.
		 */
		for (i = 0; i < p.recv_socks; ++i)
			if (ev.data.fd == fd[i])
				break;
		memcpy(&ndata, recv_buf, sizeof(ndata));
		fprintf(stderr, "Socket %d: %u\n", i, ntohl(ndata));

		expected = (sport % mod);
		if (i != expected)
			error(1, 0, "expected socket %d", expected);
	}

	close(epfd);
}
2703ca8e402SCraig Gallek 
test_reuseport_ebpf(struct test_params p)2714b2a6aedSCraig Gallek static void test_reuseport_ebpf(struct test_params p)
2723ca8e402SCraig Gallek {
2733ca8e402SCraig Gallek 	int i, fd[p.recv_socks];
2743ca8e402SCraig Gallek 
2753ca8e402SCraig Gallek 	fprintf(stderr, "Testing EBPF mod %zd...\n", p.recv_socks);
2763ca8e402SCraig Gallek 	build_recv_group(p, fd, p.recv_socks, attach_ebpf);
2773ca8e402SCraig Gallek 	test_recv_order(p, fd, p.recv_socks);
2783ca8e402SCraig Gallek 
2794b2a6aedSCraig Gallek 	p.send_port_min += p.recv_socks * 2;
2803ca8e402SCraig Gallek 	fprintf(stderr, "Reprograming, testing mod %zd...\n", p.recv_socks / 2);
2813ca8e402SCraig Gallek 	attach_ebpf(fd[0], p.recv_socks / 2);
2823ca8e402SCraig Gallek 	test_recv_order(p, fd, p.recv_socks / 2);
2833ca8e402SCraig Gallek 
2843ca8e402SCraig Gallek 	for (i = 0; i < p.recv_socks; ++i)
2853ca8e402SCraig Gallek 		close(fd[i]);
2863ca8e402SCraig Gallek }
2873ca8e402SCraig Gallek 
test_reuseport_cbpf(struct test_params p)2884b2a6aedSCraig Gallek static void test_reuseport_cbpf(struct test_params p)
2893ca8e402SCraig Gallek {
2903ca8e402SCraig Gallek 	int i, fd[p.recv_socks];
2913ca8e402SCraig Gallek 
2923ca8e402SCraig Gallek 	fprintf(stderr, "Testing CBPF mod %zd...\n", p.recv_socks);
2933ca8e402SCraig Gallek 	build_recv_group(p, fd, p.recv_socks, attach_cbpf);
2943ca8e402SCraig Gallek 	test_recv_order(p, fd, p.recv_socks);
2953ca8e402SCraig Gallek 
2964b2a6aedSCraig Gallek 	p.send_port_min += p.recv_socks * 2;
2973ca8e402SCraig Gallek 	fprintf(stderr, "Reprograming, testing mod %zd...\n", p.recv_socks / 2);
2983ca8e402SCraig Gallek 	attach_cbpf(fd[0], p.recv_socks / 2);
2993ca8e402SCraig Gallek 	test_recv_order(p, fd, p.recv_socks / 2);
3003ca8e402SCraig Gallek 
3013ca8e402SCraig Gallek 	for (i = 0; i < p.recv_socks; ++i)
3023ca8e402SCraig Gallek 		close(fd[i]);
3033ca8e402SCraig Gallek }
3043ca8e402SCraig Gallek 
test_extra_filter(const struct test_params p)3053ca8e402SCraig Gallek static void test_extra_filter(const struct test_params p)
3063ca8e402SCraig Gallek {
3073ca8e402SCraig Gallek 	struct sockaddr * const addr =
3083ca8e402SCraig Gallek 		new_any_sockaddr(p.recv_family, p.recv_port);
3093ca8e402SCraig Gallek 	int fd1, fd2, opt;
3103ca8e402SCraig Gallek 
3113ca8e402SCraig Gallek 	fprintf(stderr, "Testing too many filters...\n");
3123ca8e402SCraig Gallek 	fd1 = socket(p.recv_family, p.protocol, 0);
3133ca8e402SCraig Gallek 	if (fd1 < 0)
3143ca8e402SCraig Gallek 		error(1, errno, "failed to create socket 1");
3153ca8e402SCraig Gallek 	fd2 = socket(p.recv_family, p.protocol, 0);
3163ca8e402SCraig Gallek 	if (fd2 < 0)
3173ca8e402SCraig Gallek 		error(1, errno, "failed to create socket 2");
3183ca8e402SCraig Gallek 
3193ca8e402SCraig Gallek 	opt = 1;
3203ca8e402SCraig Gallek 	if (setsockopt(fd1, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)))
3213ca8e402SCraig Gallek 		error(1, errno, "failed to set SO_REUSEPORT on socket 1");
3223ca8e402SCraig Gallek 	if (setsockopt(fd2, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)))
3233ca8e402SCraig Gallek 		error(1, errno, "failed to set SO_REUSEPORT on socket 2");
3243ca8e402SCraig Gallek 
3253ca8e402SCraig Gallek 	attach_ebpf(fd1, 10);
3263ca8e402SCraig Gallek 	attach_ebpf(fd2, 10);
3273ca8e402SCraig Gallek 
3283ca8e402SCraig Gallek 	if (bind(fd1, addr, sockaddr_size()))
3293ca8e402SCraig Gallek 		error(1, errno, "failed to bind recv socket 1");
3303ca8e402SCraig Gallek 
331*bc7a3198SWang Yufen 	if (!bind(fd2, addr, sockaddr_size()) || errno != EADDRINUSE)
3323ca8e402SCraig Gallek 		error(1, errno, "bind socket 2 should fail with EADDRINUSE");
3333ca8e402SCraig Gallek 
3343ca8e402SCraig Gallek 	free(addr);
3353ca8e402SCraig Gallek }
3363ca8e402SCraig Gallek 
test_filter_no_reuseport(const struct test_params p)3373ca8e402SCraig Gallek static void test_filter_no_reuseport(const struct test_params p)
3383ca8e402SCraig Gallek {
3393ca8e402SCraig Gallek 	struct sockaddr * const addr =
3403ca8e402SCraig Gallek 		new_any_sockaddr(p.recv_family, p.recv_port);
3413ca8e402SCraig Gallek 	const char bpf_license[] = "GPL";
3423ca8e402SCraig Gallek 	struct bpf_insn ecode[] = {
3433ca8e402SCraig Gallek 		{ BPF_ALU64 | BPF_MOV | BPF_K, BPF_REG_0, 0, 0, 10 },
3443ca8e402SCraig Gallek 		{ BPF_JMP | BPF_EXIT, 0, 0, 0, 0 }
3453ca8e402SCraig Gallek 	};
3463ca8e402SCraig Gallek 	struct sock_filter ccode[] = {{ BPF_RET | BPF_A, 0, 0, 0 }};
3473ca8e402SCraig Gallek 	union bpf_attr eprog;
3483ca8e402SCraig Gallek 	struct sock_fprog cprog;
3493ca8e402SCraig Gallek 	int fd, bpf_fd;
3503ca8e402SCraig Gallek 
3513ca8e402SCraig Gallek 	fprintf(stderr, "Testing filters on non-SO_REUSEPORT socket...\n");
3523ca8e402SCraig Gallek 
3533ca8e402SCraig Gallek 	memset(&eprog, 0, sizeof(eprog));
3543ca8e402SCraig Gallek 	eprog.prog_type = BPF_PROG_TYPE_SOCKET_FILTER;
3553ca8e402SCraig Gallek 	eprog.insn_cnt = ARRAY_SIZE(ecode);
356fc100a7fSHelge Deller 	eprog.insns = (unsigned long) &ecode;
357fc100a7fSHelge Deller 	eprog.license = (unsigned long) &bpf_license;
3583ca8e402SCraig Gallek 	eprog.kern_version = 0;
3593ca8e402SCraig Gallek 
3603ca8e402SCraig Gallek 	memset(&cprog, 0, sizeof(cprog));
3613ca8e402SCraig Gallek 	cprog.len = ARRAY_SIZE(ccode);
3623ca8e402SCraig Gallek 	cprog.filter = ccode;
3633ca8e402SCraig Gallek 
3643ca8e402SCraig Gallek 
3653ca8e402SCraig Gallek 	bpf_fd = syscall(__NR_bpf, BPF_PROG_LOAD, &eprog, sizeof(eprog));
3663ca8e402SCraig Gallek 	if (bpf_fd < 0)
3673ca8e402SCraig Gallek 		error(1, errno, "ebpf error");
3683ca8e402SCraig Gallek 	fd = socket(p.recv_family, p.protocol, 0);
3693ca8e402SCraig Gallek 	if (fd < 0)
3703ca8e402SCraig Gallek 		error(1, errno, "failed to create socket 1");
3713ca8e402SCraig Gallek 
3723ca8e402SCraig Gallek 	if (bind(fd, addr, sockaddr_size()))
3733ca8e402SCraig Gallek 		error(1, errno, "failed to bind recv socket 1");
3743ca8e402SCraig Gallek 
3753ca8e402SCraig Gallek 	errno = 0;
3763ca8e402SCraig Gallek 	if (!setsockopt(fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_EBPF, &bpf_fd,
3773ca8e402SCraig Gallek 			sizeof(bpf_fd)) || errno != EINVAL)
3783ca8e402SCraig Gallek 		error(1, errno, "setsockopt should have returned EINVAL");
3793ca8e402SCraig Gallek 
3803ca8e402SCraig Gallek 	errno = 0;
3813ca8e402SCraig Gallek 	if (!setsockopt(fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_CBPF, &cprog,
3823ca8e402SCraig Gallek 		       sizeof(cprog)) || errno != EINVAL)
3833ca8e402SCraig Gallek 		error(1, errno, "setsockopt should have returned EINVAL");
3843ca8e402SCraig Gallek 
3853ca8e402SCraig Gallek 	free(addr);
3863ca8e402SCraig Gallek }
3873ca8e402SCraig Gallek 
test_filter_without_bind(void)3883ca8e402SCraig Gallek static void test_filter_without_bind(void)
3893ca8e402SCraig Gallek {
3904b2a6aedSCraig Gallek 	int fd1, fd2, opt = 1;
3913ca8e402SCraig Gallek 
3923ca8e402SCraig Gallek 	fprintf(stderr, "Testing filter add without bind...\n");
3933ca8e402SCraig Gallek 	fd1 = socket(AF_INET, SOCK_DGRAM, 0);
3943ca8e402SCraig Gallek 	if (fd1 < 0)
3953ca8e402SCraig Gallek 		error(1, errno, "failed to create socket 1");
3963ca8e402SCraig Gallek 	fd2 = socket(AF_INET, SOCK_DGRAM, 0);
3973ca8e402SCraig Gallek 	if (fd2 < 0)
3983ca8e402SCraig Gallek 		error(1, errno, "failed to create socket 2");
3994b2a6aedSCraig Gallek 	if (setsockopt(fd1, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)))
4004b2a6aedSCraig Gallek 		error(1, errno, "failed to set SO_REUSEPORT on socket 1");
4014b2a6aedSCraig Gallek 	if (setsockopt(fd2, SOL_SOCKET, SO_REUSEPORT, &opt, sizeof(opt)))
4024b2a6aedSCraig Gallek 		error(1, errno, "failed to set SO_REUSEPORT on socket 2");
4033ca8e402SCraig Gallek 
4043ca8e402SCraig Gallek 	attach_ebpf(fd1, 10);
4053ca8e402SCraig Gallek 	attach_cbpf(fd2, 10);
4063ca8e402SCraig Gallek 
4073ca8e402SCraig Gallek 	close(fd1);
4083ca8e402SCraig Gallek 	close(fd2);
4093ca8e402SCraig Gallek }
4103ca8e402SCraig Gallek 
/*
 * Make sure both bits of rw_mask are set in the
 * /proc/sys/net/ipv4/tcp_fastopen sysctl.  The current value is read and,
 * only if a bit is missing, the value with both bits OR-ed in is written
 * back.  Any failure to open, read or write the sysctl exits via error().
 */
void enable_fastopen(void)
{
	int fd = open("/proc/sys/net/ipv4/tcp_fastopen", O_RDONLY);
	int rw_mask = 3;  /* bit 1: client side; bit-2 server side */
	int val, size;
	ssize_t len;
	char buf[16];

	if (fd < 0)
		error(1, errno, "Unable to open tcp_fastopen sysctl");
	/*
	 * Leave room for, and add, the terminating NUL: read() does not
	 * terminate the buffer and atoi() needs a proper C string.
	 */
	len = read(fd, buf, sizeof(buf) - 1);
	if (len <= 0)
		error(1, errno, "Unable to read tcp_fastopen sysctl");
	buf[len] = '\0';
	val = atoi(buf);
	close(fd);

	if ((val & rw_mask) != rw_mask) {
		fd = open("/proc/sys/net/ipv4/tcp_fastopen", O_RDWR);
		if (fd < 0)
			error(1, errno,
			      "Unable to open tcp_fastopen sysctl for writing");
		val |= rw_mask;
		size = snprintf(buf, sizeof(buf), "%d", val);
		if (write(fd, buf, size) <= 0)
			error(1, errno, "Unable to write tcp_fastopen sysctl");
		close(fd);
	}
}
4373ca8e402SCraig Gallek 
/* RLIMIT_MEMLOCK limits as they were at startup; restored by main_dtor(). */
static struct rlimit rlim_old;

/*
 * Runs before main(): record the current RLIMIT_MEMLOCK limits and, unless
 * the soft limit is already unlimited, try to raise both limits by 1 MiB.
 *
 * An unlimited hard limit is kept as-is.  Adding to RLIM_INFINITY would
 * wrap around to a small value, making the new soft limit exceed the new
 * hard limit, so that setrlimit() would reject the request.
 *
 * The setrlimit() result is deliberately ignored: raising the limit is
 * best-effort.
 */
static  __attribute__((constructor)) void main_ctor(void)
{
	struct rlimit rlim_new;

	/* Without valid current limits there is nothing sensible to raise. */
	if (getrlimit(RLIMIT_MEMLOCK, &rlim_old))
		return;

	if (rlim_old.rlim_cur == RLIM_INFINITY)
		return;

	rlim_new.rlim_cur = rlim_old.rlim_cur + (1UL << 20);
	if (rlim_old.rlim_max == RLIM_INFINITY)
		rlim_new.rlim_max = RLIM_INFINITY;
	else
		rlim_new.rlim_max = rlim_old.rlim_max + (1UL << 20);
	setrlimit(RLIMIT_MEMLOCK, &rlim_new);
}
452941ff6f1SDaniel Borkmann 
main_dtor(void)453941ff6f1SDaniel Borkmann static __attribute__((destructor)) void main_dtor(void)
454941ff6f1SDaniel Borkmann {
455941ff6f1SDaniel Borkmann 	setrlimit(RLIMIT_MEMLOCK, &rlim_old);
456941ff6f1SDaniel Borkmann }
457941ff6f1SDaniel Borkmann 
main(void)4583ca8e402SCraig Gallek int main(void)
4593ca8e402SCraig Gallek {
4603ca8e402SCraig Gallek 	fprintf(stderr, "---- IPv4 UDP ----\n");
4611134158bSCraig Gallek 	/* NOTE: UDP socket lookups traverse a different code path when there
4621134158bSCraig Gallek 	 * are > 10 sockets in a group.  Run the bpf test through both paths.
4631134158bSCraig Gallek 	 */
4643ca8e402SCraig Gallek 	test_reuseport_ebpf((struct test_params) {
4653ca8e402SCraig Gallek 		.recv_family = AF_INET,
4663ca8e402SCraig Gallek 		.send_family = AF_INET,
4673ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
4683ca8e402SCraig Gallek 		.recv_socks = 10,
4693ca8e402SCraig Gallek 		.recv_port = 8000,
4703ca8e402SCraig Gallek 		.send_port_min = 9000});
4711134158bSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
4721134158bSCraig Gallek 		.recv_family = AF_INET,
4731134158bSCraig Gallek 		.send_family = AF_INET,
4741134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
4751134158bSCraig Gallek 		.recv_socks = 20,
4761134158bSCraig Gallek 		.recv_port = 8000,
4771134158bSCraig Gallek 		.send_port_min = 9000});
4783ca8e402SCraig Gallek 	test_reuseport_cbpf((struct test_params) {
4793ca8e402SCraig Gallek 		.recv_family = AF_INET,
4803ca8e402SCraig Gallek 		.send_family = AF_INET,
4813ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
4823ca8e402SCraig Gallek 		.recv_socks = 10,
4833ca8e402SCraig Gallek 		.recv_port = 8001,
4843ca8e402SCraig Gallek 		.send_port_min = 9020});
4851134158bSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
4861134158bSCraig Gallek 		.recv_family = AF_INET,
4871134158bSCraig Gallek 		.send_family = AF_INET,
4881134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
4891134158bSCraig Gallek 		.recv_socks = 20,
4901134158bSCraig Gallek 		.recv_port = 8001,
4911134158bSCraig Gallek 		.send_port_min = 9020});
4923ca8e402SCraig Gallek 	test_extra_filter((struct test_params) {
4933ca8e402SCraig Gallek 		.recv_family = AF_INET,
4943ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
4953ca8e402SCraig Gallek 		.recv_port = 8002});
4963ca8e402SCraig Gallek 	test_filter_no_reuseport((struct test_params) {
4973ca8e402SCraig Gallek 		.recv_family = AF_INET,
4983ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
4993ca8e402SCraig Gallek 		.recv_port = 8008});
5003ca8e402SCraig Gallek 
5013ca8e402SCraig Gallek 	fprintf(stderr, "---- IPv6 UDP ----\n");
5023ca8e402SCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5033ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5043ca8e402SCraig Gallek 		.send_family = AF_INET6,
5053ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5063ca8e402SCraig Gallek 		.recv_socks = 10,
5073ca8e402SCraig Gallek 		.recv_port = 8003,
5083ca8e402SCraig Gallek 		.send_port_min = 9040});
5091134158bSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5101134158bSCraig Gallek 		.recv_family = AF_INET6,
5111134158bSCraig Gallek 		.send_family = AF_INET6,
5121134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
5131134158bSCraig Gallek 		.recv_socks = 20,
5141134158bSCraig Gallek 		.recv_port = 8003,
5151134158bSCraig Gallek 		.send_port_min = 9040});
5163ca8e402SCraig Gallek 	test_reuseport_cbpf((struct test_params) {
5173ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5183ca8e402SCraig Gallek 		.send_family = AF_INET6,
5193ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5203ca8e402SCraig Gallek 		.recv_socks = 10,
5213ca8e402SCraig Gallek 		.recv_port = 8004,
5223ca8e402SCraig Gallek 		.send_port_min = 9060});
5231134158bSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
5241134158bSCraig Gallek 		.recv_family = AF_INET6,
5251134158bSCraig Gallek 		.send_family = AF_INET6,
5261134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
5271134158bSCraig Gallek 		.recv_socks = 20,
5281134158bSCraig Gallek 		.recv_port = 8004,
5291134158bSCraig Gallek 		.send_port_min = 9060});
5303ca8e402SCraig Gallek 	test_extra_filter((struct test_params) {
5313ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5323ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5333ca8e402SCraig Gallek 		.recv_port = 8005});
5343ca8e402SCraig Gallek 	test_filter_no_reuseport((struct test_params) {
5353ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5363ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5373ca8e402SCraig Gallek 		.recv_port = 8009});
5383ca8e402SCraig Gallek 
5393ca8e402SCraig Gallek 	fprintf(stderr, "---- IPv6 UDP w/ mapped IPv4 ----\n");
5403ca8e402SCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5413ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5423ca8e402SCraig Gallek 		.send_family = AF_INET,
5433ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5441134158bSCraig Gallek 		.recv_socks = 20,
5451134158bSCraig Gallek 		.recv_port = 8006,
5461134158bSCraig Gallek 		.send_port_min = 9080});
5471134158bSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5481134158bSCraig Gallek 		.recv_family = AF_INET6,
5491134158bSCraig Gallek 		.send_family = AF_INET,
5501134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
5513ca8e402SCraig Gallek 		.recv_socks = 10,
5523ca8e402SCraig Gallek 		.recv_port = 8006,
5533ca8e402SCraig Gallek 		.send_port_min = 9080});
5543ca8e402SCraig Gallek 	test_reuseport_cbpf((struct test_params) {
5553ca8e402SCraig Gallek 		.recv_family = AF_INET6,
5563ca8e402SCraig Gallek 		.send_family = AF_INET,
5573ca8e402SCraig Gallek 		.protocol = SOCK_DGRAM,
5583ca8e402SCraig Gallek 		.recv_socks = 10,
5593ca8e402SCraig Gallek 		.recv_port = 8007,
5603ca8e402SCraig Gallek 		.send_port_min = 9100});
5611134158bSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
5621134158bSCraig Gallek 		.recv_family = AF_INET6,
5631134158bSCraig Gallek 		.send_family = AF_INET,
5641134158bSCraig Gallek 		.protocol = SOCK_DGRAM,
5651134158bSCraig Gallek 		.recv_socks = 20,
5661134158bSCraig Gallek 		.recv_port = 8007,
5671134158bSCraig Gallek 		.send_port_min = 9100});
5683ca8e402SCraig Gallek 
5694b2a6aedSCraig Gallek 	/* TCP fastopen is required for the TCP tests */
5704b2a6aedSCraig Gallek 	enable_fastopen();
5714b2a6aedSCraig Gallek 	fprintf(stderr, "---- IPv4 TCP ----\n");
5724b2a6aedSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5734b2a6aedSCraig Gallek 		.recv_family = AF_INET,
5744b2a6aedSCraig Gallek 		.send_family = AF_INET,
5754b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
5764b2a6aedSCraig Gallek 		.recv_socks = 10,
5774b2a6aedSCraig Gallek 		.recv_port = 8008,
5784b2a6aedSCraig Gallek 		.send_port_min = 9120});
5794b2a6aedSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
5804b2a6aedSCraig Gallek 		.recv_family = AF_INET,
5814b2a6aedSCraig Gallek 		.send_family = AF_INET,
5824b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
5834b2a6aedSCraig Gallek 		.recv_socks = 10,
5844b2a6aedSCraig Gallek 		.recv_port = 8009,
5854b2a6aedSCraig Gallek 		.send_port_min = 9160});
5864b2a6aedSCraig Gallek 	test_extra_filter((struct test_params) {
5874b2a6aedSCraig Gallek 		.recv_family = AF_INET,
5884b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
5894b2a6aedSCraig Gallek 		.recv_port = 8010});
5904b2a6aedSCraig Gallek 	test_filter_no_reuseport((struct test_params) {
5914b2a6aedSCraig Gallek 		.recv_family = AF_INET,
5924b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
5934b2a6aedSCraig Gallek 		.recv_port = 8011});
5944b2a6aedSCraig Gallek 
5954b2a6aedSCraig Gallek 	fprintf(stderr, "---- IPv6 TCP ----\n");
5964b2a6aedSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
5974b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
5984b2a6aedSCraig Gallek 		.send_family = AF_INET6,
5994b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6004b2a6aedSCraig Gallek 		.recv_socks = 10,
6014b2a6aedSCraig Gallek 		.recv_port = 8012,
6024b2a6aedSCraig Gallek 		.send_port_min = 9200});
6034b2a6aedSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
6044b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
6054b2a6aedSCraig Gallek 		.send_family = AF_INET6,
6064b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6074b2a6aedSCraig Gallek 		.recv_socks = 10,
6084b2a6aedSCraig Gallek 		.recv_port = 8013,
6094b2a6aedSCraig Gallek 		.send_port_min = 9240});
6104b2a6aedSCraig Gallek 	test_extra_filter((struct test_params) {
6114b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
6124b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6134b2a6aedSCraig Gallek 		.recv_port = 8014});
6144b2a6aedSCraig Gallek 	test_filter_no_reuseport((struct test_params) {
6154b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
6164b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6174b2a6aedSCraig Gallek 		.recv_port = 8015});
6184b2a6aedSCraig Gallek 
6194b2a6aedSCraig Gallek 	fprintf(stderr, "---- IPv6 TCP w/ mapped IPv4 ----\n");
6204b2a6aedSCraig Gallek 	test_reuseport_ebpf((struct test_params) {
6214b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
6224b2a6aedSCraig Gallek 		.send_family = AF_INET,
6234b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6244b2a6aedSCraig Gallek 		.recv_socks = 10,
6254b2a6aedSCraig Gallek 		.recv_port = 8016,
6264b2a6aedSCraig Gallek 		.send_port_min = 9320});
6274b2a6aedSCraig Gallek 	test_reuseport_cbpf((struct test_params) {
6284b2a6aedSCraig Gallek 		.recv_family = AF_INET6,
6294b2a6aedSCraig Gallek 		.send_family = AF_INET,
6304b2a6aedSCraig Gallek 		.protocol = SOCK_STREAM,
6314b2a6aedSCraig Gallek 		.recv_socks = 10,
6324b2a6aedSCraig Gallek 		.recv_port = 8017,
6334b2a6aedSCraig Gallek 		.send_port_min = 9360});
6343ca8e402SCraig Gallek 
6353ca8e402SCraig Gallek 	test_filter_without_bind();
6363ca8e402SCraig Gallek 
6373ca8e402SCraig Gallek 	fprintf(stderr, "SUCCESS\n");
6383ca8e402SCraig Gallek 	return 0;
6393ca8e402SCraig Gallek }
640