Linux Audio

Check our new training course

Loading...
Note: File does not exist in v5.4.
  1// SPDX-License-Identifier: GPL-2.0
  2/* Copyright (c) 2018 Facebook */
  3
  4#include <stdlib.h>
  5#include <unistd.h>
  6#include <stdbool.h>
  7#include <string.h>
  8#include <errno.h>
  9#include <assert.h>
 10#include <fcntl.h>
 11#include <linux/bpf.h>
 12#include <linux/err.h>
 13#include <linux/types.h>
 14#include <linux/if_ether.h>
 15#include <sys/types.h>
 16#include <sys/epoll.h>
 17#include <sys/socket.h>
 18#include <netinet/in.h>
 19#include <bpf/bpf.h>
 20#include <bpf/libbpf.h>
 21#include "bpf_rlimit.h"
 22#include "bpf_util.h"
 23
 24#include "test_progs.h"
 25#include "test_select_reuseport_common.h"
 26
 27#define MAX_TEST_NAME 80
 28#define MIN_TCPHDR_LEN 20
 29#define UDPHDR_LEN 8
 30
 31#define TCP_SYNCOOKIE_SYSCTL "/proc/sys/net/ipv4/tcp_syncookies"
 32#define TCP_FO_SYSCTL "/proc/sys/net/ipv4/tcp_fastopen"
 33#define REUSEPORT_ARRAY_SIZE 32
 34
 35static int result_map, tmp_index_ovr_map, linum_map, data_check_map;
 36static __u32 expected_results[NR_RESULTS];
 37static int sk_fds[REUSEPORT_ARRAY_SIZE];
 38static int reuseport_array = -1, outer_map = -1;
 39static enum bpf_map_type inner_map_type;
 40static int select_by_skb_data_prog;
 41static int saved_tcp_syncookie = -1;
 42static struct bpf_object *obj;
 43static int saved_tcp_fo = -1;
 44static __u32 index_zero;
 45static int epfd;
 46
 47static union sa46 {
 48	struct sockaddr_in6 v6;
 49	struct sockaddr_in v4;
 50	sa_family_t family;
 51} srv_sa;
 52
 53#define RET_IF(condition, tag, format...) ({				\
 54	if (CHECK_FAIL(condition)) {					\
 55		printf(tag " " format);					\
 56		return;							\
 57	}								\
 58})
 59
 60#define RET_ERR(condition, tag, format...) ({				\
 61	if (CHECK_FAIL(condition)) {					\
 62		printf(tag " " format);					\
 63		return -1;						\
 64	}								\
 65})
 66
 67static int create_maps(enum bpf_map_type inner_type)
 68{
 69	struct bpf_create_map_attr attr = {};
 70
 71	inner_map_type = inner_type;
 72
 73	/* Creating reuseport_array */
 74	attr.name = "reuseport_array";
 75	attr.map_type = inner_type;
 76	attr.key_size = sizeof(__u32);
 77	attr.value_size = sizeof(__u32);
 78	attr.max_entries = REUSEPORT_ARRAY_SIZE;
 79
 80	reuseport_array = bpf_create_map_xattr(&attr);
 81	RET_ERR(reuseport_array < 0, "creating reuseport_array",
 82		"reuseport_array:%d errno:%d\n", reuseport_array, errno);
 83
 84	/* Creating outer_map */
 85	attr.name = "outer_map";
 86	attr.map_type = BPF_MAP_TYPE_ARRAY_OF_MAPS;
 87	attr.key_size = sizeof(__u32);
 88	attr.value_size = sizeof(__u32);
 89	attr.max_entries = 1;
 90	attr.inner_map_fd = reuseport_array;
 91	outer_map = bpf_create_map_xattr(&attr);
 92	RET_ERR(outer_map < 0, "creating outer_map",
 93		"outer_map:%d errno:%d\n", outer_map, errno);
 94
 95	return 0;
 96}
 97
 98static int prepare_bpf_obj(void)
 99{
100	struct bpf_program *prog;
101	struct bpf_map *map;
102	int err;
103
104	obj = bpf_object__open("test_select_reuseport_kern.o");
105	err = libbpf_get_error(obj);
106	RET_ERR(err, "open test_select_reuseport_kern.o",
107		"obj:%p PTR_ERR(obj):%d\n", obj, err);
108
109	map = bpf_object__find_map_by_name(obj, "outer_map");
110	RET_ERR(!map, "find outer_map", "!map\n");
111	err = bpf_map__reuse_fd(map, outer_map);
112	RET_ERR(err, "reuse outer_map", "err:%d\n", err);
113
114	err = bpf_object__load(obj);
115	RET_ERR(err, "load bpf_object", "err:%d\n", err);
116
117	prog = bpf_program__next(NULL, obj);
118	RET_ERR(!prog, "get first bpf_program", "!prog\n");
119	select_by_skb_data_prog = bpf_program__fd(prog);
120	RET_ERR(select_by_skb_data_prog < 0, "get prog fd",
121		"select_by_skb_data_prog:%d\n", select_by_skb_data_prog);
122
123	map = bpf_object__find_map_by_name(obj, "result_map");
124	RET_ERR(!map, "find result_map", "!map\n");
125	result_map = bpf_map__fd(map);
126	RET_ERR(result_map < 0, "get result_map fd",
127		"result_map:%d\n", result_map);
128
129	map = bpf_object__find_map_by_name(obj, "tmp_index_ovr_map");
130	RET_ERR(!map, "find tmp_index_ovr_map\n", "!map");
131	tmp_index_ovr_map = bpf_map__fd(map);
132	RET_ERR(tmp_index_ovr_map < 0, "get tmp_index_ovr_map fd",
133		"tmp_index_ovr_map:%d\n", tmp_index_ovr_map);
134
135	map = bpf_object__find_map_by_name(obj, "linum_map");
136	RET_ERR(!map, "find linum_map", "!map\n");
137	linum_map = bpf_map__fd(map);
138	RET_ERR(linum_map < 0, "get linum_map fd",
139		"linum_map:%d\n", linum_map);
140
141	map = bpf_object__find_map_by_name(obj, "data_check_map");
142	RET_ERR(!map, "find data_check_map", "!map\n");
143	data_check_map = bpf_map__fd(map);
144	RET_ERR(data_check_map < 0, "get data_check_map fd",
145		"data_check_map:%d\n", data_check_map);
146
147	return 0;
148}
149
150static void sa46_init_loopback(union sa46 *sa, sa_family_t family)
151{
152	memset(sa, 0, sizeof(*sa));
153	sa->family = family;
154	if (sa->family == AF_INET6)
155		sa->v6.sin6_addr = in6addr_loopback;
156	else
157		sa->v4.sin_addr.s_addr = htonl(INADDR_LOOPBACK);
158}
159
160static void sa46_init_inany(union sa46 *sa, sa_family_t family)
161{
162	memset(sa, 0, sizeof(*sa));
163	sa->family = family;
164	if (sa->family == AF_INET6)
165		sa->v6.sin6_addr = in6addr_any;
166	else
167		sa->v4.sin_addr.s_addr = INADDR_ANY;
168}
169
170static int read_int_sysctl(const char *sysctl)
171{
172	char buf[16];
173	int fd, ret;
174
175	fd = open(sysctl, 0);
176	RET_ERR(fd == -1, "open(sysctl)",
177		"sysctl:%s fd:%d errno:%d\n", sysctl, fd, errno);
178
179	ret = read(fd, buf, sizeof(buf));
180	RET_ERR(ret <= 0, "read(sysctl)",
181		"sysctl:%s ret:%d errno:%d\n", sysctl, ret, errno);
182
183	close(fd);
184	return atoi(buf);
185}
186
187static int write_int_sysctl(const char *sysctl, int v)
188{
189	int fd, ret, size;
190	char buf[16];
191
192	fd = open(sysctl, O_RDWR);
193	RET_ERR(fd == -1, "open(sysctl)",
194		"sysctl:%s fd:%d errno:%d\n", sysctl, fd, errno);
195
196	size = snprintf(buf, sizeof(buf), "%d", v);
197	ret = write(fd, buf, size);
198	RET_ERR(ret != size, "write(sysctl)",
199		"sysctl:%s ret:%d size:%d errno:%d\n",
200		sysctl, ret, size, errno);
201
202	close(fd);
203	return 0;
204}
205
206static void restore_sysctls(void)
207{
208	if (saved_tcp_fo != -1)
209		write_int_sysctl(TCP_FO_SYSCTL, saved_tcp_fo);
210	if (saved_tcp_syncookie != -1)
211		write_int_sysctl(TCP_SYNCOOKIE_SYSCTL, saved_tcp_syncookie);
212}
213
214static int enable_fastopen(void)
215{
216	int fo;
217
218	fo = read_int_sysctl(TCP_FO_SYSCTL);
219	if (fo < 0)
220		return -1;
221
222	return write_int_sysctl(TCP_FO_SYSCTL, fo | 7);
223}
224
225static int enable_syncookie(void)
226{
227	return write_int_sysctl(TCP_SYNCOOKIE_SYSCTL, 2);
228}
229
230static int disable_syncookie(void)
231{
232	return write_int_sysctl(TCP_SYNCOOKIE_SYSCTL, 0);
233}
234
235static long get_linum(void)
236{
237	__u32 linum;
238	int err;
239
240	err = bpf_map_lookup_elem(linum_map, &index_zero, &linum);
241	RET_ERR(err < 0, "lookup_elem(linum_map)", "err:%d errno:%d\n",
242		err, errno);
243
244	return linum;
245}
246
247static void check_data(int type, sa_family_t family, const struct cmd *cmd,
248		       int cli_fd)
249{
250	struct data_check expected = {}, result;
251	union sa46 cli_sa;
252	socklen_t addrlen;
253	int err;
254
255	addrlen = sizeof(cli_sa);
256	err = getsockname(cli_fd, (struct sockaddr *)&cli_sa,
257			  &addrlen);
258	RET_IF(err < 0, "getsockname(cli_fd)", "err:%d errno:%d\n",
259	       err, errno);
260
261	err = bpf_map_lookup_elem(data_check_map, &index_zero, &result);
262	RET_IF(err < 0, "lookup_elem(data_check_map)", "err:%d errno:%d\n",
263	       err, errno);
264
265	if (type == SOCK_STREAM) {
266		expected.len = MIN_TCPHDR_LEN;
267		expected.ip_protocol = IPPROTO_TCP;
268	} else {
269		expected.len = UDPHDR_LEN;
270		expected.ip_protocol = IPPROTO_UDP;
271	}
272
273	if (family == AF_INET6) {
274		expected.eth_protocol = htons(ETH_P_IPV6);
275		expected.bind_inany = !srv_sa.v6.sin6_addr.s6_addr32[3] &&
276			!srv_sa.v6.sin6_addr.s6_addr32[2] &&
277			!srv_sa.v6.sin6_addr.s6_addr32[1] &&
278			!srv_sa.v6.sin6_addr.s6_addr32[0];
279
280		memcpy(&expected.skb_addrs[0], cli_sa.v6.sin6_addr.s6_addr32,
281		       sizeof(cli_sa.v6.sin6_addr));
282		memcpy(&expected.skb_addrs[4], &in6addr_loopback,
283		       sizeof(in6addr_loopback));
284		expected.skb_ports[0] = cli_sa.v6.sin6_port;
285		expected.skb_ports[1] = srv_sa.v6.sin6_port;
286	} else {
287		expected.eth_protocol = htons(ETH_P_IP);
288		expected.bind_inany = !srv_sa.v4.sin_addr.s_addr;
289
290		expected.skb_addrs[0] = cli_sa.v4.sin_addr.s_addr;
291		expected.skb_addrs[1] = htonl(INADDR_LOOPBACK);
292		expected.skb_ports[0] = cli_sa.v4.sin_port;
293		expected.skb_ports[1] = srv_sa.v4.sin_port;
294	}
295
296	if (memcmp(&result, &expected, offsetof(struct data_check,
297						equal_check_end))) {
298		printf("unexpected data_check\n");
299		printf("  result: (0x%x, %u, %u)\n",
300		       result.eth_protocol, result.ip_protocol,
301		       result.bind_inany);
302		printf("expected: (0x%x, %u, %u)\n",
303		       expected.eth_protocol, expected.ip_protocol,
304		       expected.bind_inany);
305		RET_IF(1, "data_check result != expected",
306		       "bpf_prog_linum:%ld\n", get_linum());
307	}
308
309	RET_IF(!result.hash, "data_check result.hash empty",
310	       "result.hash:%u", result.hash);
311
312	expected.len += cmd ? sizeof(*cmd) : 0;
313	if (type == SOCK_STREAM)
314		RET_IF(expected.len > result.len, "expected.len > result.len",
315		       "expected.len:%u result.len:%u bpf_prog_linum:%ld\n",
316		       expected.len, result.len, get_linum());
317	else
318		RET_IF(expected.len != result.len, "expected.len != result.len",
319		       "expected.len:%u result.len:%u bpf_prog_linum:%ld\n",
320		       expected.len, result.len, get_linum());
321}
322
323static const char *result_to_str(enum result res)
324{
325	switch (res) {
326	case DROP_ERR_INNER_MAP:
327		return "DROP_ERR_INNER_MAP";
328	case DROP_ERR_SKB_DATA:
329		return "DROP_ERR_SKB_DATA";
330	case DROP_ERR_SK_SELECT_REUSEPORT:
331		return "DROP_ERR_SK_SELECT_REUSEPORT";
332	case DROP_MISC:
333		return "DROP_MISC";
334	case PASS:
335		return "PASS";
336	case PASS_ERR_SK_SELECT_REUSEPORT:
337		return "PASS_ERR_SK_SELECT_REUSEPORT";
338	default:
339		return "UNKNOWN";
340	}
341}
342
343static void check_results(void)
344{
345	__u32 results[NR_RESULTS];
346	__u32 i, broken = 0;
347	int err;
348
349	for (i = 0; i < NR_RESULTS; i++) {
350		err = bpf_map_lookup_elem(result_map, &i, &results[i]);
351		RET_IF(err < 0, "lookup_elem(result_map)",
352		       "i:%u err:%d errno:%d\n", i, err, errno);
353	}
354
355	for (i = 0; i < NR_RESULTS; i++) {
356		if (results[i] != expected_results[i]) {
357			broken = i;
358			break;
359		}
360	}
361
362	if (i == NR_RESULTS)
363		return;
364
365	printf("unexpected result\n");
366	printf(" result: [");
367	printf("%u", results[0]);
368	for (i = 1; i < NR_RESULTS; i++)
369		printf(", %u", results[i]);
370	printf("]\n");
371
372	printf("expected: [");
373	printf("%u", expected_results[0]);
374	for (i = 1; i < NR_RESULTS; i++)
375		printf(", %u", expected_results[i]);
376	printf("]\n");
377
378	printf("mismatch on %s (bpf_prog_linum:%ld)\n", result_to_str(broken),
379	       get_linum());
380
381	CHECK_FAIL(true);
382}
383
384static int send_data(int type, sa_family_t family, void *data, size_t len,
385		     enum result expected)
386{
387	union sa46 cli_sa;
388	int fd, err;
389
390	fd = socket(family, type, 0);
391	RET_ERR(fd == -1, "socket()", "fd:%d errno:%d\n", fd, errno);
392
393	sa46_init_loopback(&cli_sa, family);
394	err = bind(fd, (struct sockaddr *)&cli_sa, sizeof(cli_sa));
395	RET_ERR(fd == -1, "bind(cli_sa)", "err:%d errno:%d\n", err, errno);
396
397	err = sendto(fd, data, len, MSG_FASTOPEN, (struct sockaddr *)&srv_sa,
398		     sizeof(srv_sa));
399	RET_ERR(err != len && expected >= PASS,
400		"sendto()", "family:%u err:%d errno:%d expected:%d\n",
401		family, err, errno, expected);
402
403	return fd;
404}
405
406static void do_test(int type, sa_family_t family, struct cmd *cmd,
407		    enum result expected)
408{
409	int nev, srv_fd, cli_fd;
410	struct epoll_event ev;
411	struct cmd rcv_cmd;
412	ssize_t nread;
413
414	cli_fd = send_data(type, family, cmd, cmd ? sizeof(*cmd) : 0,
415			   expected);
416	if (cli_fd < 0)
417		return;
418	nev = epoll_wait(epfd, &ev, 1, expected >= PASS ? 5 : 0);
419	RET_IF((nev <= 0 && expected >= PASS) ||
420	       (nev > 0 && expected < PASS),
421	       "nev <> expected",
422	       "nev:%d expected:%d type:%d family:%d data:(%d, %d)\n",
423	       nev, expected, type, family,
424	       cmd ? cmd->reuseport_index : -1,
425	       cmd ? cmd->pass_on_failure : -1);
426	check_results();
427	check_data(type, family, cmd, cli_fd);
428
429	if (expected < PASS)
430		return;
431
432	RET_IF(expected != PASS_ERR_SK_SELECT_REUSEPORT &&
433	       cmd->reuseport_index != ev.data.u32,
434	       "check cmd->reuseport_index",
435	       "cmd:(%u, %u) ev.data.u32:%u\n",
436	       cmd->pass_on_failure, cmd->reuseport_index, ev.data.u32);
437
438	srv_fd = sk_fds[ev.data.u32];
439	if (type == SOCK_STREAM) {
440		int new_fd = accept(srv_fd, NULL, 0);
441
442		RET_IF(new_fd == -1, "accept(srv_fd)",
443		       "ev.data.u32:%u new_fd:%d errno:%d\n",
444		       ev.data.u32, new_fd, errno);
445
446		nread = recv(new_fd, &rcv_cmd, sizeof(rcv_cmd), MSG_DONTWAIT);
447		RET_IF(nread != sizeof(rcv_cmd),
448		       "recv(new_fd)",
449		       "ev.data.u32:%u nread:%zd sizeof(rcv_cmd):%zu errno:%d\n",
450		       ev.data.u32, nread, sizeof(rcv_cmd), errno);
451
452		close(new_fd);
453	} else {
454		nread = recv(srv_fd, &rcv_cmd, sizeof(rcv_cmd), MSG_DONTWAIT);
455		RET_IF(nread != sizeof(rcv_cmd),
456		       "recv(sk_fds)",
457		       "ev.data.u32:%u nread:%zd sizeof(rcv_cmd):%zu errno:%d\n",
458		       ev.data.u32, nread, sizeof(rcv_cmd), errno);
459	}
460
461	close(cli_fd);
462}
463
464static void test_err_inner_map(int type, sa_family_t family)
465{
466	struct cmd cmd = {
467		.reuseport_index = 0,
468		.pass_on_failure = 0,
469	};
470
471	expected_results[DROP_ERR_INNER_MAP]++;
472	do_test(type, family, &cmd, DROP_ERR_INNER_MAP);
473}
474
475static void test_err_skb_data(int type, sa_family_t family)
476{
477	expected_results[DROP_ERR_SKB_DATA]++;
478	do_test(type, family, NULL, DROP_ERR_SKB_DATA);
479}
480
481static void test_err_sk_select_port(int type, sa_family_t family)
482{
483	struct cmd cmd = {
484		.reuseport_index = REUSEPORT_ARRAY_SIZE,
485		.pass_on_failure = 0,
486	};
487
488	expected_results[DROP_ERR_SK_SELECT_REUSEPORT]++;
489	do_test(type, family, &cmd, DROP_ERR_SK_SELECT_REUSEPORT);
490}
491
492static void test_pass(int type, sa_family_t family)
493{
494	struct cmd cmd;
495	int i;
496
497	cmd.pass_on_failure = 0;
498	for (i = 0; i < REUSEPORT_ARRAY_SIZE; i++) {
499		expected_results[PASS]++;
500		cmd.reuseport_index = i;
501		do_test(type, family, &cmd, PASS);
502	}
503}
504
505static void test_syncookie(int type, sa_family_t family)
506{
507	int err, tmp_index = 1;
508	struct cmd cmd = {
509		.reuseport_index = 0,
510		.pass_on_failure = 0,
511	};
512
513	/*
514	 * +1 for TCP-SYN and
515	 * +1 for the TCP-ACK (ack the syncookie)
516	 */
517	expected_results[PASS] += 2;
518	enable_syncookie();
519	/*
520	 * Simulate TCP-SYN and TCP-ACK are handled by two different sk:
521	 * TCP-SYN: select sk_fds[tmp_index = 1] tmp_index is from the
522	 *          tmp_index_ovr_map
523	 * TCP-ACK: select sk_fds[reuseport_index = 0] reuseport_index
524	 *          is from the cmd.reuseport_index
525	 */
526	err = bpf_map_update_elem(tmp_index_ovr_map, &index_zero,
527				  &tmp_index, BPF_ANY);
528	RET_IF(err < 0, "update_elem(tmp_index_ovr_map, 0, 1)",
529	       "err:%d errno:%d\n", err, errno);
530	do_test(type, family, &cmd, PASS);
531	err = bpf_map_lookup_elem(tmp_index_ovr_map, &index_zero,
532				  &tmp_index);
533	RET_IF(err < 0 || tmp_index >= 0,
534	       "lookup_elem(tmp_index_ovr_map)",
535	       "err:%d errno:%d tmp_index:%d\n",
536	       err, errno, tmp_index);
537	disable_syncookie();
538}
539
540static void test_pass_on_err(int type, sa_family_t family)
541{
542	struct cmd cmd = {
543		.reuseport_index = REUSEPORT_ARRAY_SIZE,
544		.pass_on_failure = 1,
545	};
546
547	expected_results[PASS_ERR_SK_SELECT_REUSEPORT] += 1;
548	do_test(type, family, &cmd, PASS_ERR_SK_SELECT_REUSEPORT);
549}
550
551static void test_detach_bpf(int type, sa_family_t family)
552{
553#ifdef SO_DETACH_REUSEPORT_BPF
554	__u32 nr_run_before = 0, nr_run_after = 0, tmp, i;
555	struct epoll_event ev;
556	int cli_fd, err, nev;
557	struct cmd cmd = {};
558	int optvalue = 0;
559
560	err = setsockopt(sk_fds[0], SOL_SOCKET, SO_DETACH_REUSEPORT_BPF,
561			 &optvalue, sizeof(optvalue));
562	RET_IF(err == -1, "setsockopt(SO_DETACH_REUSEPORT_BPF)",
563	       "err:%d errno:%d\n", err, errno);
564
565	err = setsockopt(sk_fds[1], SOL_SOCKET, SO_DETACH_REUSEPORT_BPF,
566			 &optvalue, sizeof(optvalue));
567	RET_IF(err == 0 || errno != ENOENT,
568	       "setsockopt(SO_DETACH_REUSEPORT_BPF)",
569	       "err:%d errno:%d\n", err, errno);
570
571	for (i = 0; i < NR_RESULTS; i++) {
572		err = bpf_map_lookup_elem(result_map, &i, &tmp);
573		RET_IF(err < 0, "lookup_elem(result_map)",
574		       "i:%u err:%d errno:%d\n", i, err, errno);
575		nr_run_before += tmp;
576	}
577
578	cli_fd = send_data(type, family, &cmd, sizeof(cmd), PASS);
579	if (cli_fd < 0)
580		return;
581	nev = epoll_wait(epfd, &ev, 1, 5);
582	RET_IF(nev <= 0, "nev <= 0",
583	       "nev:%d expected:1 type:%d family:%d data:(0, 0)\n",
584	       nev,  type, family);
585
586	for (i = 0; i < NR_RESULTS; i++) {
587		err = bpf_map_lookup_elem(result_map, &i, &tmp);
588		RET_IF(err < 0, "lookup_elem(result_map)",
589		       "i:%u err:%d errno:%d\n", i, err, errno);
590		nr_run_after += tmp;
591	}
592
593	RET_IF(nr_run_before != nr_run_after,
594	       "nr_run_before != nr_run_after",
595	       "nr_run_before:%u nr_run_after:%u\n",
596	       nr_run_before, nr_run_after);
597
598	close(cli_fd);
599#else
600	test__skip();
601#endif
602}
603
604static void prepare_sk_fds(int type, sa_family_t family, bool inany)
605{
606	const int first = REUSEPORT_ARRAY_SIZE - 1;
607	int i, err, optval = 1;
608	struct epoll_event ev;
609	socklen_t addrlen;
610
611	if (inany)
612		sa46_init_inany(&srv_sa, family);
613	else
614		sa46_init_loopback(&srv_sa, family);
615	addrlen = sizeof(srv_sa);
616
617	/*
618	 * The sk_fds[] is filled from the back such that the order
619	 * is exactly opposite to the (struct sock_reuseport *)reuse->socks[].
620	 */
621	for (i = first; i >= 0; i--) {
622		sk_fds[i] = socket(family, type, 0);
623		RET_IF(sk_fds[i] == -1, "socket()", "sk_fds[%d]:%d errno:%d\n",
624		       i, sk_fds[i], errno);
625		err = setsockopt(sk_fds[i], SOL_SOCKET, SO_REUSEPORT,
626				 &optval, sizeof(optval));
627		RET_IF(err == -1, "setsockopt(SO_REUSEPORT)",
628		       "sk_fds[%d] err:%d errno:%d\n",
629		       i, err, errno);
630
631		if (i == first) {
632			err = setsockopt(sk_fds[i], SOL_SOCKET,
633					 SO_ATTACH_REUSEPORT_EBPF,
634					 &select_by_skb_data_prog,
635					 sizeof(select_by_skb_data_prog));
636			RET_IF(err < 0, "setsockopt(SO_ATTACH_REUEPORT_EBPF)",
637			       "err:%d errno:%d\n", err, errno);
638		}
639
640		err = bind(sk_fds[i], (struct sockaddr *)&srv_sa, addrlen);
641		RET_IF(err < 0, "bind()", "sk_fds[%d] err:%d errno:%d\n",
642		       i, err, errno);
643
644		if (type == SOCK_STREAM) {
645			err = listen(sk_fds[i], 10);
646			RET_IF(err < 0, "listen()",
647			       "sk_fds[%d] err:%d errno:%d\n",
648			       i, err, errno);
649		}
650
651		err = bpf_map_update_elem(reuseport_array, &i, &sk_fds[i],
652					  BPF_NOEXIST);
653		RET_IF(err < 0, "update_elem(reuseport_array)",
654		       "sk_fds[%d] err:%d errno:%d\n", i, err, errno);
655
656		if (i == first) {
657			socklen_t addrlen = sizeof(srv_sa);
658
659			err = getsockname(sk_fds[i], (struct sockaddr *)&srv_sa,
660					  &addrlen);
661			RET_IF(err == -1, "getsockname()",
662			       "sk_fds[%d] err:%d errno:%d\n", i, err, errno);
663		}
664	}
665
666	epfd = epoll_create(1);
667	RET_IF(epfd == -1, "epoll_create(1)",
668	       "epfd:%d errno:%d\n", epfd, errno);
669
670	ev.events = EPOLLIN;
671	for (i = 0; i < REUSEPORT_ARRAY_SIZE; i++) {
672		ev.data.u32 = i;
673		err = epoll_ctl(epfd, EPOLL_CTL_ADD, sk_fds[i], &ev);
674		RET_IF(err, "epoll_ctl(EPOLL_CTL_ADD)", "sk_fds[%d]\n", i);
675	}
676}
677
678static void setup_per_test(int type, sa_family_t family, bool inany,
679			   bool no_inner_map)
680{
681	int ovr = -1, err;
682
683	prepare_sk_fds(type, family, inany);
684	err = bpf_map_update_elem(tmp_index_ovr_map, &index_zero, &ovr,
685				  BPF_ANY);
686	RET_IF(err < 0, "update_elem(tmp_index_ovr_map, 0, -1)",
687	       "err:%d errno:%d\n", err, errno);
688
689	/* Install reuseport_array to outer_map? */
690	if (no_inner_map)
691		return;
692
693	err = bpf_map_update_elem(outer_map, &index_zero, &reuseport_array,
694				  BPF_ANY);
695	RET_IF(err < 0, "update_elem(outer_map, 0, reuseport_array)",
696	       "err:%d errno:%d\n", err, errno);
697}
698
699static void cleanup_per_test(bool no_inner_map)
700{
701	int i, err, zero = 0;
702
703	memset(expected_results, 0, sizeof(expected_results));
704
705	for (i = 0; i < NR_RESULTS; i++) {
706		err = bpf_map_update_elem(result_map, &i, &zero, BPF_ANY);
707		RET_IF(err, "reset elem in result_map",
708		       "i:%u err:%d errno:%d\n", i, err, errno);
709	}
710
711	err = bpf_map_update_elem(linum_map, &zero, &zero, BPF_ANY);
712	RET_IF(err, "reset line number in linum_map", "err:%d errno:%d\n",
713	       err, errno);
714
715	for (i = 0; i < REUSEPORT_ARRAY_SIZE; i++)
716		close(sk_fds[i]);
717	close(epfd);
718
719	/* Delete reuseport_array from outer_map? */
720	if (no_inner_map)
721		return;
722
723	err = bpf_map_delete_elem(outer_map, &index_zero);
724	RET_IF(err < 0, "delete_elem(outer_map)",
725	       "err:%d errno:%d\n", err, errno);
726}
727
728static void cleanup(void)
729{
730	if (outer_map >= 0) {
731		close(outer_map);
732		outer_map = -1;
733	}
734
735	if (reuseport_array >= 0) {
736		close(reuseport_array);
737		reuseport_array = -1;
738	}
739
740	if (obj) {
741		bpf_object__close(obj);
742		obj = NULL;
743	}
744
745	memset(expected_results, 0, sizeof(expected_results));
746}
747
748static const char *maptype_str(enum bpf_map_type type)
749{
750	switch (type) {
751	case BPF_MAP_TYPE_REUSEPORT_SOCKARRAY:
752		return "reuseport_sockarray";
753	case BPF_MAP_TYPE_SOCKMAP:
754		return "sockmap";
755	case BPF_MAP_TYPE_SOCKHASH:
756		return "sockhash";
757	default:
758		return "unknown";
759	}
760}
761
762static const char *family_str(sa_family_t family)
763{
764	switch (family) {
765	case AF_INET:
766		return "IPv4";
767	case AF_INET6:
768		return "IPv6";
769	default:
770		return "unknown";
771	}
772}
773
774static const char *sotype_str(int sotype)
775{
776	switch (sotype) {
777	case SOCK_STREAM:
778		return "TCP";
779	case SOCK_DGRAM:
780		return "UDP";
781	default:
782		return "unknown";
783	}
784}
785
786#define TEST_INIT(fn_, ...) { .fn = fn_, .name = #fn_, __VA_ARGS__ }
787
788static void test_config(int sotype, sa_family_t family, bool inany)
789{
790	const struct test {
791		void (*fn)(int sotype, sa_family_t family);
792		const char *name;
793		bool no_inner_map;
794		int need_sotype;
795	} tests[] = {
796		TEST_INIT(test_err_inner_map,
797			  .no_inner_map = true),
798		TEST_INIT(test_err_skb_data),
799		TEST_INIT(test_err_sk_select_port),
800		TEST_INIT(test_pass),
801		TEST_INIT(test_syncookie,
802			  .need_sotype = SOCK_STREAM),
803		TEST_INIT(test_pass_on_err),
804		TEST_INIT(test_detach_bpf),
805	};
806	char s[MAX_TEST_NAME];
807	const struct test *t;
808
809	for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
810		if (t->need_sotype && t->need_sotype != sotype)
811			continue; /* test not compatible with socket type */
812
813		snprintf(s, sizeof(s), "%s %s/%s %s %s",
814			 maptype_str(inner_map_type),
815			 family_str(family), sotype_str(sotype),
816			 inany ? "INANY" : "LOOPBACK", t->name);
817
818		if (!test__start_subtest(s))
819			continue;
820
821		setup_per_test(sotype, family, inany, t->no_inner_map);
822		t->fn(sotype, family);
823		cleanup_per_test(t->no_inner_map);
824	}
825}
826
827#define BIND_INANY true
828
829static void test_all(void)
830{
831	const struct config {
832		int sotype;
833		sa_family_t family;
834		bool inany;
835	} configs[] = {
836		{ SOCK_STREAM, AF_INET },
837		{ SOCK_STREAM, AF_INET, BIND_INANY },
838		{ SOCK_STREAM, AF_INET6 },
839		{ SOCK_STREAM, AF_INET6, BIND_INANY },
840		{ SOCK_DGRAM, AF_INET },
841		{ SOCK_DGRAM, AF_INET6 },
842	};
843	const struct config *c;
844
845	for (c = configs; c < configs + ARRAY_SIZE(configs); c++)
846		test_config(c->sotype, c->family, c->inany);
847}
848
849void test_map_type(enum bpf_map_type mt)
850{
851	if (create_maps(mt))
852		goto out;
853	if (prepare_bpf_obj())
854		goto out;
855
856	test_all();
857out:
858	cleanup();
859}
860
861void test_select_reuseport(void)
862{
863	saved_tcp_fo = read_int_sysctl(TCP_FO_SYSCTL);
864	if (saved_tcp_fo < 0)
865		goto out;
866	saved_tcp_syncookie = read_int_sysctl(TCP_SYNCOOKIE_SYSCTL);
867	if (saved_tcp_syncookie < 0)
868		goto out;
869
870	if (enable_fastopen())
871		goto out;
872	if (disable_syncookie())
873		goto out;
874
875	test_map_type(BPF_MAP_TYPE_REUSEPORT_SOCKARRAY);
876	test_map_type(BPF_MAP_TYPE_SOCKMAP);
877	test_map_type(BPF_MAP_TYPE_SOCKHASH);
878out:
879	restore_sysctls();
880}