1 // SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
2 // Copyright (c) 2020 Cloudflare
4 * Test BPF attach point for INET socket lookup (BPF_SK_LOOKUP).
7 * - attaching/detaching/querying programs to BPF_SK_LOOKUP hook,
8 * - redirecting socket lookup to a socket selected by BPF program,
9 * - failing a socket lookup on BPF program's request,
10 * - error scenarios for selecting a socket from BPF program,
11 * - accessing BPF program context,
12 * - attaching and running multiple BPF programs.
14 * Tests run in a dedicated network namespace.
18 #include <arpa/inet.h>
25 #include <sys/types.h>
29 #include <bpf/libbpf.h>
32 #include "test_progs.h"
33 #include "bpf_rlimit.h"
35 #include "cgroup_helpers.h"
36 #include "network_helpers.h"
37 #include "testing_helpers.h"
38 #include "test_sk_lookup.skel.h"
40 /* External (address, port) pairs the client sends packets to. */
41 #define EXT_IP4 "127.0.0.1"
42 #define EXT_IP6 "fd00::1"
45 /* Internal (address, port) pairs the server listens/receives at. */
46 #define INT_IP4 "127.0.0.2"
47 #define INT_IP4_V6 "::ffff:127.0.0.2"
48 #define INT_IP6 "fd00::2"
51 #define IO_TIMEOUT_SEC 3
71 struct bpf_program *lookup_prog;
72 struct bpf_program *reuseport_prog;
73 struct bpf_map *sock_map;
75 struct inet_addr connect_to;
76 struct inet_addr listen_at;
77 enum server accept_on;
78 bool reuseport_has_conns; /* Add a connected socket to reuseport group */
81 static __u32 duration; /* for CHECK macro */
/* Return true when the textual address contains a ':' (treated as IPv6). */
83 static bool is_ipv6(const char *ip)
85 return !!strchr(ip, ':');
/*
 * Attach reuseport_prog to the socket sock_fd.
 *
 * The program's file descriptor is obtained with bpf_program__fd() and
 * installed on the socket through the SO_ATTACH_REUSEPORT_EBPF option.
 */
88 static int attach_reuseport(int sock_fd, struct bpf_program *reuseport_prog)
92 prog_fd = bpf_program__fd(reuseport_prog);
/* The option value is the BPF program FD itself. */
98 err = setsockopt(sock_fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_EBPF,
99 &prog_fd, sizeof(prog_fd));
/*
 * Return the size of the concrete socket address stored in *addr:
 * sizeof(struct sockaddr_in) for AF_INET, sizeof(struct sockaddr_in6) for
 * AF_INET6, and 0 for any other family.
 */
106 static socklen_t inetaddr_len(const struct sockaddr_storage *addr)
108 return (addr->ss_family == AF_INET ? sizeof(struct sockaddr_in) :
109 addr->ss_family == AF_INET6 ? sizeof(struct sockaddr_in6) : 0);
/*
 * Create a socket of type sotype for the address family implied by ip.
 *
 * The family is AF_INET6 when is_ipv6(ip) is true and AF_INET otherwise.
 * *addr is filled from (ip, port) by make_sockaddr() and the socket is
 * created with addr->ss_family. Both SO_SNDTIMEO and SO_RCVTIMEO are set to
 * IO_TIMEOUT_SEC seconds, which bounds blocking send/receive calls on the
 * returned socket.
 */
112 static int make_socket(int sotype, const char *ip, int port,
113 struct sockaddr_storage *addr)
115 struct timeval timeo = { .tv_sec = IO_TIMEOUT_SEC };
118 family = is_ipv6(ip) ? AF_INET6 : AF_INET;
119 err = make_sockaddr(family, ip, port, addr, NULL);
120 if (CHECK(err, "make_address", "failed\n"))
123 fd = socket(addr->ss_family, sotype, 0);
124 if (CHECK(fd < 0, "socket", "failed\n")) {
125 log_err("failed to make socket");
/* Same timeout value is applied to the send and the receive direction. */
129 err = setsockopt(fd, SOL_SOCKET, SO_SNDTIMEO, &timeo, sizeof(timeo));
130 if (CHECK(err, "setsockopt(SO_SNDTIMEO)", "failed\n")) {
131 log_err("failed to set SNDTIMEO");
136 err = setsockopt(fd, SOL_SOCKET, SO_RCVTIMEO, &timeo, sizeof(timeo));
137 if (CHECK(err, "setsockopt(SO_RCVTIMEO)", "failed\n")) {
138 log_err("failed to set RCVTIMEO");
/*
 * Create a server socket of type sotype bound to (ip, port).
 *
 * Socket options applied before bind():
 *  - SOCK_DGRAM:               IP_RECVORIGDSTADDR
 *  - SOCK_DGRAM over AF_INET6: additionally IPV6_RECVORIGDSTADDR
 *  - SOCK_STREAM:              SO_REUSEADDR
 *  - reuseport_prog != NULL:   SO_REUSEPORT
 *
 * Stream sockets are put into the listening state with a SOMAXCONN backlog.
 * When reuseport_prog is given it is attached last, after bind()/listen().
 * Callers in this file treat a negative return value as failure.
 */
146 static int make_server(int sotype, const char *ip, int port,
147 struct bpf_program *reuseport_prog)
149 struct sockaddr_storage addr = {0};
153 fd = make_socket(sotype, ip, port, &addr);
157 /* Enabled for UDPv6 sockets for IPv4-mapped IPv6 to work. */
158 if (sotype == SOCK_DGRAM) {
159 err = setsockopt(fd, SOL_IP, IP_RECVORIGDSTADDR, &one,
161 if (CHECK(err, "setsockopt(IP_RECVORIGDSTADDR)", "failed\n")) {
162 log_err("failed to enable IP_RECVORIGDSTADDR");
/* The IPv6 variant of the option is needed only for AF_INET6 UDP sockets. */
167 if (sotype == SOCK_DGRAM && addr.ss_family == AF_INET6) {
168 err = setsockopt(fd, SOL_IPV6, IPV6_RECVORIGDSTADDR, &one,
170 if (CHECK(err, "setsockopt(IPV6_RECVORIGDSTADDR)", "failed\n")) {
171 log_err("failed to enable IPV6_RECVORIGDSTADDR");
176 if (sotype == SOCK_STREAM) {
177 err = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &one,
179 if (CHECK(err, "setsockopt(SO_REUSEADDR)", "failed\n")) {
180 log_err("failed to enable SO_REUSEADDR");
/* SO_REUSEPORT is enabled only when a reuseport program will be attached. */
185 if (reuseport_prog) {
186 err = setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, &one,
188 if (CHECK(err, "setsockopt(SO_REUSEPORT)", "failed\n")) {
189 log_err("failed to enable SO_REUSEPORT");
194 err = bind(fd, (void *)&addr, inetaddr_len(&addr));
195 if (CHECK(err, "bind", "failed\n")) {
196 log_err("failed to bind listen socket");
200 if (sotype == SOCK_STREAM) {
201 err = listen(fd, SOMAXCONN);
202 if (CHECK(err, "make_server", "listen")) {
203 log_err("failed to listen on port %d", port);
208 /* Late attach reuseport prog so we can have one init path */
209 if (reuseport_prog) {
210 err = attach_reuseport(fd, reuseport_prog);
211 if (CHECK(err, "attach_reuseport", "failed\n")) {
212 log_err("failed to attach reuseport prog");
/*
 * Create a socket of type sotype with make_socket() and connect() it to
 * (ip, port). Callers in this file treat a negative return value as failure.
 */
223 static int make_client(int sotype, const char *ip, int port)
225 struct sockaddr_storage addr = {0};
228 fd = make_socket(sotype, ip, port, &addr);
232 err = connect(fd, (void *)&addr, inetaddr_len(&addr));
233 if (CHECK(err, "make_client", "connect")) {
234 log_err("failed to connect client socket");
/* Send the single byte "a" on fd; a send() result <= 0 is reported as failure. */
244 static int send_byte(int fd)
249 n = send(fd, "a", 1, 0);
250 if (CHECK(n <= 0, "send_byte", "send")) {
251 log_err("failed/partial send");
/* Receive into a local buffer from fd; a recv() result <= 0 is reported as failure. */
257 static int recv_byte(int fd)
262 n = recv(fd, buf, sizeof(buf), 0);
263 if (CHECK(n <= 0, "recv_byte", "recv")) {
264 log_err("failed/partial recv");
/*
 * Server side of the TCP echo: accept one connection on server_fd, receive
 * data from it and send the same n bytes back on the accepted socket.
 */
270 static int tcp_recv_send(int server_fd)
276 fd = accept(server_fd, NULL, NULL);
277 if (CHECK(fd < 0, "accept", "failed\n")) {
278 log_err("failed to accept");
282 n = recv(fd, buf, sizeof(buf), 0);
283 if (CHECK(n <= 0, "recv", "failed\n")) {
284 log_err("failed/partial recv");
/* Echo back exactly as many bytes as were received. */
289 n = send(fd, buf, n, 0);
290 if (CHECK(n <= 0, "send", "failed\n")) {
291 log_err("failed/partial send");
/*
 * Rewrite, in place, the IPv4 socket address stored in *ss as an IPv4-mapped
 * IPv6 address: family becomes AF_INET6, the port is carried over, address
 * bytes 10 and 11 are set to 0xff and bytes 12..15 receive the IPv4 address.
 *
 * NOTE(review): address bytes 0..9 are not written by the visible code;
 * presumably the caller's storage is already zero there - confirm.
 */
302 static void v4_to_v6(struct sockaddr_storage *ss)
304 struct sockaddr_in6 *v6 = (struct sockaddr_in6 *)ss;
/* Copy the IPv4 view first: v6 aliases the same storage and overwrites it. */
305 struct sockaddr_in v4 = *(struct sockaddr_in *)ss;
307 v6->sin6_family = AF_INET6;
308 v6->sin6_port = v4.sin_port;
309 v6->sin6_addr.s6_addr[10] = 0xff;
310 v6->sin6_addr.s6_addr[11] = 0xff;
311 memcpy(&v6->sin6_addr.s6_addr[12], &v4.sin_addr.s_addr, 4);
/*
 * Server side of the UDP echo.
 *
 * Receives one datagram on server_fd with recvmsg(), capturing the sender
 * address (msg_name) and ancillary data (msg_control). The original
 * destination address is taken from an IP_ORIGDSTADDR or IPV6_ORIGDSTADDR
 * control message. A new UDP socket is then bound to that destination address
 * and the received message is sent back from it with sendmsg(), so the reply
 * originates from the address the client actually sent to.
 */
314 static int udp_recv_send(int server_fd)
/* Control buffer sized for one sockaddr_storage payload. */
316 char cmsg_buf[CMSG_SPACE(sizeof(struct sockaddr_storage))];
317 struct sockaddr_storage _src_addr = { 0 };
318 struct sockaddr_storage *src_addr = &_src_addr;
319 struct sockaddr_storage *dst_addr = NULL;
320 struct msghdr msg = { 0 };
321 struct iovec iov = { 0 };
328 iov.iov_len = sizeof(buf);
330 msg.msg_name = src_addr;
331 msg.msg_namelen = sizeof(*src_addr);
334 msg.msg_control = cmsg_buf;
335 msg.msg_controllen = sizeof(cmsg_buf);
338 n = recvmsg(server_fd, &msg, 0);
339 if (CHECK(n <= 0, "recvmsg", "failed\n")) {
340 log_err("failed to receive");
/* A truncated control buffer could hide the ORIGDSTADDR message. */
343 if (CHECK(msg.msg_flags & MSG_CTRUNC, "recvmsg", "truncated cmsg\n"))
/* Look for the original-destination control message, IPv4 or IPv6 flavor. */
346 for (cm = CMSG_FIRSTHDR(&msg); cm; cm = CMSG_NXTHDR(&msg, cm)) {
347 if ((cm->cmsg_level == SOL_IP &&
348 cm->cmsg_type == IP_ORIGDSTADDR) ||
349 (cm->cmsg_level == SOL_IPV6 &&
350 cm->cmsg_type == IPV6_ORIGDSTADDR)) {
351 dst_addr = (struct sockaddr_storage *)CMSG_DATA(cm);
354 log_err("warning: ignored cmsg at level %d type %d",
355 cm->cmsg_level, cm->cmsg_type);
357 if (CHECK(!dst_addr, "recvmsg", "missing ORIGDSTADDR\n"))
360 /* Server socket bound to IPv4-mapped IPv6 address */
361 if (src_addr->ss_family == AF_INET6 &&
362 dst_addr->ss_family == AF_INET) {
366 /* Reply from original destination address. */
367 fd = socket(dst_addr->ss_family, SOCK_DGRAM, 0);
368 if (CHECK(fd < 0, "socket", "failed\n")) {
369 log_err("failed to create tx socket");
373 ret = bind(fd, (struct sockaddr *)dst_addr, sizeof(*dst_addr));
374 if (CHECK(ret, "bind", "failed\n")) {
375 log_err("failed to bind tx socket");
/* Reuse the received msghdr for the reply, without ancillary data. */
379 msg.msg_control = NULL;
380 msg.msg_controllen = 0;
381 n = sendmsg(fd, &msg, 0);
382 if (CHECK(n <= 0, "sendmsg", "failed\n")) {
383 log_err("failed to send echo reply");
/*
 * TCP round trip: the client sends one byte, the server accepts and echoes
 * it (tcp_recv_send), and the client reads the reply.
 */
394 static int tcp_echo_test(int client_fd, int server_fd)
398 err = send_byte(client_fd);
401 err = tcp_recv_send(server_fd);
404 err = recv_byte(client_fd);
/*
 * UDP round trip: the client sends one byte, the server echoes it from the
 * original destination address (udp_recv_send), and the client reads the
 * reply.
 */
411 static int udp_echo_test(int client_fd, int server_fd)
415 err = send_byte(client_fd);
418 err = udp_recv_send(server_fd);
421 err = recv_byte(client_fd);
/*
 * Attach prog to the current network namespace.
 *
 * The namespace is referenced through a file descriptor opened on
 * /proc/self/ns/net and handed to bpf_program__attach_netns(). An error
 * pointer from the attach call is converted into errno before logging.
 * Callers in this file keep the returned link and release it with
 * bpf_link__destroy().
 */
428 static struct bpf_link *attach_lookup_prog(struct bpf_program *prog)
430 struct bpf_link *link;
433 net_fd = open("/proc/self/ns/net", O_RDONLY);
434 if (CHECK(net_fd < 0, "open", "failed\n")) {
435 log_err("failed to open /proc/self/ns/net");
439 link = bpf_program__attach_netns(prog, net_fd);
440 if (CHECK(IS_ERR(link), "bpf_program__attach_netns", "failed\n")) {
/* log_err() reports errno, so recover it from the error pointer. */
441 errno = -PTR_ERR(link);
442 log_err("failed to attach program '%s' to netns",
443 bpf_program__name(prog));
/*
 * Store socket sock_fd in map at position index.
 *
 * The socket FD is widened to a 64-bit value and inserted with BPF_NOEXIST,
 * so the update fails if the slot is already populated.
 */
451 static int update_lookup_map(struct bpf_map *map, int index, int sock_fd)
456 map_fd = bpf_map__fd(map);
457 if (CHECK(map_fd < 0, "bpf_map__fd", "failed\n")) {
459 log_err("failed to get map FD");
463 value = (uint64_t)sock_fd;
464 err = bpf_map_update_elem(map_fd, &index, &value, BPF_NOEXIST);
465 if (CHECK(err, "bpf_map_update_elem", "failed\n")) {
466 log_err("failed to update redir_map @ %d", index);
/*
 * Verify querying of programs attached to the BPF_SK_LOOKUP hook.
 *
 * Three links are created (lookup_pass twice, then lookup_drop) and
 * bpf_prog_query() on the netns FD must report attach_flags == 0, a count of
 * three, and program IDs matching the IDs reported by each link, in attach
 * order. While attached, each link's info must carry a non-zero netns_ino.
 * After link[0] is detached its program ID must be unchanged but netns_ino
 * must read back as zero. Links are destroyed in reverse order of creation.
 */
473 static void query_lookup_prog(struct test_sk_lookup *skel)
475 struct bpf_link *link[3] = {};
476 struct bpf_link_info info;
477 __u32 attach_flags = 0;
478 __u32 prog_ids[3] = {};
484 net_fd = open("/proc/self/ns/net", O_RDONLY);
485 if (CHECK(net_fd < 0, "open", "failed\n")) {
486 log_err("failed to open /proc/self/ns/net");
/* The same program (lookup_pass) is deliberately attached twice. */
490 link[0] = attach_lookup_prog(skel->progs.lookup_pass);
493 link[1] = attach_lookup_prog(skel->progs.lookup_pass);
496 link[2] = attach_lookup_prog(skel->progs.lookup_drop);
500 err = bpf_prog_query(net_fd, BPF_SK_LOOKUP, 0 /* query flags */,
501 &attach_flags, prog_ids, &prog_cnt);
502 if (CHECK(err, "bpf_prog_query", "failed\n")) {
503 log_err("failed to query lookup prog");
508 if (CHECK(attach_flags != 0, "bpf_prog_query",
509 "wrong attach_flags on query: %u", attach_flags))
511 if (CHECK(prog_cnt != 3, "bpf_prog_query",
512 "wrong program count on query: %u", prog_cnt))
/* Queried IDs must match the per-link IDs, slot by slot. */
514 prog_id = link_info_prog_id(link[0], &info);
515 CHECK(prog_ids[0] != prog_id, "bpf_prog_query",
516 "invalid program #0 id on query: %u != %u\n",
517 prog_ids[0], prog_id);
518 CHECK(info.netns.netns_ino == 0, "netns_ino",
519 "unexpected netns_ino: %u\n", info.netns.netns_ino);
520 prog_id = link_info_prog_id(link[1], &info);
521 CHECK(prog_ids[1] != prog_id, "bpf_prog_query",
522 "invalid program #1 id on query: %u != %u\n",
523 prog_ids[1], prog_id);
524 CHECK(info.netns.netns_ino == 0, "netns_ino",
525 "unexpected netns_ino: %u\n", info.netns.netns_ino);
526 prog_id = link_info_prog_id(link[2], &info);
527 CHECK(prog_ids[2] != prog_id, "bpf_prog_query",
528 "invalid program #2 id on query: %u != %u\n",
529 prog_ids[2], prog_id);
530 CHECK(info.netns.netns_ino == 0, "netns_ino",
531 "unexpected netns_ino: %u\n", info.netns.netns_ino);
533 err = bpf_link__detach(link[0]);
534 if (CHECK(err, "link_detach", "failed %d\n", err))
537 /* prog id is still there, but netns_ino is zeroed out */
538 prog_id = link_info_prog_id(link[0], &info);
539 CHECK(prog_ids[0] != prog_id, "bpf_prog_query",
540 "invalid program #0 id on query: %u != %u\n",
541 prog_ids[0], prog_id);
542 CHECK(info.netns.netns_ino != 0, "netns_ino",
543 "unexpected netns_ino: %u\n", info.netns.netns_ino);
/* Tear down in reverse order of attachment. */
547 bpf_link__destroy(link[2]);
549 bpf_link__destroy(link[1]);
551 bpf_link__destroy(link[0]);
/*
 * Run one redirect scenario described by *t.
 *
 * Attaches t->lookup_prog to the netns, creates server sockets at
 * t->listen_at and registers each in t->sock_map under its index, optionally
 * adds a self-connected socket to the reuseport group
 * (t->reuseport_has_conns), then connects a client to t->connect_to and runs
 * a TCP or UDP echo against the server selected by t->accept_on. All sockets
 * and the link are released at the end.
 *
 * NOTE(review): "{ -1 }" initializes only server_fds[0] to -1; remaining
 * elements are zero-initialized. The cleanup loop closes every entry that is
 * not -1, so any slot never assigned by the setup loop makes it close fd 0.
 * Consider initializing every element to -1.
 */
556 static void run_lookup_prog(const struct test *t)
558 int server_fds[MAX_SERVERS] = { -1 };
559 int client_fd, reuse_conn_fd = -1;
560 struct bpf_link *lookup_link;
563 lookup_link = attach_lookup_prog(t->lookup_prog);
567 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
568 server_fds[i] = make_server(t->sotype, t->listen_at.ip,
571 if (server_fds[i] < 0)
/* Map slot i holds server i, so BPF programs can pick a server by index. */
574 err = update_lookup_map(t->sock_map, i, server_fds[i]);
578 /* want just one server for non-reuseport test */
579 if (!t->reuseport_prog)
583 /* Regular UDP socket lookup with reuseport behaves
584 * differently when reuseport group contains connected
585 * sockets. Check that adding a connected UDP socket to the
586 * reuseport group does not affect how reuseport works with
589 if (t->reuseport_has_conns) {
590 struct sockaddr_storage addr = {};
591 socklen_t len = sizeof(addr);
593 /* Add an extra socket to reuseport group */
594 reuse_conn_fd = make_server(t->sotype, t->listen_at.ip,
597 if (reuse_conn_fd < 0)
600 /* Connect the extra socket to itself */
601 err = getsockname(reuse_conn_fd, (void *)&addr, &len);
602 if (CHECK(err, "getsockname", "errno %d\n", errno))
604 err = connect(reuse_conn_fd, (void *)&addr, len);
605 if (CHECK(err, "connect", "errno %d\n", errno))
609 client_fd = make_client(t->sotype, t->connect_to.ip, t->connect_to.port);
/* The echo must be served by the socket the test expects to be selected. */
613 if (t->sotype == SOCK_STREAM)
614 tcp_echo_test(client_fd, server_fds[t->accept_on]);
616 udp_echo_test(client_fd, server_fds[t->accept_on]);
620 if (reuse_conn_fd != -1)
621 close(reuse_conn_fd);
622 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
623 if (server_fds[i] != -1)
624 close(server_fds[i]);
626 bpf_link__destroy(lookup_link);
/*
 * Table-driven redirect tests.
 *
 * Each entry names a subtest and gives the lookup program, the optional
 * reuseport program, the socket map, the socket type, the address the client
 * connects to and the address the server listens at. Entries with a reuseport
 * program also state which server (SERVER_A or SERVER_B) must end up
 * receiving the traffic. The table covers TCP and UDP over IPv4, IPv6 and
 * IPv4 traffic delivered to an IPv4-mapped IPv6 listener.
 */
629 static void test_redirect_lookup(struct test_sk_lookup *skel)
631 const struct test tests[] = {
/* --- TCP --- */
633 .desc = "TCP IPv4 redir port",
634 .lookup_prog = skel->progs.redir_port,
635 .sock_map = skel->maps.redir_map,
636 .sotype = SOCK_STREAM,
637 .connect_to = { EXT_IP4, EXT_PORT },
638 .listen_at = { EXT_IP4, INT_PORT },
641 .desc = "TCP IPv4 redir addr",
642 .lookup_prog = skel->progs.redir_ip4,
643 .sock_map = skel->maps.redir_map,
644 .sotype = SOCK_STREAM,
645 .connect_to = { EXT_IP4, EXT_PORT },
646 .listen_at = { INT_IP4, EXT_PORT },
649 .desc = "TCP IPv4 redir with reuseport",
650 .lookup_prog = skel->progs.select_sock_a,
651 .reuseport_prog = skel->progs.select_sock_b,
652 .sock_map = skel->maps.redir_map,
653 .sotype = SOCK_STREAM,
654 .connect_to = { EXT_IP4, EXT_PORT },
655 .listen_at = { INT_IP4, INT_PORT },
656 .accept_on = SERVER_B,
659 .desc = "TCP IPv4 redir skip reuseport",
660 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
661 .reuseport_prog = skel->progs.select_sock_b,
662 .sock_map = skel->maps.redir_map,
663 .sotype = SOCK_STREAM,
664 .connect_to = { EXT_IP4, EXT_PORT },
665 .listen_at = { INT_IP4, INT_PORT },
666 .accept_on = SERVER_A,
669 .desc = "TCP IPv6 redir port",
670 .lookup_prog = skel->progs.redir_port,
671 .sock_map = skel->maps.redir_map,
672 .sotype = SOCK_STREAM,
673 .connect_to = { EXT_IP6, EXT_PORT },
674 .listen_at = { EXT_IP6, INT_PORT },
677 .desc = "TCP IPv6 redir addr",
678 .lookup_prog = skel->progs.redir_ip6,
679 .sock_map = skel->maps.redir_map,
680 .sotype = SOCK_STREAM,
681 .connect_to = { EXT_IP6, EXT_PORT },
682 .listen_at = { INT_IP6, EXT_PORT },
685 .desc = "TCP IPv4->IPv6 redir port",
686 .lookup_prog = skel->progs.redir_port,
687 .sock_map = skel->maps.redir_map,
688 .sotype = SOCK_STREAM,
689 .connect_to = { EXT_IP4, EXT_PORT },
690 .listen_at = { INT_IP4_V6, INT_PORT },
693 .desc = "TCP IPv6 redir with reuseport",
694 .lookup_prog = skel->progs.select_sock_a,
695 .reuseport_prog = skel->progs.select_sock_b,
696 .sock_map = skel->maps.redir_map,
697 .sotype = SOCK_STREAM,
698 .connect_to = { EXT_IP6, EXT_PORT },
699 .listen_at = { INT_IP6, INT_PORT },
700 .accept_on = SERVER_B,
703 .desc = "TCP IPv6 redir skip reuseport",
704 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
705 .reuseport_prog = skel->progs.select_sock_b,
706 .sock_map = skel->maps.redir_map,
707 .sotype = SOCK_STREAM,
708 .connect_to = { EXT_IP6, EXT_PORT },
709 .listen_at = { INT_IP6, INT_PORT },
710 .accept_on = SERVER_A,
/* --- UDP --- */
713 .desc = "UDP IPv4 redir port",
714 .lookup_prog = skel->progs.redir_port,
715 .sock_map = skel->maps.redir_map,
716 .sotype = SOCK_DGRAM,
717 .connect_to = { EXT_IP4, EXT_PORT },
718 .listen_at = { EXT_IP4, INT_PORT },
721 .desc = "UDP IPv4 redir addr",
722 .lookup_prog = skel->progs.redir_ip4,
723 .sock_map = skel->maps.redir_map,
724 .sotype = SOCK_DGRAM,
725 .connect_to = { EXT_IP4, EXT_PORT },
726 .listen_at = { INT_IP4, EXT_PORT },
729 .desc = "UDP IPv4 redir with reuseport",
730 .lookup_prog = skel->progs.select_sock_a,
731 .reuseport_prog = skel->progs.select_sock_b,
732 .sock_map = skel->maps.redir_map,
733 .sotype = SOCK_DGRAM,
734 .connect_to = { EXT_IP4, EXT_PORT },
735 .listen_at = { INT_IP4, INT_PORT },
736 .accept_on = SERVER_B,
739 .desc = "UDP IPv4 redir and reuseport with conns",
740 .lookup_prog = skel->progs.select_sock_a,
741 .reuseport_prog = skel->progs.select_sock_b,
742 .sock_map = skel->maps.redir_map,
743 .sotype = SOCK_DGRAM,
744 .connect_to = { EXT_IP4, EXT_PORT },
745 .listen_at = { INT_IP4, INT_PORT },
746 .accept_on = SERVER_B,
747 .reuseport_has_conns = true,
750 .desc = "UDP IPv4 redir skip reuseport",
751 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
752 .reuseport_prog = skel->progs.select_sock_b,
753 .sock_map = skel->maps.redir_map,
754 .sotype = SOCK_DGRAM,
755 .connect_to = { EXT_IP4, EXT_PORT },
756 .listen_at = { INT_IP4, INT_PORT },
757 .accept_on = SERVER_A,
760 .desc = "UDP IPv6 redir port",
761 .lookup_prog = skel->progs.redir_port,
762 .sock_map = skel->maps.redir_map,
763 .sotype = SOCK_DGRAM,
764 .connect_to = { EXT_IP6, EXT_PORT },
765 .listen_at = { EXT_IP6, INT_PORT },
768 .desc = "UDP IPv6 redir addr",
769 .lookup_prog = skel->progs.redir_ip6,
770 .sock_map = skel->maps.redir_map,
771 .sotype = SOCK_DGRAM,
772 .connect_to = { EXT_IP6, EXT_PORT },
773 .listen_at = { INT_IP6, EXT_PORT },
776 .desc = "UDP IPv4->IPv6 redir port",
777 .lookup_prog = skel->progs.redir_port,
778 .sock_map = skel->maps.redir_map,
779 .sotype = SOCK_DGRAM,
780 .listen_at = { INT_IP4_V6, INT_PORT },
781 .connect_to = { EXT_IP4, EXT_PORT },
784 .desc = "UDP IPv6 redir and reuseport",
785 .lookup_prog = skel->progs.select_sock_a,
786 .reuseport_prog = skel->progs.select_sock_b,
787 .sock_map = skel->maps.redir_map,
788 .sotype = SOCK_DGRAM,
789 .connect_to = { EXT_IP6, EXT_PORT },
790 .listen_at = { INT_IP6, INT_PORT },
791 .accept_on = SERVER_B,
794 .desc = "UDP IPv6 redir and reuseport with conns",
795 .lookup_prog = skel->progs.select_sock_a,
796 .reuseport_prog = skel->progs.select_sock_b,
797 .sock_map = skel->maps.redir_map,
798 .sotype = SOCK_DGRAM,
799 .connect_to = { EXT_IP6, EXT_PORT },
800 .listen_at = { INT_IP6, INT_PORT },
801 .accept_on = SERVER_B,
802 .reuseport_has_conns = true,
805 .desc = "UDP IPv6 redir skip reuseport",
806 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
807 .reuseport_prog = skel->progs.select_sock_b,
808 .sock_map = skel->maps.redir_map,
809 .sotype = SOCK_DGRAM,
810 .connect_to = { EXT_IP6, EXT_PORT },
811 .listen_at = { INT_IP6, INT_PORT },
812 .accept_on = SERVER_A,
815 const struct test *t;
/* Each table entry runs only if selected as a subtest by its description. */
817 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
818 if (test__start_subtest(t->desc))
/*
 * Check that a lookup program can make the socket lookup fail.
 *
 * With t->lookup_prog attached and a server listening at t->listen_at, a
 * client connects to t->connect_to. For UDP the connect() result is replaced
 * by that of send_byte() and a zero-length recv() is issued to collect the
 * asynchronous error. The test passes only if the operation failed with
 * errno == ECONNREFUSED.
 */
823 static void drop_on_lookup(const struct test *t)
825 struct sockaddr_storage dst = {};
826 int client_fd, server_fd, err;
827 struct bpf_link *lookup_link;
830 lookup_link = attach_lookup_prog(t->lookup_prog);
834 server_fd = make_server(t->sotype, t->listen_at.ip, t->listen_at.port,
/* make_socket() rather than make_client(): connect() is expected to fail. */
839 client_fd = make_socket(t->sotype, t->connect_to.ip,
840 t->connect_to.port, &dst);
844 err = connect(client_fd, (void *)&dst, inetaddr_len(&dst));
845 if (t->sotype == SOCK_DGRAM) {
846 err = send_byte(client_fd);
850 /* Read out asynchronous error */
851 n = recv(client_fd, NULL, 0, 0);
854 if (CHECK(!err || errno != ECONNREFUSED, "connect",
855 "unexpected success or error\n"))
856 log_err("expected ECONNREFUSED on connect");
863 bpf_link__destroy(lookup_link);
/*
 * Table-driven "drop on lookup" tests: the lookup_drop program is attached
 * for TCP and UDP over IPv4 and IPv6, and each entry is run as its own
 * subtest.
 *
 * NOTE(review): the "UDP IPv6 drop on lookup" entry listens at INT_PORT while
 * the other three entries listen at EXT_PORT (the port the client connects
 * to). Looks like an inconsistency - confirm whether EXT_PORT was intended.
 */
866 static void test_drop_on_lookup(struct test_sk_lookup *skel)
868 const struct test tests[] = {
870 .desc = "TCP IPv4 drop on lookup",
871 .lookup_prog = skel->progs.lookup_drop,
872 .sotype = SOCK_STREAM,
873 .connect_to = { EXT_IP4, EXT_PORT },
874 .listen_at = { EXT_IP4, EXT_PORT },
877 .desc = "TCP IPv6 drop on lookup",
878 .lookup_prog = skel->progs.lookup_drop,
879 .sotype = SOCK_STREAM,
880 .connect_to = { EXT_IP6, EXT_PORT },
881 .listen_at = { EXT_IP6, EXT_PORT },
884 .desc = "UDP IPv4 drop on lookup",
885 .lookup_prog = skel->progs.lookup_drop,
886 .sotype = SOCK_DGRAM,
887 .connect_to = { EXT_IP4, EXT_PORT },
888 .listen_at = { EXT_IP4, EXT_PORT },
891 .desc = "UDP IPv6 drop on lookup",
892 .lookup_prog = skel->progs.lookup_drop,
893 .sotype = SOCK_DGRAM,
894 .connect_to = { EXT_IP6, EXT_PORT },
895 .listen_at = { EXT_IP6, INT_PORT },
898 const struct test *t;
900 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
901 if (test__start_subtest(t->desc))
/*
 * Check that a drop decided at the reuseport stage fails the lookup.
 *
 * server1 listens at t->listen_at and is stored in t->sock_map as SERVER_A.
 * server2 listens at the client's actual destination (t->connect_to) without
 * a reuseport program. The client must still observe ECONNREFUSED, i.e. the
 * lookup must not fall back to server2.
 */
906 static void drop_on_reuseport(const struct test *t)
908 struct sockaddr_storage dst = { 0 };
909 int client, server1, server2, err;
910 struct bpf_link *lookup_link;
913 lookup_link = attach_lookup_prog(t->lookup_prog);
917 server1 = make_server(t->sotype, t->listen_at.ip, t->listen_at.port,
922 err = update_lookup_map(t->sock_map, SERVER_A, server1);
926 /* second server on destination address we should never reach */
927 server2 = make_server(t->sotype, t->connect_to.ip, t->connect_to.port,
928 NULL /* reuseport prog */);
932 client = make_socket(t->sotype, t->connect_to.ip,
933 t->connect_to.port, &dst);
937 err = connect(client, (void *)&dst, inetaddr_len(&dst));
/* For UDP the failure surfaces only after sending, so err is re-evaluated. */
938 if (t->sotype == SOCK_DGRAM) {
939 err = send_byte(client);
943 /* Read out asynchronous error */
944 n = recv(client, NULL, 0, 0);
947 if (CHECK(!err || errno != ECONNREFUSED, "connect",
948 "unexpected success or error\n"))
949 log_err("expected ECONNREFUSED on connect");
958 bpf_link__destroy(lookup_link);
961 static void test_drop_on_reuseport(struct test_sk_lookup *skel)
963 const struct test tests[] = {
965 .desc = "TCP IPv4 drop on reuseport",
966 .lookup_prog = skel->progs.select_sock_a,
967 .reuseport_prog = skel->progs.reuseport_drop,
968 .sock_map = skel->maps.redir_map,
969 .sotype = SOCK_STREAM,
970 .connect_to = { EXT_IP4, EXT_PORT },
971 .listen_at = { INT_IP4, INT_PORT },
974 .desc = "TCP IPv6 drop on reuseport",
975 .lookup_prog = skel->progs.select_sock_a,
976 .reuseport_prog = skel->progs.reuseport_drop,
977 .sock_map = skel->maps.redir_map,
978 .sotype = SOCK_STREAM,
979 .connect_to = { EXT_IP6, EXT_PORT },
980 .listen_at = { INT_IP6, INT_PORT },
983 .desc = "UDP IPv4 drop on reuseport",
984 .lookup_prog = skel->progs.select_sock_a,
985 .reuseport_prog = skel->progs.reuseport_drop,
986 .sock_map = skel->maps.redir_map,
987 .sotype = SOCK_DGRAM,
988 .connect_to = { EXT_IP4, EXT_PORT },
989 .listen_at = { INT_IP4, INT_PORT },
992 .desc = "TCP IPv6 drop on reuseport",
993 .lookup_prog = skel->progs.select_sock_a,
994 .reuseport_prog = skel->progs.reuseport_drop,
995 .sock_map = skel->maps.redir_map,
996 .sotype = SOCK_STREAM,
997 .connect_to = { EXT_IP6, EXT_PORT },
998 .listen_at = { INT_IP6, INT_PORT },
1001 const struct test *t;
1003 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
1004 if (test__start_subtest(t->desc))
1005 drop_on_reuseport(t);
/*
 * Exercise a lookup program that calls the sk_assign helper.
 *
 * lookup_prog is attached, TCP servers are created at listen_ip on port 0 and
 * stored in skel->maps.redir_map by index, then a client connects to
 * (connect_ip, EXT_PORT). The connection is expected to be accepted on
 * SERVER_B.
 *
 * NOTE(review): "{ -1 }" initializes only server_fds[0] to -1; the remaining
 * elements are zero. The cleanup loop closes every entry that is not -1, so a
 * failure before all slots are assigned makes it close fd 0. Consider
 * initializing every element to -1.
 */
1009 static void run_sk_assign(struct test_sk_lookup *skel,
1010 struct bpf_program *lookup_prog,
1011 const char *listen_ip, const char *connect_ip)
1013 int client_fd, peer_fd, server_fds[MAX_SERVERS] = { -1 };
1014 struct bpf_link *lookup_link;
1017 lookup_link = attach_lookup_prog(lookup_prog);
1021 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
/* Port 0 is passed here, unlike the fixed ports used by the other tests. */
1022 server_fds[i] = make_server(SOCK_STREAM, listen_ip, 0, NULL);
1023 if (server_fds[i] < 0)
1026 err = update_lookup_map(skel->maps.redir_map, i,
1032 client_fd = make_client(SOCK_STREAM, connect_ip, EXT_PORT);
1036 peer_fd = accept(server_fds[SERVER_B], NULL, NULL);
1037 if (CHECK(peer_fd < 0, "accept", "failed\n"))
1044 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
1045 if (server_fds[i] != -1)
1046 close(server_fds[i]);
1048 bpf_link__destroy(lookup_link);
/* IPv4 flavor of run_sk_assign(): listen at INT_IP4, connect to EXT_IP4. */
1051 static void run_sk_assign_v4(struct test_sk_lookup *skel,
1052 struct bpf_program *lookup_prog)
1054 run_sk_assign(skel, lookup_prog, INT_IP4, EXT_IP4);
/* IPv6 flavor of run_sk_assign(): listen at INT_IP6, connect to EXT_IP6. */
1057 static void run_sk_assign_v6(struct test_sk_lookup *skel,
1058 struct bpf_program *lookup_prog)
1060 run_sk_assign(skel, lookup_prog, INT_IP6, EXT_IP6);
/*
 * Exercise redirecting a lookup to an already connected socket.
 *
 * A server is created at (EXT_IP4, EXT_PORT) and a first client is connected
 * to it. That connected socket is stored in redir_map as SERVER_A before the
 * sk_assign_esocknosupport program is attached. A second client then connects
 * to the same address; for UDP a byte is additionally sent and read on the
 * server socket. Resources are released through the cleanup labels in reverse
 * order of acquisition.
 */
1063 static void run_sk_assign_connected(struct test_sk_lookup *skel,
1066 int err, client_fd, connected_fd, server_fd;
1067 struct bpf_link *lookup_link;
1069 server_fd = make_server(sotype, EXT_IP4, EXT_PORT, NULL);
1073 connected_fd = make_client(sotype, EXT_IP4, EXT_PORT);
1074 if (connected_fd < 0)
1075 goto out_close_server;
1077 /* Put a connected socket in redirect map */
1078 err = update_lookup_map(skel->maps.redir_map, SERVER_A, connected_fd);
1080 goto out_close_connected;
/* The program is attached only after the first client has connected. */
1082 lookup_link = attach_lookup_prog(skel->progs.sk_assign_esocknosupport);
1084 goto out_close_connected;
1086 /* Try to redirect TCP SYN / UDP packet to a connected socket */
1087 client_fd = make_client(sotype, EXT_IP4, EXT_PORT);
1089 goto out_unlink_prog;
1090 if (sotype == SOCK_DGRAM) {
1091 send_byte(client_fd);
1092 recv_byte(server_fd);
1097 bpf_link__destroy(lookup_link);
1098 out_close_connected:
1099 close(connected_fd);
/*
 * Subtests for the sk_assign helper and for context access from a lookup
 * program. Each subtest pairs a name with the BPF program that implements
 * the scenario; the last two cover assigning a connected TCP/UDP socket.
 */
1104 static void test_sk_assign_helper(struct test_sk_lookup *skel)
1106 if (test__start_subtest("sk_assign returns EEXIST"))
1107 run_sk_assign_v4(skel, skel->progs.sk_assign_eexist);
1108 if (test__start_subtest("sk_assign honors F_REPLACE"))
1109 run_sk_assign_v4(skel, skel->progs.sk_assign_replace_flag);
1110 if (test__start_subtest("sk_assign accepts NULL socket"))
1111 run_sk_assign_v4(skel, skel->progs.sk_assign_null);
1112 if (test__start_subtest("access ctx->sk"))
1113 run_sk_assign_v4(skel, skel->progs.access_ctx_sk);
/* The same ctx_narrow_access program is run over IPv4 and over IPv6. */
1114 if (test__start_subtest("narrow access to ctx v4"))
1115 run_sk_assign_v4(skel, skel->progs.ctx_narrow_access);
1116 if (test__start_subtest("narrow access to ctx v6"))
1117 run_sk_assign_v6(skel, skel->progs.ctx_narrow_access);
1118 if (test__start_subtest("sk_assign rejects TCP established"))
1119 run_sk_assign_connected(skel, SOCK_STREAM);
1120 if (test__start_subtest("sk_assign rejects UDP connected"))
1121 run_sk_assign_connected(skel, SOCK_DGRAM);
/* Description of one multi-program lookup scenario (see run_multi_prog_lookup). */
1124 struct test_multi_prog {
/* The two lookup programs, attached in this order. */
1126 struct bpf_program *prog1;
1127 struct bpf_program *prog2;
/* Map that receives the server socket under SERVER_A. */
1128 struct bpf_map *redir_map;
/* Map of per-program "done" values, reset before and checked after the run. */
1129 struct bpf_map *run_map;
/* Address the server socket listens at. */
1131 struct inet_addr listen_at;
/*
 * Run one scenario with two lookup programs attached at the same time.
 *
 * The "done" values in t->run_map are written first, then t->prog1 and
 * t->prog2 are attached in that order. A TCP server listening at t->listen_at
 * is stored in t->redir_map as SERVER_A and a client connects to
 * (EXT_IP4, EXT_PORT). connect() must succeed when t->expect_errno is zero
 * and, when it fails, must fail with exactly t->expect_errno. Afterwards
 * run_map must show a non-zero "done" value for both programs, i.e. both were
 * run regardless of the verdict.
 */
1134 static void run_multi_prog_lookup(const struct test_multi_prog *t)
1136 struct sockaddr_storage dst = {};
1137 int map_fd, server_fd, client_fd;
1138 struct bpf_link *link1, *link2;
1139 int prog_idx, done, err;
1141 map_fd = bpf_map__fd(t->run_map);
/* One run_map update per program before anything is attached. */
1145 err = bpf_map_update_elem(map_fd, &prog_idx, &done, BPF_ANY);
1146 if (CHECK(err, "bpf_map_update_elem", "failed\n"))
1149 err = bpf_map_update_elem(map_fd, &prog_idx, &done, BPF_ANY);
1150 if (CHECK(err, "bpf_map_update_elem", "failed\n"))
1153 link1 = attach_lookup_prog(t->prog1);
1156 link2 = attach_lookup_prog(t->prog2);
1160 server_fd = make_server(SOCK_STREAM, t->listen_at.ip,
1161 t->listen_at.port, NULL);
1165 err = update_lookup_map(t->redir_map, SERVER_A, server_fd);
1167 goto out_close_server;
1169 client_fd = make_socket(SOCK_STREAM, EXT_IP4, EXT_PORT, &dst);
1171 goto out_close_server;
1173 err = connect(client_fd, (void *)&dst, inetaddr_len(&dst));
/* A failure is acceptable only when expected, and only with that errno. */
1174 if (CHECK(err && !t->expect_errno, "connect",
1175 "unexpected error %d\n", errno))
1176 goto out_close_client;
1177 if (CHECK(err && t->expect_errno && errno != t->expect_errno,
1178 "connect", "unexpected error %d\n", errno))
1179 goto out_close_client;
/* Both programs must have recorded that they ran. */
1183 err = bpf_map_lookup_elem(map_fd, &prog_idx, &done);
1184 CHECK(err, "bpf_map_lookup_elem", "failed\n");
1185 CHECK(!done, "bpf_map_lookup_elem", "PROG1 !done\n");
1189 err = bpf_map_lookup_elem(map_fd, &prog_idx, &done);
1190 CHECK(err, "bpf_map_lookup_elem", "failed\n");
1191 CHECK(!done, "bpf_map_lookup_elem", "PROG2 !done\n");
1198 bpf_link__destroy(link2);
1200 bpf_link__destroy(link1);
/*
 * Table-driven tests for two lookup programs attached together, covering the
 * pass/drop/redir combinations of the first and second program. Entries that
 * involve a redirect listen at the internal address; the others listen at the
 * external one. The shared maps are filled into each entry right before it is
 * run, which is why the table is not const.
 */
1203 static void test_multi_prog_lookup(struct test_sk_lookup *skel)
1205 struct test_multi_prog tests[] = {
1207 .desc = "multi prog - pass, pass",
1208 .prog1 = skel->progs.multi_prog_pass1,
1209 .prog2 = skel->progs.multi_prog_pass2,
1210 .listen_at = { EXT_IP4, EXT_PORT },
1213 .desc = "multi prog - drop, drop",
1214 .prog1 = skel->progs.multi_prog_drop1,
1215 .prog2 = skel->progs.multi_prog_drop2,
1216 .listen_at = { EXT_IP4, EXT_PORT },
1217 .expect_errno = ECONNREFUSED,
1220 .desc = "multi prog - pass, drop",
1221 .prog1 = skel->progs.multi_prog_pass1,
1222 .prog2 = skel->progs.multi_prog_drop2,
1223 .listen_at = { EXT_IP4, EXT_PORT },
1224 .expect_errno = ECONNREFUSED,
1227 .desc = "multi prog - drop, pass",
1228 .prog1 = skel->progs.multi_prog_drop1,
1229 .prog2 = skel->progs.multi_prog_pass2,
1230 .listen_at = { EXT_IP4, EXT_PORT },
1231 .expect_errno = ECONNREFUSED,
1234 .desc = "multi prog - pass, redir",
1235 .prog1 = skel->progs.multi_prog_pass1,
1236 .prog2 = skel->progs.multi_prog_redir2,
1237 .listen_at = { INT_IP4, INT_PORT },
1240 .desc = "multi prog - redir, pass",
1241 .prog1 = skel->progs.multi_prog_redir1,
1242 .prog2 = skel->progs.multi_prog_pass2,
1243 .listen_at = { INT_IP4, INT_PORT },
1246 .desc = "multi prog - drop, redir",
1247 .prog1 = skel->progs.multi_prog_drop1,
1248 .prog2 = skel->progs.multi_prog_redir2,
1249 .listen_at = { INT_IP4, INT_PORT },
1252 .desc = "multi prog - redir, drop",
1253 .prog1 = skel->progs.multi_prog_redir1,
1254 .prog2 = skel->progs.multi_prog_drop2,
1255 .listen_at = { INT_IP4, INT_PORT },
1258 .desc = "multi prog - redir, redir",
1259 .prog1 = skel->progs.multi_prog_redir1,
1260 .prog2 = skel->progs.multi_prog_redir2,
1261 .listen_at = { INT_IP4, INT_PORT },
1264 struct test_multi_prog *t;
1266 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
/* Maps are common to every entry, so they are set here, not in the table. */
1267 t->redir_map = skel->maps.redir_map;
1268 t->run_map = skel->maps.run_map;
1269 if (test__start_subtest(t->desc))
1270 run_multi_prog_lookup(t);
/*
 * Run every test group against the loaded skeleton: the query subtest first,
 * then the redirect, drop-on-lookup, drop-on-reuseport, sk_assign and
 * multi-program groups, each of which registers its own subtests.
 */
1274 static void run_tests(struct test_sk_lookup *skel)
1276 if (test__start_subtest("query lookup prog"))
1277 query_lookup_prog(skel);
1278 test_redirect_lookup(skel);
1279 test_drop_on_lookup(skel);
1280 test_drop_on_reuseport(skel);
1281 test_sk_assign_helper(skel);
1282 test_multi_prog_lookup(skel);
/*
 * Move the process into a new network namespace and configure it.
 *
 * After unshare(CLONE_NEWNET) the commands in setup_script are processed one
 * by one until the terminating NULL entry: the external and internal IPv6
 * test addresses are added to the loopback device, which is then brought up.
 * A failing command is logged together with its text.
 */
1285 static int switch_netns(void)
1287 static const char * const setup_script[] = {
1288 "ip -6 addr add dev lo " EXT_IP6 "/128",
1289 "ip -6 addr add dev lo " INT_IP6 "/128",
1290 "ip link set dev lo up",
1293 const char * const *cmd;
1296 err = unshare(CLONE_NEWNET);
1297 if (CHECK(err, "unshare", "failed\n")) {
1298 log_err("unshare(CLONE_NEWNET)");
1302 for (cmd = setup_script; *cmd; cmd++) {
1304 if (CHECK(err, "system", "failed\n")) {
1305 log_err("system(%s)", *cmd);
/*
 * Test entry point: switch to a dedicated network namespace, open and load
 * the test_sk_lookup BPF skeleton, and destroy the skeleton when finished.
 */
1313 void test_sk_lookup(void)
1315 struct test_sk_lookup *skel;
1318 err = switch_netns();
1322 skel = test_sk_lookup__open_and_load();
1323 if (CHECK(!skel, "skel open_and_load", "failed\n"))
1328 test_sk_lookup__destroy(skel);