1 // SPDX-License-Identifier: GPL-2.0
2 // Copyright (c) 2018 Facebook
10 #include <arpa/inet.h>
11 #include <netinet/in.h>
12 #include <sys/types.h>
13 #include <sys/select.h>
14 #include <sys/socket.h>
16 #include <linux/filter.h>
19 #include <bpf/libbpf.h>
21 #include "cgroup_helpers.h"
22 #include "bpf_rlimit.h"
29 #define CG_PATH "/foo"
30 #define CONNECT4_PROG_PATH "./connect4_prog.o"
31 #define CONNECT6_PROG_PATH "./connect6_prog.o"
32 #define SENDMSG4_PROG_PATH "./sendmsg4_prog.o"
33 #define SENDMSG6_PROG_PATH "./sendmsg6_prog.o"
35 #define SERV4_IP "192.168.1.254"
36 #define SERV4_REWRITE_IP "127.0.0.1"
37 #define SRC4_IP "172.16.0.1"
38 #define SRC4_REWRITE_IP "127.0.0.4"
39 #define SERV4_PORT 4040
40 #define SERV4_REWRITE_PORT 4444
42 #define SERV6_IP "face:b00c:1234:5678::abcd"
43 #define SERV6_REWRITE_IP "::1"
44 #define SERV6_V4MAPPED_IP "::ffff:192.168.0.4"
46 #define SRC6_REWRITE_IP "::6"
47 #define WILDCARD6_IP "::"
48 #define SERV6_PORT 6060
49 #define SERV6_REWRITE_PORT 6666
51 #define INET_NTOP_BUF 40
53 struct sock_addr_test;
55 typedef int (*load_fn)(const struct sock_addr_test *test);
56 typedef int (*info_fn)(int, struct sockaddr *, socklen_t *);
58 char bpf_log_buf[BPF_LOG_BUF_SIZE];
/* Description of a single test case stored in the tests[] table.
 * Only part of the structure is visible in this excerpt: members that are
 * referenced elsewhere in the file (descr, loadfn, domain, type,
 * expected_result) are declared on lines not shown here.
 */
60 struct sock_addr_test {
62 /* BPF prog properties */
64 enum bpf_attach_type expected_attach_type;
65 enum bpf_attach_type attach_type;
66 /* Socket properties */
69 /* IP:port pairs for BPF prog to override */
70 const char *requested_ip;
71 unsigned short requested_port;
72 const char *expected_ip;
73 unsigned short expected_port;
74 const char *expected_src_ip;
75 /* Expected test result */
/* Forward declarations of the program loaders. All of them share the
 * load_fn signature, so the tests[] table below can reference them before
 * their definitions.
 */
86 static int bind4_prog_load(const struct sock_addr_test *test);
87 static int bind6_prog_load(const struct sock_addr_test *test);
88 static int connect4_prog_load(const struct sock_addr_test *test);
89 static int connect6_prog_load(const struct sock_addr_test *test);
90 static int sendmsg_allow_prog_load(const struct sock_addr_test *test);
91 static int sendmsg_deny_prog_load(const struct sock_addr_test *test);
92 static int recvmsg_allow_prog_load(const struct sock_addr_test *test);
93 static int recvmsg_deny_prog_load(const struct sock_addr_test *test);
94 static int sendmsg4_rw_asm_prog_load(const struct sock_addr_test *test);
95 static int recvmsg4_rw_asm_prog_load(const struct sock_addr_test *test);
96 static int sendmsg4_rw_c_prog_load(const struct sock_addr_test *test);
97 static int sendmsg6_rw_asm_prog_load(const struct sock_addr_test *test);
98 static int recvmsg6_rw_asm_prog_load(const struct sock_addr_test *test);
99 static int sendmsg6_rw_c_prog_load(const struct sock_addr_test *test);
100 static int sendmsg6_rw_v4mapped_prog_load(const struct sock_addr_test *test);
101 static int sendmsg6_rw_wildcard_prog_load(const struct sock_addr_test *test);
/* Table of test cases; run_tests() walks it with ARRAY_SIZE(tests) and hands
 * each entry to run_test_case().
 * In this excerpt an entry shows its description string, its loader (for
 * the sendmsg/recvmsg entries) and two bpf_attach_type values. Judging by
 * the member order of struct sock_addr_test these are presumably
 * expected_attach_type followed by attach_type -- TODO confirm against the
 * complete initializers, which are not visible here.
 */
103 static struct sock_addr_test tests[] = {
106 "bind4: load prog with wrong expected attach type",
108 BPF_CGROUP_INET6_BIND,
109 BPF_CGROUP_INET4_BIND,
120 "bind4: attach prog with wrong attach type",
122 BPF_CGROUP_INET4_BIND,
123 BPF_CGROUP_INET6_BIND,
134 "bind4: rewrite IP & TCP port in",
136 BPF_CGROUP_INET4_BIND,
137 BPF_CGROUP_INET4_BIND,
148 "bind4: rewrite IP & UDP port in",
150 BPF_CGROUP_INET4_BIND,
151 BPF_CGROUP_INET4_BIND,
162 "bind6: load prog with wrong expected attach type",
164 BPF_CGROUP_INET4_BIND,
165 BPF_CGROUP_INET6_BIND,
176 "bind6: attach prog with wrong attach type",
178 BPF_CGROUP_INET6_BIND,
179 BPF_CGROUP_INET4_BIND,
190 "bind6: rewrite IP & TCP port in",
192 BPF_CGROUP_INET6_BIND,
193 BPF_CGROUP_INET6_BIND,
204 "bind6: rewrite IP & UDP port in",
206 BPF_CGROUP_INET6_BIND,
207 BPF_CGROUP_INET6_BIND,
220 "connect4: load prog with wrong expected attach type",
222 BPF_CGROUP_INET6_CONNECT,
223 BPF_CGROUP_INET4_CONNECT,
234 "connect4: attach prog with wrong attach type",
236 BPF_CGROUP_INET4_CONNECT,
237 BPF_CGROUP_INET6_CONNECT,
248 "connect4: rewrite IP & TCP port",
250 BPF_CGROUP_INET4_CONNECT,
251 BPF_CGROUP_INET4_CONNECT,
262 "connect4: rewrite IP & UDP port",
264 BPF_CGROUP_INET4_CONNECT,
265 BPF_CGROUP_INET4_CONNECT,
276 "connect6: load prog with wrong expected attach type",
278 BPF_CGROUP_INET4_CONNECT,
279 BPF_CGROUP_INET6_CONNECT,
290 "connect6: attach prog with wrong attach type",
292 BPF_CGROUP_INET6_CONNECT,
293 BPF_CGROUP_INET4_CONNECT,
304 "connect6: rewrite IP & TCP port",
306 BPF_CGROUP_INET6_CONNECT,
307 BPF_CGROUP_INET6_CONNECT,
318 "connect6: rewrite IP & UDP port",
320 BPF_CGROUP_INET6_CONNECT,
321 BPF_CGROUP_INET6_CONNECT,
334 "sendmsg4: load prog with wrong expected attach type",
335 sendmsg4_rw_asm_prog_load,
336 BPF_CGROUP_UDP6_SENDMSG,
337 BPF_CGROUP_UDP4_SENDMSG,
348 "sendmsg4: attach prog with wrong attach type",
349 sendmsg4_rw_asm_prog_load,
350 BPF_CGROUP_UDP4_SENDMSG,
351 BPF_CGROUP_UDP6_SENDMSG,
362 "sendmsg4: rewrite IP & port (asm)",
363 sendmsg4_rw_asm_prog_load,
364 BPF_CGROUP_UDP4_SENDMSG,
365 BPF_CGROUP_UDP4_SENDMSG,
376 "sendmsg4: rewrite IP & port (C)",
377 sendmsg4_rw_c_prog_load,
378 BPF_CGROUP_UDP4_SENDMSG,
379 BPF_CGROUP_UDP4_SENDMSG,
390 "sendmsg4: deny call",
391 sendmsg_deny_prog_load,
392 BPF_CGROUP_UDP4_SENDMSG,
393 BPF_CGROUP_UDP4_SENDMSG,
404 "sendmsg6: load prog with wrong expected attach type",
405 sendmsg6_rw_asm_prog_load,
406 BPF_CGROUP_UDP4_SENDMSG,
407 BPF_CGROUP_UDP6_SENDMSG,
418 "sendmsg6: attach prog with wrong attach type",
419 sendmsg6_rw_asm_prog_load,
420 BPF_CGROUP_UDP6_SENDMSG,
421 BPF_CGROUP_UDP4_SENDMSG,
432 "sendmsg6: rewrite IP & port (asm)",
433 sendmsg6_rw_asm_prog_load,
434 BPF_CGROUP_UDP6_SENDMSG,
435 BPF_CGROUP_UDP6_SENDMSG,
446 "sendmsg6: rewrite IP & port (C)",
447 sendmsg6_rw_c_prog_load,
448 BPF_CGROUP_UDP6_SENDMSG,
449 BPF_CGROUP_UDP6_SENDMSG,
460 "sendmsg6: IPv4-mapped IPv6",
461 sendmsg6_rw_v4mapped_prog_load,
462 BPF_CGROUP_UDP6_SENDMSG,
463 BPF_CGROUP_UDP6_SENDMSG,
474 "sendmsg6: set dst IP = [::] (BSD'ism)",
475 sendmsg6_rw_wildcard_prog_load,
476 BPF_CGROUP_UDP6_SENDMSG,
477 BPF_CGROUP_UDP6_SENDMSG,
488 "sendmsg6: preserve dst IP = [::] (BSD'ism)",
489 sendmsg_allow_prog_load,
490 BPF_CGROUP_UDP6_SENDMSG,
491 BPF_CGROUP_UDP6_SENDMSG,
502 "sendmsg6: deny call",
503 sendmsg_deny_prog_load,
504 BPF_CGROUP_UDP6_SENDMSG,
505 BPF_CGROUP_UDP6_SENDMSG,
518 "recvmsg4: return code ok",
519 recvmsg_allow_prog_load,
520 BPF_CGROUP_UDP4_RECVMSG,
521 BPF_CGROUP_UDP4_RECVMSG,
532 "recvmsg4: return code !ok",
533 recvmsg_deny_prog_load,
534 BPF_CGROUP_UDP4_RECVMSG,
535 BPF_CGROUP_UDP4_RECVMSG,
546 "recvmsg6: return code ok",
547 recvmsg_allow_prog_load,
548 BPF_CGROUP_UDP6_RECVMSG,
549 BPF_CGROUP_UDP6_RECVMSG,
560 "recvmsg6: return code !ok",
561 recvmsg_deny_prog_load,
562 BPF_CGROUP_UDP6_RECVMSG,
563 BPF_CGROUP_UDP6_RECVMSG,
574 "recvmsg4: rewrite IP & port (asm)",
575 recvmsg4_rw_asm_prog_load,
576 BPF_CGROUP_UDP4_RECVMSG,
577 BPF_CGROUP_UDP4_RECVMSG,
588 "recvmsg6: rewrite IP & port (asm)",
589 recvmsg6_rw_asm_prog_load,
590 BPF_CGROUP_UDP6_RECVMSG,
591 BPF_CGROUP_UDP6_RECVMSG,
/* Build a socket address in the caller-provided buffer.
 *
 * domain:   AF_INET or AF_INET6; anything else is logged as unsupported.
 * ip:       textual address, parsed with inet_pton() for the given domain.
 * port:     port in host byte order; stored after htons().
 * addr:     output buffer, zeroed over addr_len bytes before being filled.
 * addr_len: size of the buffer; checked against sizeof(struct sockaddr_in)
 *           or sizeof(struct sockaddr_in6) depending on domain.
 *
 * Callers in this file compare the result with -1 to detect failure; the
 * return statements themselves are on lines not visible in this excerpt.
 */
603 static int mk_sockaddr(int domain, const char *ip, unsigned short port,
604 struct sockaddr *addr, socklen_t addr_len)
606 struct sockaddr_in6 *addr6;
607 struct sockaddr_in *addr4;
609 if (domain != AF_INET && domain != AF_INET6) {
610 log_err("Unsupported address family");
614 memset(addr, 0, addr_len);
616 if (domain == AF_INET) {
617 if (addr_len < sizeof(struct sockaddr_in))
619 addr4 = (struct sockaddr_in *)addr;
620 addr4->sin_family = domain;
621 addr4->sin_port = htons(port);
622 if (inet_pton(domain, ip, (void *)&addr4->sin_addr) != 1) {
623 log_err("Invalid IPv4: %s", ip);
626 } else if (domain == AF_INET6) {
627 if (addr_len < sizeof(struct sockaddr_in6))
629 addr6 = (struct sockaddr_in6 *)addr;
630 addr6->sin6_family = domain;
631 addr6->sin6_port = htons(port);
632 if (inet_pton(domain, ip, (void *)&addr6->sin6_addr) != 1) {
633 log_err("Invalid IPv6: %s", ip);
/* Load a raw instruction array as a BPF_PROG_TYPE_CGROUP_SOCK_ADDR program.
 *
 * The program is loaded with test->expected_attach_type and a "GPL" license
 * through bpf_load_program_xattr(); verifier output is collected in the
 * global bpf_log_buf. When loading fails and the test does not expect
 * LOAD_REJECT, the verifier log is printed via log_err().
 * The value returned to the caller is on a line not visible here; callers
 * treat it as the program fd (negative on failure).
 */
641 static int load_insns(const struct sock_addr_test *test,
642 const struct bpf_insn *insns, size_t insns_cnt)
644 struct bpf_load_program_attr load_attr;
647 memset(&load_attr, 0, sizeof(struct bpf_load_program_attr));
648 load_attr.prog_type = BPF_PROG_TYPE_CGROUP_SOCK_ADDR;
649 load_attr.expected_attach_type = test->expected_attach_type;
650 load_attr.insns = insns;
651 load_attr.insns_cnt = insns_cnt;
652 load_attr.license = "GPL";
654 ret = bpf_load_program_xattr(&load_attr, bpf_log_buf, BPF_LOG_BUF_SIZE);
655 if (ret < 0 && test->expected_result != LOAD_REJECT) {
656 log_err(">>> Loading program error.\n"
657 ">>> Verifier output:\n%s\n-------\n", bpf_log_buf);
663 /* [1] These testing programs try to read different context fields, including
664 * narrow loads of different sizes from user_ip4 and user_ip6, and write to
665 * those allowed to be overridden.
667 * [2] BPF_LD_IMM64 & BPF_JMP_REG are used below whenever there is a need to
668 * compare a register with unsigned 32bit integer. BPF_JMP_IMM can't be used
669 * in such cases since it accepts only _signed_ 32bit integer as IMM
670 * argument. Also note that BPF_LD_IMM64 expands to 2 instructions, which
671 * matters when counting jump offsets.
/* Build and load the IPv4 bind test program from hand-written instructions.
 *
 * The generated program checks that the context describes an AF_INET socket
 * of type SOCK_DGRAM or SOCK_STREAM and that user_ip4 / user_port match
 * SERV4_IP / htons(SERV4_PORT), reading them with byte, half-word and word
 * loads. When every check passes it stores the address and port taken from
 * addr4_rw (SERV4_REWRITE_IP:SERV4_REWRITE_PORT) into user_ip4 and
 * user_port. The jump offsets decrease towards the end of the check chain,
 * so presumably every failed check lands on the same tail of the program
 * -- TODO confirm against the complete instruction list.
 *
 * The instruction array is passed to load_insns() and its result returned.
 */
674 static int bind4_prog_load(const struct sock_addr_test *test)
678 uint16_t u4_addr16[2];
681 struct sockaddr_in addr4_rw;
683 if (inet_pton(AF_INET, SERV4_IP, (void *)&ip4) != 1) {
684 log_err("Invalid IPv4: %s", SERV4_IP);
688 port.u4_addr32 = htons(SERV4_PORT);
690 if (mk_sockaddr(AF_INET, SERV4_REWRITE_IP, SERV4_REWRITE_PORT,
691 (struct sockaddr *)&addr4_rw, sizeof(addr4_rw)) == -1)
695 struct bpf_insn insns[] = {
696 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
698 /* if (sk.family == AF_INET && */
699 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
700 offsetof(struct bpf_sock_addr, family)),
701 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET, 32),
703 /* (sk.type == SOCK_DGRAM || sk.type == SOCK_STREAM) && */
704 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
705 offsetof(struct bpf_sock_addr, type)),
706 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, SOCK_DGRAM, 1),
708 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, SOCK_STREAM, 28),
710 /* 1st_byte_of_user_ip4 == expected && */
711 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
712 offsetof(struct bpf_sock_addr, user_ip4)),
713 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr8[0], 26),
715 /* 2nd_byte_of_user_ip4 == expected && */
716 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
717 offsetof(struct bpf_sock_addr, user_ip4) + 1),
718 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr8[1], 24),
720 /* 3rd_byte_of_user_ip4 == expected && */
721 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
722 offsetof(struct bpf_sock_addr, user_ip4) + 2),
723 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr8[2], 22),
725 /* 4th_byte_of_user_ip4 == expected && */
726 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
727 offsetof(struct bpf_sock_addr, user_ip4) + 3),
728 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr8[3], 20),
730 /* 1st_half_of_user_ip4 == expected && */
731 BPF_LDX_MEM(BPF_H, BPF_REG_7, BPF_REG_6,
732 offsetof(struct bpf_sock_addr, user_ip4)),
733 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr16[0], 18),
735 /* 2nd_half_of_user_ip4 == expected && */
736 BPF_LDX_MEM(BPF_H, BPF_REG_7, BPF_REG_6,
737 offsetof(struct bpf_sock_addr, user_ip4) + 2),
738 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip4.u4_addr16[1], 16),
740 /* whole_user_ip4 == expected && */
741 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
742 offsetof(struct bpf_sock_addr, user_ip4)),
743 BPF_LD_IMM64(BPF_REG_8, ip4.u4_addr32), /* See [2]. */
744 BPF_JMP_REG(BPF_JNE, BPF_REG_7, BPF_REG_8, 12),
746 /* 1st_byte_of_user_port == expected && */
747 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
748 offsetof(struct bpf_sock_addr, user_port)),
749 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, port.u4_addr8[0], 10),
751 /* 1st_half_of_user_port == expected && */
752 BPF_LDX_MEM(BPF_H, BPF_REG_7, BPF_REG_6,
753 offsetof(struct bpf_sock_addr, user_port)),
754 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, port.u4_addr16[0], 8),
756 /* user_port == expected) { */
757 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
758 offsetof(struct bpf_sock_addr, user_port)),
759 BPF_LD_IMM64(BPF_REG_8, port.u4_addr32), /* See [2]. */
760 BPF_JMP_REG(BPF_JNE, BPF_REG_7, BPF_REG_8, 4),
762 /* user_ip4 = addr4_rw.sin_addr */
763 BPF_MOV32_IMM(BPF_REG_7, addr4_rw.sin_addr.s_addr),
764 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
765 offsetof(struct bpf_sock_addr, user_ip4)),
767 /* user_port = addr4_rw.sin_port */
768 BPF_MOV32_IMM(BPF_REG_7, addr4_rw.sin_port),
769 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
770 offsetof(struct bpf_sock_addr, user_port)),
774 BPF_MOV64_IMM(BPF_REG_0, 1),
778 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Build and load the IPv6 bind test program from hand-written instructions.
 *
 * The generated program checks that the context family is AF_INET6 and
 * that selected parts of user_ip6 (one byte and one half-word of word 1,
 * and the whole of word 3) match SERV6_IP. When the checks pass it stores
 * the port from addr6_rw (SERV6_REWRITE_IP:SERV6_REWRITE_PORT) into
 * user_port; the STORE_IPV6_WORD() helper macro defined here writes one
 * word of addr6_rw.sin6_addr into user_ip6, but its uses are on lines not
 * visible in this excerpt.
 *
 * The instruction array is passed to load_insns() and its result returned.
 */
781 static int bind6_prog_load(const struct sock_addr_test *test)
783 struct sockaddr_in6 addr6_rw;
786 if (inet_pton(AF_INET6, SERV6_IP, (void *)&ip6) != 1) {
787 log_err("Invalid IPv6: %s", SERV6_IP);
791 if (mk_sockaddr(AF_INET6, SERV6_REWRITE_IP, SERV6_REWRITE_PORT,
792 (struct sockaddr *)&addr6_rw, sizeof(addr6_rw)) == -1)
796 struct bpf_insn insns[] = {
797 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
799 /* if (sk.family == AF_INET6 && */
800 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
801 offsetof(struct bpf_sock_addr, family)),
802 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET6, 18),
804 /* 5th_byte_of_user_ip6 == expected && */
805 BPF_LDX_MEM(BPF_B, BPF_REG_7, BPF_REG_6,
806 offsetof(struct bpf_sock_addr, user_ip6[1])),
807 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip6.s6_addr[4], 16),
809 /* 3rd_half_of_user_ip6 == expected && */
810 BPF_LDX_MEM(BPF_H, BPF_REG_7, BPF_REG_6,
811 offsetof(struct bpf_sock_addr, user_ip6[1])),
812 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, ip6.s6_addr16[2], 14),
814 /* last_word_of_user_ip6 == expected) { */
815 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
816 offsetof(struct bpf_sock_addr, user_ip6[3])),
817 BPF_LD_IMM64(BPF_REG_8, ip6.s6_addr32[3]), /* See [2]. */
818 BPF_JMP_REG(BPF_JNE, BPF_REG_7, BPF_REG_8, 10),
821 #define STORE_IPV6_WORD(N) \
822 BPF_MOV32_IMM(BPF_REG_7, addr6_rw.sin6_addr.s6_addr32[N]), \
823 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7, \
824 offsetof(struct bpf_sock_addr, user_ip6[N]))
826 /* user_ip6 = addr6_rw.sin6_addr */
832 /* user_port = addr6_rw.sin6_port */
833 BPF_MOV32_IMM(BPF_REG_7, addr6_rw.sin6_port),
834 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
835 offsetof(struct bpf_sock_addr, user_port)),
840 BPF_MOV64_IMM(BPF_REG_0, 1),
844 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Load a compiled BPF object as a BPF_PROG_TYPE_CGROUP_SOCK_ADDR program.
 *
 * The load attributes carry test->expected_attach_type and the
 * BPF_F_TEST_RND_HI32 program flag; loading goes through
 * bpf_prog_load_xattr(). On failure an error mentioning path is logged
 * unless the test expects LOAD_REJECT.
 * How path is handed to the loader and what is returned are on lines not
 * visible in this excerpt.
 */
847 static int load_path(const struct sock_addr_test *test, const char *path)
849 struct bpf_prog_load_attr attr;
850 struct bpf_object *obj;
853 memset(&attr, 0, sizeof(struct bpf_prog_load_attr));
855 attr.prog_type = BPF_PROG_TYPE_CGROUP_SOCK_ADDR;
856 attr.expected_attach_type = test->expected_attach_type;
857 attr.prog_flags = BPF_F_TEST_RND_HI32;
859 if (bpf_prog_load_xattr(&attr, &obj, &prog_fd)) {
860 if (test->expected_result != LOAD_REJECT)
861 log_err(">>> Loading program (%s) error.\n", path);
/* Loader for the connect4 tests: loads the object at CONNECT4_PROG_PATH. */
868 static int connect4_prog_load(const struct sock_addr_test *test)
870 return load_path(test, CONNECT4_PROG_PATH);
/* Loader for the connect6 tests: loads the object at CONNECT6_PROG_PATH. */
873 static int connect6_prog_load(const struct sock_addr_test *test)
875 return load_path(test, CONNECT6_PROG_PATH);
/* Load a minimal program whose visible instruction sets R0 to rc, i.e. a
 * program that only produces a return code. The second parameter (rc) is
 * declared on a line not visible in this excerpt.
 */
878 static int xmsg_ret_only_prog_load(const struct sock_addr_test *test,
881 struct bpf_insn insns[] = {
883 BPF_MOV64_IMM(BPF_REG_0, rc),
886 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Loader for a sendmsg program that only returns 1. */
889 static int sendmsg_allow_prog_load(const struct sock_addr_test *test)
891 return xmsg_ret_only_prog_load(test, /*rc*/ 1);
/* Loader for a sendmsg program that only returns 0. */
894 static int sendmsg_deny_prog_load(const struct sock_addr_test *test)
896 return xmsg_ret_only_prog_load(test, /*rc*/ 0);
/* Loader for a recvmsg program that only returns 1. */
899 static int recvmsg_allow_prog_load(const struct sock_addr_test *test)
901 return xmsg_ret_only_prog_load(test, /*rc*/ 1);
/* Loader for a recvmsg program that only returns 0. */
904 static int recvmsg_deny_prog_load(const struct sock_addr_test *test)
906 return xmsg_ret_only_prog_load(test, /*rc*/ 0);
/* Build and load the IPv4 sendmsg rewrite program from instructions.
 *
 * For an AF_INET / SOCK_DGRAM context the generated program stores
 * SRC4_REWRITE_IP into msg_src_ip4 and the address and port of
 * SERV4_REWRITE_IP:SERV4_REWRITE_PORT into user_ip4 / user_port.
 * The instruction array is passed to load_insns() and its result returned.
 */
909 static int sendmsg4_rw_asm_prog_load(const struct sock_addr_test *test)
911 struct sockaddr_in dst4_rw_addr;
912 struct in_addr src4_rw_ip;
914 if (inet_pton(AF_INET, SRC4_REWRITE_IP, (void *)&src4_rw_ip) != 1) {
915 log_err("Invalid IPv4: %s", SRC4_REWRITE_IP);
919 if (mk_sockaddr(AF_INET, SERV4_REWRITE_IP, SERV4_REWRITE_PORT,
920 (struct sockaddr *)&dst4_rw_addr,
921 sizeof(dst4_rw_addr)) == -1)
924 struct bpf_insn insns[] = {
925 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
927 /* if (sk.family == AF_INET && */
928 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
929 offsetof(struct bpf_sock_addr, family)),
930 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET, 8),
932 /* sk.type == SOCK_DGRAM) { */
933 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
934 offsetof(struct bpf_sock_addr, type)),
935 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, SOCK_DGRAM, 6),
937 /* msg_src_ip4 = src4_rw_ip */
938 BPF_MOV32_IMM(BPF_REG_7, src4_rw_ip.s_addr),
939 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
940 offsetof(struct bpf_sock_addr, msg_src_ip4)),
942 /* user_ip4 = dst4_rw_addr.sin_addr */
943 BPF_MOV32_IMM(BPF_REG_7, dst4_rw_addr.sin_addr.s_addr),
944 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
945 offsetof(struct bpf_sock_addr, user_ip4)),
947 /* user_port = dst4_rw_addr.sin_port */
948 BPF_MOV32_IMM(BPF_REG_7, dst4_rw_addr.sin_port),
949 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
950 offsetof(struct bpf_sock_addr, user_port)),
954 BPF_MOV64_IMM(BPF_REG_0, 1),
958 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Build and load the IPv4 recvmsg rewrite program from instructions.
 *
 * For an AF_INET / SOCK_DGRAM context the generated program stores the
 * address and port of SERV4_IP:SERV4_PORT into user_ip4 / user_port.
 * The instruction array is passed to load_insns() and its result returned.
 */
961 static int recvmsg4_rw_asm_prog_load(const struct sock_addr_test *test)
963 struct sockaddr_in src4_rw_addr;
965 if (mk_sockaddr(AF_INET, SERV4_IP, SERV4_PORT,
966 (struct sockaddr *)&src4_rw_addr,
967 sizeof(src4_rw_addr)) == -1)
970 struct bpf_insn insns[] = {
971 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
973 /* if (sk.family == AF_INET && */
974 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
975 offsetof(struct bpf_sock_addr, family)),
976 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET, 6),
978 /* sk.type == SOCK_DGRAM) { */
979 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
980 offsetof(struct bpf_sock_addr, type)),
981 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, SOCK_DGRAM, 4),
983 /* user_ip4 = src4_rw_addr.sin_addr */
984 BPF_MOV32_IMM(BPF_REG_7, src4_rw_addr.sin_addr.s_addr),
985 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
986 offsetof(struct bpf_sock_addr, user_ip4)),
988 /* user_port = src4_rw_addr.sin_port */
989 BPF_MOV32_IMM(BPF_REG_7, src4_rw_addr.sin_port),
990 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
991 offsetof(struct bpf_sock_addr, user_port)),
995 BPF_MOV64_IMM(BPF_REG_0, 1),
999 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Loader for the C variant of the sendmsg4 rewrite program: loads the
 * object at SENDMSG4_PROG_PATH.
 */
1002 static int sendmsg4_rw_c_prog_load(const struct sock_addr_test *test)
1004 return load_path(test, SENDMSG4_PROG_PATH);
/* Build and load an IPv6 sendmsg rewrite program with a configurable
 * destination address.
 *
 * rw_dst_ip: textual IPv6 address the program writes into user_ip6.
 *
 * For an AF_INET6 context the generated program stores SRC6_REWRITE_IP into
 * msg_src_ip6, rw_dst_ip into user_ip6 and the port of SERV6_REWRITE_PORT
 * (as stored by mk_sockaddr()) into user_port. The STORE_IPV6_WORD_N() and
 * STORE_IPV6() macros defined here expand to one move+store pair per 32-bit
 * word; STORE_IPV6() is also used later in this file.
 * The instruction array is passed to load_insns() and its result returned.
 */
1007 static int sendmsg6_rw_dst_asm_prog_load(const struct sock_addr_test *test,
1008 const char *rw_dst_ip)
1010 struct sockaddr_in6 dst6_rw_addr;
1011 struct in6_addr src6_rw_ip;
1013 if (inet_pton(AF_INET6, SRC6_REWRITE_IP, (void *)&src6_rw_ip) != 1) {
1014 log_err("Invalid IPv6: %s", SRC6_REWRITE_IP);
1018 if (mk_sockaddr(AF_INET6, rw_dst_ip, SERV6_REWRITE_PORT,
1019 (struct sockaddr *)&dst6_rw_addr,
1020 sizeof(dst6_rw_addr)) == -1)
1023 struct bpf_insn insns[] = {
1024 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
1026 /* if (sk.family == AF_INET6) { */
1027 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
1028 offsetof(struct bpf_sock_addr, family)),
1029 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET6, 18),
1031 #define STORE_IPV6_WORD_N(DST, SRC, N) \
1032 BPF_MOV32_IMM(BPF_REG_7, SRC[N]), \
1033 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7, \
1034 offsetof(struct bpf_sock_addr, DST[N]))
1036 #define STORE_IPV6(DST, SRC) \
1037 STORE_IPV6_WORD_N(DST, SRC, 0), \
1038 STORE_IPV6_WORD_N(DST, SRC, 1), \
1039 STORE_IPV6_WORD_N(DST, SRC, 2), \
1040 STORE_IPV6_WORD_N(DST, SRC, 3)
1042 STORE_IPV6(msg_src_ip6, src6_rw_ip.s6_addr32),
1043 STORE_IPV6(user_ip6, dst6_rw_addr.sin6_addr.s6_addr32),
1045 /* user_port = dst6_rw_addr.sin6_port */
1046 BPF_MOV32_IMM(BPF_REG_7, dst6_rw_addr.sin6_port),
1047 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
1048 offsetof(struct bpf_sock_addr, user_port)),
1053 BPF_MOV64_IMM(BPF_REG_0, 1),
1057 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Loader for the sendmsg6 rewrite program with SERV6_REWRITE_IP as the
 * rewritten destination.
 */
1060 static int sendmsg6_rw_asm_prog_load(const struct sock_addr_test *test)
1062 return sendmsg6_rw_dst_asm_prog_load(test, SERV6_REWRITE_IP);
/* Build and load the IPv6 recvmsg rewrite program from instructions.
 *
 * For an AF_INET6 context the generated program stores the address and
 * port of SERV6_IP:SERV6_PORT into user_ip6 / user_port. It relies on the
 * STORE_IPV6() macro defined earlier in this file.
 * The instruction array is passed to load_insns() and its result returned.
 */
1065 static int recvmsg6_rw_asm_prog_load(const struct sock_addr_test *test)
1067 struct sockaddr_in6 src6_rw_addr;
1069 if (mk_sockaddr(AF_INET6, SERV6_IP, SERV6_PORT,
1070 (struct sockaddr *)&src6_rw_addr,
1071 sizeof(src6_rw_addr)) == -1)
1074 struct bpf_insn insns[] = {
1075 BPF_MOV64_REG(BPF_REG_6, BPF_REG_1),
1077 /* if (sk.family == AF_INET6) { */
1078 BPF_LDX_MEM(BPF_W, BPF_REG_7, BPF_REG_6,
1079 offsetof(struct bpf_sock_addr, family)),
1080 BPF_JMP_IMM(BPF_JNE, BPF_REG_7, AF_INET6, 10),
1082 STORE_IPV6(user_ip6, src6_rw_addr.sin6_addr.s6_addr32),
1084 /* user_port = src6_rw_addr.sin6_port */
1085 BPF_MOV32_IMM(BPF_REG_7, src6_rw_addr.sin6_port),
1086 BPF_STX_MEM(BPF_W, BPF_REG_6, BPF_REG_7,
1087 offsetof(struct bpf_sock_addr, user_port)),
1091 BPF_MOV64_IMM(BPF_REG_0, 1),
1095 return load_insns(test, insns, sizeof(insns) / sizeof(struct bpf_insn));
/* Loader for the sendmsg6 rewrite program with the IPv4-mapped address
 * SERV6_V4MAPPED_IP as the rewritten destination.
 */
1098 static int sendmsg6_rw_v4mapped_prog_load(const struct sock_addr_test *test)
1100 return sendmsg6_rw_dst_asm_prog_load(test, SERV6_V4MAPPED_IP);
/* Loader for the sendmsg6 rewrite program with the wildcard address
 * WILDCARD6_IP ("::") as the rewritten destination.
 */
1103 static int sendmsg6_rw_wildcard_prog_load(const struct sock_addr_test *test)
1105 return sendmsg6_rw_dst_asm_prog_load(test, WILDCARD6_IP);
/* Loader for the C variant of the sendmsg6 rewrite program: loads the
 * object at SENDMSG6_PROG_PATH.
 */
1108 static int sendmsg6_rw_c_prog_load(const struct sock_addr_test *test)
1110 return load_path(test, SENDMSG6_PROG_PATH);
/* Compare two socket addresses.
 *
 * For AF_INET and AF_INET6 the result is 0 when the IP addresses are equal
 * (and, if cmp_port is non-zero, the ports are equal too) and 1 otherwise.
 * The values returned for mismatching or unsupported families are on lines
 * not visible in this excerpt.
 */
1113 static int cmp_addr(const struct sockaddr_storage *addr1,
1114 const struct sockaddr_storage *addr2, int cmp_port)
1116 const struct sockaddr_in *four1, *four2;
1117 const struct sockaddr_in6 *six1, *six2;
1119 if (addr1->ss_family != addr2->ss_family)
1122 if (addr1->ss_family == AF_INET) {
1123 four1 = (const struct sockaddr_in *)addr1;
1124 four2 = (const struct sockaddr_in *)addr2;
1125 return !((four1->sin_port == four2->sin_port || !cmp_port) &&
1126 four1->sin_addr.s_addr == four2->sin_addr.s_addr);
1127 } else if (addr1->ss_family == AF_INET6) {
1128 six1 = (const struct sockaddr_in6 *)addr1;
1129 six2 = (const struct sockaddr_in6 *)addr2;
1130 return !((six1->sin6_port == six2->sin6_port || !cmp_port) &&
1131 !memcmp(&six1->sin6_addr, &six2->sin6_addr,
1132 sizeof(struct in6_addr)));
/* Query an address of socket sock1 through fn (callers in this file pass
 * getsockname or getpeername) and compare it with addr2 using cmp_addr().
 * cmp_port is forwarded to cmp_addr(). The value returned when fn fails is
 * on a line not visible in this excerpt.
 */
1138 static int cmp_sock_addr(info_fn fn, int sock1,
1139 const struct sockaddr_storage *addr2, int cmp_port)
1141 struct sockaddr_storage addr1;
1142 socklen_t len1 = sizeof(addr1);
1144 memset(&addr1, 0, len1);
1145 if (fn(sock1, (struct sockaddr *)&addr1, (socklen_t *)&len1) != 0)
1148 return cmp_addr(&addr1, addr2, cmp_port);
/* Compare the local (getsockname) IP of sock1 with addr2, ignoring ports. */
1151 static int cmp_local_ip(int sock1, const struct sockaddr_storage *addr2)
1153 return cmp_sock_addr(getsockname, sock1, addr2, /*cmp_port*/ 0);
/* Compare the local (getsockname) IP and port of sock1 with addr2. */
1156 static int cmp_local_addr(int sock1, const struct sockaddr_storage *addr2)
1158 return cmp_sock_addr(getsockname, sock1, addr2, /*cmp_port*/ 1);
/* Compare the peer (getpeername) IP and port of sock1 with addr2. */
1161 static int cmp_peer_addr(int sock1, const struct sockaddr_storage *addr2)
1163 return cmp_sock_addr(getpeername, sock1, addr2, /*cmp_port*/ 1);
/* Create a socket of the given type in addr's address family, bind it to
 * addr and, for SOCK_STREAM, start listening with a backlog of 128.
 * Each failing step is reported with log_err(). The remaining parameter(s),
 * the cleanup and the return values are on lines not visible in this
 * excerpt; callers store the result as the server fd.
 */
1166 static int start_server(int type, const struct sockaddr_storage *addr,
1171 fd = socket(addr->ss_family, type, 0);
1173 log_err("Failed to create server socket");
1177 if (bind(fd, (const struct sockaddr *)addr, addr_len) == -1) {
1178 log_err("Failed to bind server socket");
1182 if (type == SOCK_STREAM) {
1183 if (listen(fd, 128) == -1) {
1184 log_err("Failed to listen on server socket");
/* Create a client socket of the given type in addr's address family
 * (AF_INET or AF_INET6 only) and connect() it to addr.
 * Each failing step is reported with log_err(). The remaining parameter(s),
 * the cleanup and the return values are on lines not visible in this
 * excerpt; callers store the result as the client fd.
 */
1197 static int connect_to_server(int type, const struct sockaddr_storage *addr,
1203 domain = addr->ss_family;
1205 if (domain != AF_INET && domain != AF_INET6) {
1206 log_err("Unsupported address family");
1210 fd = socket(domain, type, 0);
1212 log_err("Failed to create client socket");
1216 if (connect(fd, (const struct sockaddr *)addr, addr_len) == -1) {
1217 log_err("Fail to connect to server");
/* Fill a control message header with packet-info ancillary data.
 *
 * AF_INET:  SOL_IP / IP_PKTINFO with ipi_spec_dst set to SRC4_IP.
 * AF_INET6: SOL_IPV6 / IPV6_PKTINFO with ipi6_addr set to SRC6_IP.
 *
 * The pktinfo payload is zeroed before the address is written. The caller
 * in this file treats a non-zero result as failure; the return statements
 * are on lines not visible in this excerpt.
 * NOTE(review): unlike the other helpers here this function is not
 * declared static -- confirm whether external linkage is intended.
 */
1229 int init_pktinfo(int domain, struct cmsghdr *cmsg)
1231 struct in6_pktinfo *pktinfo6;
1232 struct in_pktinfo *pktinfo4;
1234 if (domain == AF_INET) {
1235 cmsg->cmsg_level = SOL_IP;
1236 cmsg->cmsg_type = IP_PKTINFO;
1237 cmsg->cmsg_len = CMSG_LEN(sizeof(struct in_pktinfo));
1238 pktinfo4 = (struct in_pktinfo *)CMSG_DATA(cmsg);
1239 memset(pktinfo4, 0, sizeof(struct in_pktinfo));
1240 if (inet_pton(domain, SRC4_IP,
1241 (void *)&pktinfo4->ipi_spec_dst) != 1)
1243 } else if (domain == AF_INET6) {
1244 cmsg->cmsg_level = SOL_IPV6;
1245 cmsg->cmsg_type = IPV6_PKTINFO;
1246 cmsg->cmsg_len = CMSG_LEN(sizeof(struct in6_pktinfo));
1247 pktinfo6 = (struct in6_pktinfo *)CMSG_DATA(cmsg);
1248 memset(pktinfo6, 0, sizeof(struct in6_pktinfo));
1249 if (inet_pton(domain, SRC6_IP,
1250 (void *)&pktinfo6->ipi6_addr) != 1)
/* Create a client socket and send one message to addr with sendmsg().
 *
 * type:      socket type passed to socket().
 * addr:      destination, used as msg_name; must be AF_INET or AF_INET6.
 * addr_len:  length stored in msg_namelen.
 * set_cmsg:  presumably selects whether packet-info ancillary data is
 *            attached via init_pktinfo() -- the condition itself is on a
 *            line not visible in this excerpt.
 * flags:     flags passed to sendmsg().
 *
 * When sendmsg() does not send sizeof(data) bytes, errno is stored through
 * syscall_err (a parameter declared on a line not visible here).
 * Cleanup and return values are likewise not visible; callers store the
 * result as the client fd.
 */
1259 static int sendmsg_to_server(int type, const struct sockaddr_storage *addr,
1260 socklen_t addr_len, int set_cmsg, int flags,
1264 char buf[CMSG_SPACE(sizeof(struct in6_pktinfo))];
1265 struct cmsghdr align;
1268 char buf[CMSG_SPACE(sizeof(struct in_pktinfo))];
1269 struct cmsghdr align;
1277 domain = addr->ss_family;
1279 if (domain != AF_INET && domain != AF_INET6) {
1280 log_err("Unsupported address family");
1284 fd = socket(domain, type, 0);
1286 log_err("Failed to create client socket");
1290 memset(&iov, 0, sizeof(iov));
1291 iov.iov_base = &data;
1292 iov.iov_len = sizeof(data);
1294 memset(&hdr, 0, sizeof(hdr));
1295 hdr.msg_name = (void *)addr;
1296 hdr.msg_namelen = addr_len;
1301 if (domain == AF_INET) {
1302 hdr.msg_control = &control4;
1303 hdr.msg_controllen = sizeof(control4.buf);
1304 } else if (domain == AF_INET6) {
1305 hdr.msg_control = &control6;
1306 hdr.msg_controllen = sizeof(control6.buf);
1308 if (init_pktinfo(domain, CMSG_FIRSTHDR(&hdr))) {
1309 log_err("Fail to init pktinfo");
1314 if (sendmsg(fd, &hdr, flags) != sizeof(data)) {
1315 log_err("Fail to send message to server");
/* NOTE(review): errno is read after log_err() above; if log_err() can
 * change errno, the value stored here may not be the one set by
 * sendmsg() -- confirm.
 */
1316 *syscall_err = errno;
/* Connect to addr by sending data on a SOCK_STREAM socket with
 * MSG_FASTOPEN, without ancillary data; implemented on top of
 * sendmsg_to_server(). The syscall error is collected in a local
 * (sendmsg_err) whose declaration is not visible in this excerpt.
 */
1328 static int fastconnect_to_server(const struct sockaddr_storage *addr,
1333 return sendmsg_to_server(SOCK_STREAM, addr, addr_len, /*set_cmsg*/0,
1334 MSG_FASTOPEN, &sendmsg_err);
/* Wait with select() until sockfd is readable, then receive one message
 * with recvmsg(), storing the sender's address into src_addr.
 * The select() timeout (tv) is initialised on lines not visible in this
 * excerpt, as is the value returned when select() fails or times out.
 * On the success path the result of recvmsg() is returned.
 */
1337 static int recvmsg_from_client(int sockfd, struct sockaddr_storage *src_addr)
1346 FD_SET(sockfd, &rfds);
1351 if (select(sockfd + 1, &rfds, NULL, NULL, &tv) <= 0 ||
1352 !FD_ISSET(sockfd, &rfds))
1355 memset(&iov, 0, sizeof(iov));
1356 iov.iov_base = data;
1357 iov.iov_len = sizeof(data);
1359 memset(&hdr, 0, sizeof(hdr));
1360 hdr.msg_name = src_addr;
1361 hdr.msg_namelen = sizeof(struct sockaddr_storage);
1365 return recvmsg(sockfd, &hdr, 0);
/* Build the socket addresses a test case works with.
 *
 * expected_addr:     from test->expected_ip / test->expected_port.
 * requested_addr:    from test->requested_ip / test->requested_port.
 * expected_src_addr: from test->expected_src_ip with port 0; only built
 *                    when test->expected_src_ip is non-NULL.
 *
 * All addresses use test->domain and are created with mk_sockaddr().
 * The return statements are on lines not visible in this excerpt; callers
 * treat a non-zero result as failure.
 */
1368 static int init_addrs(const struct sock_addr_test *test,
1369 struct sockaddr_storage *requested_addr,
1370 struct sockaddr_storage *expected_addr,
1371 struct sockaddr_storage *expected_src_addr)
1373 socklen_t addr_len = sizeof(struct sockaddr_storage);
1375 if (mk_sockaddr(test->domain, test->expected_ip, test->expected_port,
1376 (struct sockaddr *)expected_addr, addr_len) == -1)
1379 if (mk_sockaddr(test->domain, test->requested_ip, test->requested_port,
1380 (struct sockaddr *)requested_addr, addr_len) == -1)
1383 if (test->expected_src_ip &&
1384 mk_sockaddr(test->domain, test->expected_src_ip, 0,
1385 (struct sockaddr *)expected_src_addr, addr_len) == -1)
/* Exercise a bind test case: start a server bound to the requested
 * address, check with cmp_local_addr() that the socket actually ended up
 * on the expected address, then connect a client to the expected
 * address. No expected source address is built (NULL is passed to
 * init_addrs()). Error handling and cleanup are on lines not visible here.
 */
1393 static int run_bind_test_case(const struct sock_addr_test *test)
1395 socklen_t addr_len = sizeof(struct sockaddr_storage);
1396 struct sockaddr_storage requested_addr;
1397 struct sockaddr_storage expected_addr;
1402 if (init_addrs(test, &requested_addr, &expected_addr, NULL))
1405 servfd = start_server(test->type, &requested_addr, addr_len);
1409 if (cmp_local_addr(servfd, &expected_addr))
1412 /* Try to connect to server just in case */
1413 clientfd = connect_to_server(test->type, &expected_addr, addr_len);
/* Exercise a connect test case: start a server on the expected address,
 * connect a client to the requested address and verify that the client's
 * peer address equals the expected address and its local IP equals the
 * expected source address. For SOCK_STREAM the same checks are repeated
 * for a TCP Fast Open connection made with fastconnect_to_server().
 * Error handling and cleanup are on lines not visible in this excerpt.
 */
1426 static int run_connect_test_case(const struct sock_addr_test *test)
1428 socklen_t addr_len = sizeof(struct sockaddr_storage);
1429 struct sockaddr_storage expected_src_addr;
1430 struct sockaddr_storage requested_addr;
1431 struct sockaddr_storage expected_addr;
1436 if (init_addrs(test, &requested_addr, &expected_addr,
1437 &expected_src_addr))
1440 /* Prepare server to connect to */
1441 servfd = start_server(test->type, &expected_addr, addr_len);
1445 clientfd = connect_to_server(test->type, &requested_addr, addr_len);
1449 /* Make sure src and dst addrs were overridden properly */
1450 if (cmp_peer_addr(clientfd, &expected_addr))
1453 if (cmp_local_ip(clientfd, &expected_src_addr))
1456 if (test->type == SOCK_STREAM) {
1457 /* Test TCP Fast Open scenario */
/* NOTE(review): clientfd from connect_to_server() is overwritten below;
 * no close() of the earlier descriptor is visible in this excerpt --
 * confirm it is not leaked.
 */
1458 clientfd = fastconnect_to_server(&requested_addr, addr_len);
1462 /* Make sure src and dst addrs were overridden properly */
1463 if (cmp_peer_addr(clientfd, &expected_addr))
1466 if (cmp_local_ip(clientfd, &expected_src_addr))
/* Exercise a sendmsg/recvmsg test case (SOCK_DGRAM only).
 *
 * init_addrs() is called so that sendmsg_addr receives the requested
 * address, server_addr the expected address and expected_addr the expected
 * source address. A server is started on server_addr; then, for set_cmsg
 * from 0 to max_cmsg inclusive, a message is sent to sendmsg_addr, received
 * on the server socket, and the sender address reported by recvmsg() is
 * compared (IP only) with expected_addr.
 * Error handling and cleanup are on lines not visible in this excerpt.
 */
1479 static int run_xmsg_test_case(const struct sock_addr_test *test, int max_cmsg)
1481 socklen_t addr_len = sizeof(struct sockaddr_storage);
1482 struct sockaddr_storage expected_addr;
1483 struct sockaddr_storage server_addr;
1484 struct sockaddr_storage sendmsg_addr;
1485 struct sockaddr_storage recvmsg_addr;
1491 if (test->type != SOCK_DGRAM)
1494 if (init_addrs(test, &sendmsg_addr, &server_addr, &expected_addr))
1497 /* Prepare server to sendmsg to */
1498 servfd = start_server(test->type, &server_addr, addr_len);
1502 for (set_cmsg = 0; set_cmsg <= max_cmsg; ++set_cmsg) {
1506 clientfd = sendmsg_to_server(test->type, &sendmsg_addr,
1507 addr_len, set_cmsg, /*flags*/0,
1511 else if (clientfd == -1)
1514 /* Try to receive message on server instead of using
1515 * getpeername(2) on client socket, to check that client's
1516 * destination address was rewritten properly, since
1517 * getpeername(2) doesn't work with unconnected datagram
1520 * Get source address from recvmsg(2) as well to make sure
1521 * source was rewritten properly: getsockname(2) can't be used
1522 * since socket is unconnected and source defined for one
1523 * specific packet may differ from the one used by default and
1524 * returned by getsockname(2).
1526 if (recvmsg_from_client(servfd, &recvmsg_addr) == -1)
1529 if (cmp_addr(&recvmsg_addr, &expected_addr, /*cmp_port*/0))
/* Run one test case against the cgroup referred to by cgfd.
 *
 * Steps visible in this excerpt:
 *  1. load the program through test->loadfn and compare the outcome with
 *     an expected LOAD_REJECT;
 *  2. attach it to cgfd as test->attach_type with BPF_F_ALLOW_OVERRIDE and
 *     compare the outcome with an expected ATTACH_REJECT / ATTACH_OKAY;
 *  3. dispatch on test->attach_type to the bind, connect or xmsg runner
 *     (sendmsg runs with max_cmsg 1, recvmsg with max_cmsg 0);
 *  4. treat EPERM / ENOTSUPP results as success when the test expects
 *     SYSCALL_EPERM / SYSCALL_ENOTSUPP;
 *  5. detach the program (best effort) and print PASS or FAIL.
 * The jumps between these steps and the return value are on lines not
 * visible here.
 */
1542 static int run_test_case(int cgfd, const struct sock_addr_test *test)
1547 printf("Test case: %s .. ", test->descr);
1549 progfd = test->loadfn(test);
1550 if (test->expected_result == LOAD_REJECT && progfd < 0)
1552 else if (test->expected_result == LOAD_REJECT || progfd < 0)
1555 err = bpf_prog_attach(progfd, cgfd, test->attach_type,
1556 BPF_F_ALLOW_OVERRIDE);
1557 if (test->expected_result == ATTACH_REJECT && err) {
1558 err = 0; /* error was expected, reset it */
1560 } else if (test->expected_result == ATTACH_REJECT || err) {
1562 } else if (test->expected_result == ATTACH_OKAY) {
1567 switch (test->attach_type) {
1568 case BPF_CGROUP_INET4_BIND:
1569 case BPF_CGROUP_INET6_BIND:
1570 err = run_bind_test_case(test);
1572 case BPF_CGROUP_INET4_CONNECT:
1573 case BPF_CGROUP_INET6_CONNECT:
1574 err = run_connect_test_case(test);
1576 case BPF_CGROUP_UDP4_SENDMSG:
1577 case BPF_CGROUP_UDP6_SENDMSG:
1578 err = run_xmsg_test_case(test, 1);
1580 case BPF_CGROUP_UDP4_RECVMSG:
1581 case BPF_CGROUP_UDP6_RECVMSG:
1582 err = run_xmsg_test_case(test, 0);
1588 if (test->expected_result == SYSCALL_EPERM && err == EPERM) {
1589 err = 0; /* error was expected, reset it */
1593 if (test->expected_result == SYSCALL_ENOTSUPP && err == ENOTSUPP) {
1594 err = 0; /* error was expected, reset it */
1598 if (err || test->expected_result != SUCCESS)
1605 /* Detaching w/o checking return code: best effort attempt. */
1607 bpf_prog_detach(cgfd, test->attach_type);
1609 printf("[%s]\n", err ? "FAIL" : "PASS");
/* Run every entry of tests[] against cgfd, print a summary of passed and
 * failed cases, and return -1 if any case failed, 0 otherwise. The counter
 * updates are on lines not visible in this excerpt.
 */
1613 static int run_tests(int cgfd)
1619 for (i = 0; i < ARRAY_SIZE(tests); ++i) {
1620 if (run_test_case(cgfd, &tests[i]))
1625 printf("Summary: %d PASSED, %d FAILED\n", passes, fails);
1626 return fails ? -1 : 0;
/* Program entry point. Visible steps: a message telling the user to run
 * the test through its .sh wrapper (the condition that triggers it is not
 * visible in this excerpt), joining the CG_PATH cgroup with
 * cgroup_setup_and_join(), running all tests, and tearing the cgroup
 * environment down with cleanup_cgroup_environment().
 */
1629 int main(int argc, char **argv)
1636 "%s has to be run via %s.sh. Skip direct run.\n",
1641 cgfd = cgroup_setup_and_join(CG_PATH);
1645 if (run_tests(cgfd))
1653 cleanup_cgroup_environment();