1 // SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
2 // Copyright (c) 2020 Cloudflare
4 * Test BPF attach point for INET socket lookup (BPF_SK_LOOKUP).
7 * - attaching/detaching/querying programs to BPF_SK_LOOKUP hook,
8 * - redirecting socket lookup to a socket selected by BPF program,
9 * - failing a socket lookup on BPF program's request,
10 * - error scenarios for selecting a socket from BPF program,
11 * - accessing BPF program context,
12 * - attaching and running multiple BPF programs.
14 * Tests run in a dedicated network namespace.
18 #include <arpa/inet.h>
25 #include <sys/types.h>
29 #include <bpf/libbpf.h>
32 #include "test_progs.h"
34 #include "cgroup_helpers.h"
35 #include "network_helpers.h"
36 #include "testing_helpers.h"
37 #include "test_sk_lookup.skel.h"
39 /* External (address, port) pairs the client sends packets to. */
40 #define EXT_IP4 "127.0.0.1"
41 #define EXT_IP6 "fd00::1"
44 /* Internal (address, port) pairs the server listens/receives at. */
45 #define INT_IP4 "127.0.0.2"
46 #define INT_IP4_V6 "::ffff:127.0.0.2"
47 #define INT_IP6 "fd00::2"
50 #define IO_TIMEOUT_SEC 3
70 struct bpf_program *lookup_prog;
71 struct bpf_program *reuseport_prog;
72 struct bpf_map *sock_map;
74 struct inet_addr connect_to;
75 struct inet_addr listen_at;
76 enum server accept_on;
77 bool reuseport_has_conns; /* Add a connected socket to reuseport group */
80 static __u32 duration; /* for CHECK macro */
/* Return true when the textual address contains a ':' (i.e. is IPv6 notation). */
static bool is_ipv6(const char *ip)
{
	return strchr(ip, ':') != NULL;
}
87 static int attach_reuseport(int sock_fd, struct bpf_program *reuseport_prog)
91 prog_fd = bpf_program__fd(reuseport_prog);
97 err = setsockopt(sock_fd, SOL_SOCKET, SO_ATTACH_REUSEPORT_EBPF,
98 &prog_fd, sizeof(prog_fd));
/*
 * Size of the concrete sockaddr stored in @addr, chosen by address family:
 * sockaddr_in for AF_INET, sockaddr_in6 for AF_INET6, 0 for anything else.
 */
static socklen_t inetaddr_len(const struct sockaddr_storage *addr)
{
	switch (addr->ss_family) {
	case AF_INET:
		return sizeof(struct sockaddr_in);
	case AF_INET6:
		return sizeof(struct sockaddr_in6);
	default:
		return 0;
	}
}
111 static int make_socket(int sotype, const char *ip, int port,
112 struct sockaddr_storage *addr)
114 struct timeval timeo = { .tv_sec = IO_TIMEOUT_SEC };
117 family = is_ipv6(ip) ? AF_INET6 : AF_INET;
118 err = make_sockaddr(family, ip, port, addr, NULL);
119 if (CHECK(err, "make_address", "failed\n"))
122 fd = socket(addr->ss_family, sotype, 0);
123 if (CHECK(fd < 0, "socket", "failed\n")) {
124 log_err("failed to make socket");
128 err = setsockopt(fd, SOL_SOCKET, SO_SNDTIMEO, &timeo, sizeof(timeo));
129 if (CHECK(err, "setsockopt(SO_SNDTIMEO)", "failed\n")) {
130 log_err("failed to set SNDTIMEO");
135 err = setsockopt(fd, SOL_SOCKET, SO_RCVTIMEO, &timeo, sizeof(timeo));
136 if (CHECK(err, "setsockopt(SO_RCVTIMEO)", "failed\n")) {
137 log_err("failed to set RCVTIMEO");
145 static int make_server(int sotype, const char *ip, int port,
146 struct bpf_program *reuseport_prog)
148 struct sockaddr_storage addr = {0};
152 fd = make_socket(sotype, ip, port, &addr);
156 /* Enabled for UDPv6 sockets for IPv4-mapped IPv6 to work. */
157 if (sotype == SOCK_DGRAM) {
158 err = setsockopt(fd, SOL_IP, IP_RECVORIGDSTADDR, &one,
160 if (CHECK(err, "setsockopt(IP_RECVORIGDSTADDR)", "failed\n")) {
161 log_err("failed to enable IP_RECVORIGDSTADDR");
166 if (sotype == SOCK_DGRAM && addr.ss_family == AF_INET6) {
167 err = setsockopt(fd, SOL_IPV6, IPV6_RECVORIGDSTADDR, &one,
169 if (CHECK(err, "setsockopt(IPV6_RECVORIGDSTADDR)", "failed\n")) {
170 log_err("failed to enable IPV6_RECVORIGDSTADDR");
175 if (sotype == SOCK_STREAM) {
176 err = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &one,
178 if (CHECK(err, "setsockopt(SO_REUSEADDR)", "failed\n")) {
179 log_err("failed to enable SO_REUSEADDR");
184 if (reuseport_prog) {
185 err = setsockopt(fd, SOL_SOCKET, SO_REUSEPORT, &one,
187 if (CHECK(err, "setsockopt(SO_REUSEPORT)", "failed\n")) {
188 log_err("failed to enable SO_REUSEPORT");
193 err = bind(fd, (void *)&addr, inetaddr_len(&addr));
194 if (CHECK(err, "bind", "failed\n")) {
195 log_err("failed to bind listen socket");
199 if (sotype == SOCK_STREAM) {
200 err = listen(fd, SOMAXCONN);
201 if (CHECK(err, "make_server", "listen")) {
202 log_err("failed to listen on port %d", port);
207 /* Late attach reuseport prog so we can have one init path */
208 if (reuseport_prog) {
209 err = attach_reuseport(fd, reuseport_prog);
210 if (CHECK(err, "attach_reuseport", "failed\n")) {
211 log_err("failed to attach reuseport prog");
/*
 * Create a socket of type @sotype and connect it to (@ip, @port).
 *
 * Returns the connected socket FD, or -1 on failure (the socket is closed
 * first).
 */
static int make_client(int sotype, const char *ip, int port)
{
	struct sockaddr_storage peer = {0};
	int sock, rc;

	sock = make_socket(sotype, ip, port, &peer);
	if (sock < 0)
		return -1;

	rc = connect(sock, (void *)&peer, inetaddr_len(&peer));
	if (CHECK(rc, "make_client", "connect")) {
		log_err("failed to connect client socket");
		close(sock);
		return -1;
	}

	return sock;
}
243 static __u64 socket_cookie(int fd)
246 socklen_t cookie_len = sizeof(cookie);
248 if (CHECK(getsockopt(fd, SOL_SOCKET, SO_COOKIE, &cookie, &cookie_len) < 0,
249 "getsockopt(SO_COOKIE)", "%s\n", strerror(errno)))
254 static int fill_sk_lookup_ctx(struct bpf_sk_lookup *ctx, const char *local_ip, __u16 local_port,
255 const char *remote_ip, __u16 remote_port)
257 void *local, *remote;
260 memset(ctx, 0, sizeof(*ctx));
261 ctx->local_port = local_port;
262 ctx->remote_port = htons(remote_port);
264 if (is_ipv6(local_ip)) {
265 ctx->family = AF_INET6;
266 local = &ctx->local_ip6[0];
267 remote = &ctx->remote_ip6[0];
269 ctx->family = AF_INET;
270 local = &ctx->local_ip4;
271 remote = &ctx->remote_ip4;
274 err = inet_pton(ctx->family, local_ip, local);
275 if (CHECK(err != 1, "inet_pton", "local_ip failed\n"))
278 err = inet_pton(ctx->family, remote_ip, remote);
279 if (CHECK(err != 1, "inet_pton", "remote_ip failed\n"))
/* Send the single byte "a" on @fd. Returns 0 on success, -1 otherwise. */
static int send_byte(int fd)
{
	ssize_t sent;

	errno = 0;
	sent = send(fd, "a", 1, 0);
	if (!CHECK(sent <= 0, "send_byte", "send"))
		return 0;

	log_err("failed/partial send");
	return -1;
}
/* Receive one byte from @fd. Returns 0 on success, -1 otherwise. */
static int recv_byte(int fd)
{
	char buf[1];
	ssize_t got;

	got = recv(fd, buf, sizeof(buf), 0);
	if (!CHECK(got <= 0, "recv_byte", "recv"))
		return 0;

	log_err("failed/partial recv");
	return -1;
}
/*
 * Accept one connection on @server_fd, read up to one byte from it and echo
 * back what was read. The accepted socket is closed before returning.
 *
 * Returns 0 on success, -1 on any failure.
 */
static int tcp_recv_send(int server_fd)
{
	char buf[1];
	int conn, ret = -1;
	ssize_t n;

	conn = accept(server_fd, NULL, NULL);
	if (CHECK(conn < 0, "accept", "failed\n")) {
		log_err("failed to accept");
		return -1;
	}

	n = recv(conn, buf, sizeof(buf), 0);
	if (CHECK(n <= 0, "recv", "failed\n")) {
		log_err("failed/partial recv");
		goto out;
	}

	n = send(conn, buf, n, 0);
	if (CHECK(n <= 0, "send", "failed\n")) {
		log_err("failed/partial send");
		goto out;
	}

	ret = 0;
out:
	close(conn);
	return ret;
}
/*
 * Rewrite, in place, the IPv4 socket address held in @ss as the equivalent
 * IPv4-mapped IPv6 address (::ffff:a.b.c.d) with the same port.
 *
 * Only the family, port and address fields of the resulting sockaddr_in6
 * are written.
 */
static void v4_to_v6(struct sockaddr_storage *ss)
{
	/* ::ffff:0:0/96 prefix: ten zero bytes followed by two 0xff bytes. */
	static const unsigned char mapped_prefix[12] = {
		[10] = 0xff,
		[11] = 0xff,
	};
	struct sockaddr_in6 *out = (struct sockaddr_in6 *)ss;
	struct sockaddr_in in;

	/* Snapshot the IPv4 view first; the writes below overlap it. */
	memcpy(&in, ss, sizeof(in));

	out->sin6_family = AF_INET6;
	out->sin6_port = in.sin_port;
	memcpy(&out->sin6_addr.s6_addr[0], mapped_prefix, sizeof(mapped_prefix));
	memcpy(&out->sin6_addr.s6_addr[12], &in.sin_addr.s_addr, 4);
}
356 static int udp_recv_send(int server_fd)
358 char cmsg_buf[CMSG_SPACE(sizeof(struct sockaddr_storage))];
359 struct sockaddr_storage _src_addr = { 0 };
360 struct sockaddr_storage *src_addr = &_src_addr;
361 struct sockaddr_storage *dst_addr = NULL;
362 struct msghdr msg = { 0 };
363 struct iovec iov = { 0 };
370 iov.iov_len = sizeof(buf);
372 msg.msg_name = src_addr;
373 msg.msg_namelen = sizeof(*src_addr);
376 msg.msg_control = cmsg_buf;
377 msg.msg_controllen = sizeof(cmsg_buf);
380 n = recvmsg(server_fd, &msg, 0);
381 if (CHECK(n <= 0, "recvmsg", "failed\n")) {
382 log_err("failed to receive");
385 if (CHECK(msg.msg_flags & MSG_CTRUNC, "recvmsg", "truncated cmsg\n"))
388 for (cm = CMSG_FIRSTHDR(&msg); cm; cm = CMSG_NXTHDR(&msg, cm)) {
389 if ((cm->cmsg_level == SOL_IP &&
390 cm->cmsg_type == IP_ORIGDSTADDR) ||
391 (cm->cmsg_level == SOL_IPV6 &&
392 cm->cmsg_type == IPV6_ORIGDSTADDR)) {
393 dst_addr = (struct sockaddr_storage *)CMSG_DATA(cm);
396 log_err("warning: ignored cmsg at level %d type %d",
397 cm->cmsg_level, cm->cmsg_type);
399 if (CHECK(!dst_addr, "recvmsg", "missing ORIGDSTADDR\n"))
402 /* Server socket bound to IPv4-mapped IPv6 address */
403 if (src_addr->ss_family == AF_INET6 &&
404 dst_addr->ss_family == AF_INET) {
408 /* Reply from original destination address. */
409 fd = socket(dst_addr->ss_family, SOCK_DGRAM, 0);
410 if (CHECK(fd < 0, "socket", "failed\n")) {
411 log_err("failed to create tx socket");
415 ret = bind(fd, (struct sockaddr *)dst_addr, sizeof(*dst_addr));
416 if (CHECK(ret, "bind", "failed\n")) {
417 log_err("failed to bind tx socket");
421 msg.msg_control = NULL;
422 msg.msg_controllen = 0;
423 n = sendmsg(fd, &msg, 0);
424 if (CHECK(n <= 0, "sendmsg", "failed\n")) {
425 log_err("failed to send echo reply");
/*
 * One TCP echo round trip: client sends a byte, server accepts and echoes
 * it, client reads the reply. Stops at the first failing step.
 *
 * Returns 0 on success, -1 on failure.
 */
static int tcp_echo_test(int client_fd, int server_fd)
{
	if (send_byte(client_fd) ||
	    tcp_recv_send(server_fd) ||
	    recv_byte(client_fd))
		return -1;

	return 0;
}
/*
 * One UDP echo round trip: client sends a byte, server receives and
 * replies, client reads the reply. Stops at the first failing step.
 *
 * Returns 0 on success, -1 on failure.
 */
static int udp_echo_test(int client_fd, int server_fd)
{
	if (send_byte(client_fd) ||
	    udp_recv_send(server_fd) ||
	    recv_byte(client_fd))
		return -1;

	return 0;
}
/*
 * Attach @prog to the network namespace of the calling process, opened via
 * /proc/self/ns/net.
 *
 * Returns the link on success, or NULL on failure. On attach failure errno
 * is set from the error encoded in the returned pointer before logging.
 */
static struct bpf_link *attach_lookup_prog(struct bpf_program *prog)
{
	struct bpf_link *link;
	int netns_fd;

	netns_fd = open("/proc/self/ns/net", O_RDONLY);
	if (CHECK(netns_fd < 0, "open", "failed\n")) {
		log_err("failed to open /proc/self/ns/net");
		return NULL;
	}

	link = bpf_program__attach_netns(prog, netns_fd);
	if (!ASSERT_OK_PTR(link, "bpf_program__attach_netns")) {
		errno = -PTR_ERR(link);
		log_err("failed to attach program '%s' to netns",
			bpf_program__name(prog));
		link = NULL;
	}

	/* The namespace FD is only needed for the attach call itself. */
	close(netns_fd);
	return link;
}
493 static int update_lookup_map(struct bpf_map *map, int index, int sock_fd)
498 map_fd = bpf_map__fd(map);
499 if (CHECK(map_fd < 0, "bpf_map__fd", "failed\n")) {
501 log_err("failed to get map FD");
505 value = (uint64_t)sock_fd;
506 err = bpf_map_update_elem(map_fd, &index, &value, BPF_NOEXIST);
507 if (CHECK(err, "bpf_map_update_elem", "failed\n")) {
508 log_err("failed to update redir_map @ %d", index);
515 static void query_lookup_prog(struct test_sk_lookup *skel)
517 struct bpf_link *link[3] = {};
518 struct bpf_link_info info;
519 __u32 attach_flags = 0;
520 __u32 prog_ids[3] = {};
526 net_fd = open("/proc/self/ns/net", O_RDONLY);
527 if (CHECK(net_fd < 0, "open", "failed\n")) {
528 log_err("failed to open /proc/self/ns/net");
532 link[0] = attach_lookup_prog(skel->progs.lookup_pass);
535 link[1] = attach_lookup_prog(skel->progs.lookup_pass);
538 link[2] = attach_lookup_prog(skel->progs.lookup_drop);
542 err = bpf_prog_query(net_fd, BPF_SK_LOOKUP, 0 /* query flags */,
543 &attach_flags, prog_ids, &prog_cnt);
544 if (CHECK(err, "bpf_prog_query", "failed\n")) {
545 log_err("failed to query lookup prog");
550 if (CHECK(attach_flags != 0, "bpf_prog_query",
551 "wrong attach_flags on query: %u", attach_flags))
553 if (CHECK(prog_cnt != 3, "bpf_prog_query",
554 "wrong program count on query: %u", prog_cnt))
556 prog_id = link_info_prog_id(link[0], &info);
557 CHECK(prog_ids[0] != prog_id, "bpf_prog_query",
558 "invalid program #0 id on query: %u != %u\n",
559 prog_ids[0], prog_id);
560 CHECK(info.netns.netns_ino == 0, "netns_ino",
561 "unexpected netns_ino: %u\n", info.netns.netns_ino);
562 prog_id = link_info_prog_id(link[1], &info);
563 CHECK(prog_ids[1] != prog_id, "bpf_prog_query",
564 "invalid program #1 id on query: %u != %u\n",
565 prog_ids[1], prog_id);
566 CHECK(info.netns.netns_ino == 0, "netns_ino",
567 "unexpected netns_ino: %u\n", info.netns.netns_ino);
568 prog_id = link_info_prog_id(link[2], &info);
569 CHECK(prog_ids[2] != prog_id, "bpf_prog_query",
570 "invalid program #2 id on query: %u != %u\n",
571 prog_ids[2], prog_id);
572 CHECK(info.netns.netns_ino == 0, "netns_ino",
573 "unexpected netns_ino: %u\n", info.netns.netns_ino);
575 err = bpf_link__detach(link[0]);
576 if (CHECK(err, "link_detach", "failed %d\n", err))
579 /* prog id is still there, but netns_ino is zeroed out */
580 prog_id = link_info_prog_id(link[0], &info);
581 CHECK(prog_ids[0] != prog_id, "bpf_prog_query",
582 "invalid program #0 id on query: %u != %u\n",
583 prog_ids[0], prog_id);
584 CHECK(info.netns.netns_ino != 0, "netns_ino",
585 "unexpected netns_ino: %u\n", info.netns.netns_ino);
589 bpf_link__destroy(link[2]);
591 bpf_link__destroy(link[1]);
593 bpf_link__destroy(link[0]);
598 static void run_lookup_prog(const struct test *t)
600 int server_fds[] = { [0 ... MAX_SERVERS - 1] = -1 };
601 int client_fd, reuse_conn_fd = -1;
602 struct bpf_link *lookup_link;
605 lookup_link = attach_lookup_prog(t->lookup_prog);
609 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
610 server_fds[i] = make_server(t->sotype, t->listen_at.ip,
613 if (server_fds[i] < 0)
616 err = update_lookup_map(t->sock_map, i, server_fds[i]);
620 /* want just one server for non-reuseport test */
621 if (!t->reuseport_prog)
625 /* Regular UDP socket lookup with reuseport behaves
626 * differently when reuseport group contains connected
627 * sockets. Check that adding a connected UDP socket to the
628 * reuseport group does not affect how reuseport works with
631 if (t->reuseport_has_conns) {
632 struct sockaddr_storage addr = {};
633 socklen_t len = sizeof(addr);
635 /* Add an extra socket to reuseport group */
636 reuse_conn_fd = make_server(t->sotype, t->listen_at.ip,
639 if (reuse_conn_fd < 0)
642 /* Connect the extra socket to itself */
643 err = getsockname(reuse_conn_fd, (void *)&addr, &len);
644 if (CHECK(err, "getsockname", "errno %d\n", errno))
646 err = connect(reuse_conn_fd, (void *)&addr, len);
647 if (CHECK(err, "connect", "errno %d\n", errno))
651 client_fd = make_client(t->sotype, t->connect_to.ip, t->connect_to.port);
655 if (t->sotype == SOCK_STREAM)
656 tcp_echo_test(client_fd, server_fds[t->accept_on]);
658 udp_echo_test(client_fd, server_fds[t->accept_on]);
662 if (reuse_conn_fd != -1)
663 close(reuse_conn_fd);
664 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
665 if (server_fds[i] != -1)
666 close(server_fds[i]);
668 bpf_link__destroy(lookup_link);
671 static void test_redirect_lookup(struct test_sk_lookup *skel)
673 const struct test tests[] = {
675 .desc = "TCP IPv4 redir port",
676 .lookup_prog = skel->progs.redir_port,
677 .sock_map = skel->maps.redir_map,
678 .sotype = SOCK_STREAM,
679 .connect_to = { EXT_IP4, EXT_PORT },
680 .listen_at = { EXT_IP4, INT_PORT },
683 .desc = "TCP IPv4 redir addr",
684 .lookup_prog = skel->progs.redir_ip4,
685 .sock_map = skel->maps.redir_map,
686 .sotype = SOCK_STREAM,
687 .connect_to = { EXT_IP4, EXT_PORT },
688 .listen_at = { INT_IP4, EXT_PORT },
691 .desc = "TCP IPv4 redir with reuseport",
692 .lookup_prog = skel->progs.select_sock_a,
693 .reuseport_prog = skel->progs.select_sock_b,
694 .sock_map = skel->maps.redir_map,
695 .sotype = SOCK_STREAM,
696 .connect_to = { EXT_IP4, EXT_PORT },
697 .listen_at = { INT_IP4, INT_PORT },
698 .accept_on = SERVER_B,
701 .desc = "TCP IPv4 redir skip reuseport",
702 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
703 .reuseport_prog = skel->progs.select_sock_b,
704 .sock_map = skel->maps.redir_map,
705 .sotype = SOCK_STREAM,
706 .connect_to = { EXT_IP4, EXT_PORT },
707 .listen_at = { INT_IP4, INT_PORT },
708 .accept_on = SERVER_A,
711 .desc = "TCP IPv6 redir port",
712 .lookup_prog = skel->progs.redir_port,
713 .sock_map = skel->maps.redir_map,
714 .sotype = SOCK_STREAM,
715 .connect_to = { EXT_IP6, EXT_PORT },
716 .listen_at = { EXT_IP6, INT_PORT },
719 .desc = "TCP IPv6 redir addr",
720 .lookup_prog = skel->progs.redir_ip6,
721 .sock_map = skel->maps.redir_map,
722 .sotype = SOCK_STREAM,
723 .connect_to = { EXT_IP6, EXT_PORT },
724 .listen_at = { INT_IP6, EXT_PORT },
727 .desc = "TCP IPv4->IPv6 redir port",
728 .lookup_prog = skel->progs.redir_port,
729 .sock_map = skel->maps.redir_map,
730 .sotype = SOCK_STREAM,
731 .connect_to = { EXT_IP4, EXT_PORT },
732 .listen_at = { INT_IP4_V6, INT_PORT },
735 .desc = "TCP IPv6 redir with reuseport",
736 .lookup_prog = skel->progs.select_sock_a,
737 .reuseport_prog = skel->progs.select_sock_b,
738 .sock_map = skel->maps.redir_map,
739 .sotype = SOCK_STREAM,
740 .connect_to = { EXT_IP6, EXT_PORT },
741 .listen_at = { INT_IP6, INT_PORT },
742 .accept_on = SERVER_B,
745 .desc = "TCP IPv6 redir skip reuseport",
746 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
747 .reuseport_prog = skel->progs.select_sock_b,
748 .sock_map = skel->maps.redir_map,
749 .sotype = SOCK_STREAM,
750 .connect_to = { EXT_IP6, EXT_PORT },
751 .listen_at = { INT_IP6, INT_PORT },
752 .accept_on = SERVER_A,
755 .desc = "UDP IPv4 redir port",
756 .lookup_prog = skel->progs.redir_port,
757 .sock_map = skel->maps.redir_map,
758 .sotype = SOCK_DGRAM,
759 .connect_to = { EXT_IP4, EXT_PORT },
760 .listen_at = { EXT_IP4, INT_PORT },
763 .desc = "UDP IPv4 redir addr",
764 .lookup_prog = skel->progs.redir_ip4,
765 .sock_map = skel->maps.redir_map,
766 .sotype = SOCK_DGRAM,
767 .connect_to = { EXT_IP4, EXT_PORT },
768 .listen_at = { INT_IP4, EXT_PORT },
771 .desc = "UDP IPv4 redir with reuseport",
772 .lookup_prog = skel->progs.select_sock_a,
773 .reuseport_prog = skel->progs.select_sock_b,
774 .sock_map = skel->maps.redir_map,
775 .sotype = SOCK_DGRAM,
776 .connect_to = { EXT_IP4, EXT_PORT },
777 .listen_at = { INT_IP4, INT_PORT },
778 .accept_on = SERVER_B,
781 .desc = "UDP IPv4 redir and reuseport with conns",
782 .lookup_prog = skel->progs.select_sock_a,
783 .reuseport_prog = skel->progs.select_sock_b,
784 .sock_map = skel->maps.redir_map,
785 .sotype = SOCK_DGRAM,
786 .connect_to = { EXT_IP4, EXT_PORT },
787 .listen_at = { INT_IP4, INT_PORT },
788 .accept_on = SERVER_B,
789 .reuseport_has_conns = true,
792 .desc = "UDP IPv4 redir skip reuseport",
793 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
794 .reuseport_prog = skel->progs.select_sock_b,
795 .sock_map = skel->maps.redir_map,
796 .sotype = SOCK_DGRAM,
797 .connect_to = { EXT_IP4, EXT_PORT },
798 .listen_at = { INT_IP4, INT_PORT },
799 .accept_on = SERVER_A,
802 .desc = "UDP IPv6 redir port",
803 .lookup_prog = skel->progs.redir_port,
804 .sock_map = skel->maps.redir_map,
805 .sotype = SOCK_DGRAM,
806 .connect_to = { EXT_IP6, EXT_PORT },
807 .listen_at = { EXT_IP6, INT_PORT },
810 .desc = "UDP IPv6 redir addr",
811 .lookup_prog = skel->progs.redir_ip6,
812 .sock_map = skel->maps.redir_map,
813 .sotype = SOCK_DGRAM,
814 .connect_to = { EXT_IP6, EXT_PORT },
815 .listen_at = { INT_IP6, EXT_PORT },
818 .desc = "UDP IPv4->IPv6 redir port",
819 .lookup_prog = skel->progs.redir_port,
820 .sock_map = skel->maps.redir_map,
821 .sotype = SOCK_DGRAM,
822 .listen_at = { INT_IP4_V6, INT_PORT },
823 .connect_to = { EXT_IP4, EXT_PORT },
826 .desc = "UDP IPv6 redir and reuseport",
827 .lookup_prog = skel->progs.select_sock_a,
828 .reuseport_prog = skel->progs.select_sock_b,
829 .sock_map = skel->maps.redir_map,
830 .sotype = SOCK_DGRAM,
831 .connect_to = { EXT_IP6, EXT_PORT },
832 .listen_at = { INT_IP6, INT_PORT },
833 .accept_on = SERVER_B,
836 .desc = "UDP IPv6 redir and reuseport with conns",
837 .lookup_prog = skel->progs.select_sock_a,
838 .reuseport_prog = skel->progs.select_sock_b,
839 .sock_map = skel->maps.redir_map,
840 .sotype = SOCK_DGRAM,
841 .connect_to = { EXT_IP6, EXT_PORT },
842 .listen_at = { INT_IP6, INT_PORT },
843 .accept_on = SERVER_B,
844 .reuseport_has_conns = true,
847 .desc = "UDP IPv6 redir skip reuseport",
848 .lookup_prog = skel->progs.select_sock_a_no_reuseport,
849 .reuseport_prog = skel->progs.select_sock_b,
850 .sock_map = skel->maps.redir_map,
851 .sotype = SOCK_DGRAM,
852 .connect_to = { EXT_IP6, EXT_PORT },
853 .listen_at = { INT_IP6, INT_PORT },
854 .accept_on = SERVER_A,
857 const struct test *t;
859 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
860 if (test__start_subtest(t->desc))
865 static void drop_on_lookup(const struct test *t)
867 struct sockaddr_storage dst = {};
868 int client_fd, server_fd, err;
869 struct bpf_link *lookup_link;
872 lookup_link = attach_lookup_prog(t->lookup_prog);
876 server_fd = make_server(t->sotype, t->listen_at.ip, t->listen_at.port,
881 client_fd = make_socket(t->sotype, t->connect_to.ip,
882 t->connect_to.port, &dst);
886 err = connect(client_fd, (void *)&dst, inetaddr_len(&dst));
887 if (t->sotype == SOCK_DGRAM) {
888 err = send_byte(client_fd);
892 /* Read out asynchronous error */
893 n = recv(client_fd, NULL, 0, 0);
896 if (CHECK(!err || errno != ECONNREFUSED, "connect",
897 "unexpected success or error\n"))
898 log_err("expected ECONNREFUSED on connect");
905 bpf_link__destroy(lookup_link);
908 static void test_drop_on_lookup(struct test_sk_lookup *skel)
910 const struct test tests[] = {
912 .desc = "TCP IPv4 drop on lookup",
913 .lookup_prog = skel->progs.lookup_drop,
914 .sotype = SOCK_STREAM,
915 .connect_to = { EXT_IP4, EXT_PORT },
916 .listen_at = { EXT_IP4, EXT_PORT },
919 .desc = "TCP IPv6 drop on lookup",
920 .lookup_prog = skel->progs.lookup_drop,
921 .sotype = SOCK_STREAM,
922 .connect_to = { EXT_IP6, EXT_PORT },
923 .listen_at = { EXT_IP6, EXT_PORT },
926 .desc = "UDP IPv4 drop on lookup",
927 .lookup_prog = skel->progs.lookup_drop,
928 .sotype = SOCK_DGRAM,
929 .connect_to = { EXT_IP4, EXT_PORT },
930 .listen_at = { EXT_IP4, EXT_PORT },
933 .desc = "UDP IPv6 drop on lookup",
934 .lookup_prog = skel->progs.lookup_drop,
935 .sotype = SOCK_DGRAM,
936 .connect_to = { EXT_IP6, EXT_PORT },
937 .listen_at = { EXT_IP6, INT_PORT },
939 /* The program will drop on success, meaning that the ifindex
943 .desc = "TCP IPv4 drop on valid ifindex",
944 .lookup_prog = skel->progs.check_ifindex,
945 .sotype = SOCK_STREAM,
946 .connect_to = { EXT_IP4, EXT_PORT },
947 .listen_at = { EXT_IP4, EXT_PORT },
950 .desc = "TCP IPv6 drop on valid ifindex",
951 .lookup_prog = skel->progs.check_ifindex,
952 .sotype = SOCK_STREAM,
953 .connect_to = { EXT_IP6, EXT_PORT },
954 .listen_at = { EXT_IP6, EXT_PORT },
957 .desc = "UDP IPv4 drop on valid ifindex",
958 .lookup_prog = skel->progs.check_ifindex,
959 .sotype = SOCK_DGRAM,
960 .connect_to = { EXT_IP4, EXT_PORT },
961 .listen_at = { EXT_IP4, EXT_PORT },
964 .desc = "UDP IPv6 drop on valid ifindex",
965 .lookup_prog = skel->progs.check_ifindex,
966 .sotype = SOCK_DGRAM,
967 .connect_to = { EXT_IP6, EXT_PORT },
968 .listen_at = { EXT_IP6, EXT_PORT },
971 const struct test *t;
973 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
974 if (test__start_subtest(t->desc))
979 static void drop_on_reuseport(const struct test *t)
981 struct sockaddr_storage dst = { 0 };
982 int client, server1, server2, err;
983 struct bpf_link *lookup_link;
986 lookup_link = attach_lookup_prog(t->lookup_prog);
990 server1 = make_server(t->sotype, t->listen_at.ip, t->listen_at.port,
995 err = update_lookup_map(t->sock_map, SERVER_A, server1);
999 /* second server on destination address we should never reach */
1000 server2 = make_server(t->sotype, t->connect_to.ip, t->connect_to.port,
1001 NULL /* reuseport prog */);
1005 client = make_socket(t->sotype, t->connect_to.ip,
1006 t->connect_to.port, &dst);
1010 err = connect(client, (void *)&dst, inetaddr_len(&dst));
1011 if (t->sotype == SOCK_DGRAM) {
1012 err = send_byte(client);
1016 /* Read out asynchronous error */
1017 n = recv(client, NULL, 0, 0);
1020 if (CHECK(!err || errno != ECONNREFUSED, "connect",
1021 "unexpected success or error\n"))
1022 log_err("expected ECONNREFUSED on connect");
1031 bpf_link__destroy(lookup_link);
1034 static void test_drop_on_reuseport(struct test_sk_lookup *skel)
1036 const struct test tests[] = {
1038 .desc = "TCP IPv4 drop on reuseport",
1039 .lookup_prog = skel->progs.select_sock_a,
1040 .reuseport_prog = skel->progs.reuseport_drop,
1041 .sock_map = skel->maps.redir_map,
1042 .sotype = SOCK_STREAM,
1043 .connect_to = { EXT_IP4, EXT_PORT },
1044 .listen_at = { INT_IP4, INT_PORT },
1047 .desc = "TCP IPv6 drop on reuseport",
1048 .lookup_prog = skel->progs.select_sock_a,
1049 .reuseport_prog = skel->progs.reuseport_drop,
1050 .sock_map = skel->maps.redir_map,
1051 .sotype = SOCK_STREAM,
1052 .connect_to = { EXT_IP6, EXT_PORT },
1053 .listen_at = { INT_IP6, INT_PORT },
1056 .desc = "UDP IPv4 drop on reuseport",
1057 .lookup_prog = skel->progs.select_sock_a,
1058 .reuseport_prog = skel->progs.reuseport_drop,
1059 .sock_map = skel->maps.redir_map,
1060 .sotype = SOCK_DGRAM,
1061 .connect_to = { EXT_IP4, EXT_PORT },
1062 .listen_at = { INT_IP4, INT_PORT },
1065 .desc = "TCP IPv6 drop on reuseport",
1066 .lookup_prog = skel->progs.select_sock_a,
1067 .reuseport_prog = skel->progs.reuseport_drop,
1068 .sock_map = skel->maps.redir_map,
1069 .sotype = SOCK_STREAM,
1070 .connect_to = { EXT_IP6, EXT_PORT },
1071 .listen_at = { INT_IP6, INT_PORT },
1074 const struct test *t;
1076 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
1077 if (test__start_subtest(t->desc))
1078 drop_on_reuseport(t);
1082 static void run_sk_assign(struct test_sk_lookup *skel,
1083 struct bpf_program *lookup_prog,
1084 const char *remote_ip, const char *local_ip)
1086 int server_fds[] = { [0 ... MAX_SERVERS - 1] = -1 };
1087 struct bpf_sk_lookup ctx;
1088 __u64 server_cookie;
1091 DECLARE_LIBBPF_OPTS(bpf_test_run_opts, opts,
1093 .ctx_size_in = sizeof(ctx),
1095 .ctx_size_out = sizeof(ctx),
1098 if (fill_sk_lookup_ctx(&ctx, local_ip, EXT_PORT, remote_ip, INT_PORT))
1101 ctx.protocol = IPPROTO_TCP;
1103 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
1104 server_fds[i] = make_server(SOCK_STREAM, local_ip, 0, NULL);
1105 if (server_fds[i] < 0)
1108 err = update_lookup_map(skel->maps.redir_map, i,
1114 server_cookie = socket_cookie(server_fds[SERVER_B]);
1118 err = bpf_prog_test_run_opts(bpf_program__fd(lookup_prog), &opts);
1119 if (CHECK(err, "test_run", "failed with error %d\n", errno))
1122 if (CHECK(ctx.cookie == 0, "ctx.cookie", "no socket selected\n"))
1125 CHECK(ctx.cookie != server_cookie, "ctx.cookie",
1126 "selected sk %llu instead of %llu\n", ctx.cookie, server_cookie);
1129 for (i = 0; i < ARRAY_SIZE(server_fds); i++) {
1130 if (server_fds[i] != -1)
1131 close(server_fds[i]);
1135 static void run_sk_assign_v4(struct test_sk_lookup *skel,
1136 struct bpf_program *lookup_prog)
1138 run_sk_assign(skel, lookup_prog, INT_IP4, EXT_IP4);
1141 static void run_sk_assign_v6(struct test_sk_lookup *skel,
1142 struct bpf_program *lookup_prog)
1144 run_sk_assign(skel, lookup_prog, INT_IP6, EXT_IP6);
1147 static void run_sk_assign_connected(struct test_sk_lookup *skel,
1150 int err, client_fd, connected_fd, server_fd;
1151 struct bpf_link *lookup_link;
1153 server_fd = make_server(sotype, EXT_IP4, EXT_PORT, NULL);
1157 connected_fd = make_client(sotype, EXT_IP4, EXT_PORT);
1158 if (connected_fd < 0)
1159 goto out_close_server;
1161 /* Put a connected socket in redirect map */
1162 err = update_lookup_map(skel->maps.redir_map, SERVER_A, connected_fd);
1164 goto out_close_connected;
1166 lookup_link = attach_lookup_prog(skel->progs.sk_assign_esocknosupport);
1168 goto out_close_connected;
1170 /* Try to redirect TCP SYN / UDP packet to a connected socket */
1171 client_fd = make_client(sotype, EXT_IP4, EXT_PORT);
1173 goto out_unlink_prog;
1174 if (sotype == SOCK_DGRAM) {
1175 send_byte(client_fd);
1176 recv_byte(server_fd);
1181 bpf_link__destroy(lookup_link);
1182 out_close_connected:
1183 close(connected_fd);
1188 static void test_sk_assign_helper(struct test_sk_lookup *skel)
1190 if (test__start_subtest("sk_assign returns EEXIST"))
1191 run_sk_assign_v4(skel, skel->progs.sk_assign_eexist);
1192 if (test__start_subtest("sk_assign honors F_REPLACE"))
1193 run_sk_assign_v4(skel, skel->progs.sk_assign_replace_flag);
1194 if (test__start_subtest("sk_assign accepts NULL socket"))
1195 run_sk_assign_v4(skel, skel->progs.sk_assign_null);
1196 if (test__start_subtest("access ctx->sk"))
1197 run_sk_assign_v4(skel, skel->progs.access_ctx_sk);
1198 if (test__start_subtest("narrow access to ctx v4"))
1199 run_sk_assign_v4(skel, skel->progs.ctx_narrow_access);
1200 if (test__start_subtest("narrow access to ctx v6"))
1201 run_sk_assign_v6(skel, skel->progs.ctx_narrow_access);
1202 if (test__start_subtest("sk_assign rejects TCP established"))
1203 run_sk_assign_connected(skel, SOCK_STREAM);
1204 if (test__start_subtest("sk_assign rejects UDP connected"))
1205 run_sk_assign_connected(skel, SOCK_DGRAM);
1208 struct test_multi_prog {
1210 struct bpf_program *prog1;
1211 struct bpf_program *prog2;
1212 struct bpf_map *redir_map;
1213 struct bpf_map *run_map;
1215 struct inet_addr listen_at;
1218 static void run_multi_prog_lookup(const struct test_multi_prog *t)
1220 struct sockaddr_storage dst = {};
1221 int map_fd, server_fd, client_fd;
1222 struct bpf_link *link1, *link2;
1223 int prog_idx, done, err;
1225 map_fd = bpf_map__fd(t->run_map);
1229 err = bpf_map_update_elem(map_fd, &prog_idx, &done, BPF_ANY);
1230 if (CHECK(err, "bpf_map_update_elem", "failed\n"))
1233 err = bpf_map_update_elem(map_fd, &prog_idx, &done, BPF_ANY);
1234 if (CHECK(err, "bpf_map_update_elem", "failed\n"))
1237 link1 = attach_lookup_prog(t->prog1);
1240 link2 = attach_lookup_prog(t->prog2);
1244 server_fd = make_server(SOCK_STREAM, t->listen_at.ip,
1245 t->listen_at.port, NULL);
1249 err = update_lookup_map(t->redir_map, SERVER_A, server_fd);
1251 goto out_close_server;
1253 client_fd = make_socket(SOCK_STREAM, EXT_IP4, EXT_PORT, &dst);
1255 goto out_close_server;
1257 err = connect(client_fd, (void *)&dst, inetaddr_len(&dst));
1258 if (CHECK(err && !t->expect_errno, "connect",
1259 "unexpected error %d\n", errno))
1260 goto out_close_client;
1261 if (CHECK(err && t->expect_errno && errno != t->expect_errno,
1262 "connect", "unexpected error %d\n", errno))
1263 goto out_close_client;
1267 err = bpf_map_lookup_elem(map_fd, &prog_idx, &done);
1268 CHECK(err, "bpf_map_lookup_elem", "failed\n");
1269 CHECK(!done, "bpf_map_lookup_elem", "PROG1 !done\n");
1273 err = bpf_map_lookup_elem(map_fd, &prog_idx, &done);
1274 CHECK(err, "bpf_map_lookup_elem", "failed\n");
1275 CHECK(!done, "bpf_map_lookup_elem", "PROG2 !done\n");
1282 bpf_link__destroy(link2);
1284 bpf_link__destroy(link1);
1287 static void test_multi_prog_lookup(struct test_sk_lookup *skel)
1289 struct test_multi_prog tests[] = {
1291 .desc = "multi prog - pass, pass",
1292 .prog1 = skel->progs.multi_prog_pass1,
1293 .prog2 = skel->progs.multi_prog_pass2,
1294 .listen_at = { EXT_IP4, EXT_PORT },
1297 .desc = "multi prog - drop, drop",
1298 .prog1 = skel->progs.multi_prog_drop1,
1299 .prog2 = skel->progs.multi_prog_drop2,
1300 .listen_at = { EXT_IP4, EXT_PORT },
1301 .expect_errno = ECONNREFUSED,
1304 .desc = "multi prog - pass, drop",
1305 .prog1 = skel->progs.multi_prog_pass1,
1306 .prog2 = skel->progs.multi_prog_drop2,
1307 .listen_at = { EXT_IP4, EXT_PORT },
1308 .expect_errno = ECONNREFUSED,
1311 .desc = "multi prog - drop, pass",
1312 .prog1 = skel->progs.multi_prog_drop1,
1313 .prog2 = skel->progs.multi_prog_pass2,
1314 .listen_at = { EXT_IP4, EXT_PORT },
1315 .expect_errno = ECONNREFUSED,
1318 .desc = "multi prog - pass, redir",
1319 .prog1 = skel->progs.multi_prog_pass1,
1320 .prog2 = skel->progs.multi_prog_redir2,
1321 .listen_at = { INT_IP4, INT_PORT },
1324 .desc = "multi prog - redir, pass",
1325 .prog1 = skel->progs.multi_prog_redir1,
1326 .prog2 = skel->progs.multi_prog_pass2,
1327 .listen_at = { INT_IP4, INT_PORT },
1330 .desc = "multi prog - drop, redir",
1331 .prog1 = skel->progs.multi_prog_drop1,
1332 .prog2 = skel->progs.multi_prog_redir2,
1333 .listen_at = { INT_IP4, INT_PORT },
1336 .desc = "multi prog - redir, drop",
1337 .prog1 = skel->progs.multi_prog_redir1,
1338 .prog2 = skel->progs.multi_prog_drop2,
1339 .listen_at = { INT_IP4, INT_PORT },
1342 .desc = "multi prog - redir, redir",
1343 .prog1 = skel->progs.multi_prog_redir1,
1344 .prog2 = skel->progs.multi_prog_redir2,
1345 .listen_at = { INT_IP4, INT_PORT },
1348 struct test_multi_prog *t;
1350 for (t = tests; t < tests + ARRAY_SIZE(tests); t++) {
1351 t->redir_map = skel->maps.redir_map;
1352 t->run_map = skel->maps.run_map;
1353 if (test__start_subtest(t->desc))
1354 run_multi_prog_lookup(t);
/*
 * Run every test group against the loaded skeleton. The query test is a
 * single subtest; the remaining groups register their own subtests.
 */
static void run_tests(struct test_sk_lookup *skel)
{
	if (test__start_subtest("query lookup prog")) {
		query_lookup_prog(skel);
	}

	test_redirect_lookup(skel);
	test_drop_on_lookup(skel);
	test_drop_on_reuseport(skel);
	test_sk_assign_helper(skel);
	test_multi_prog_lookup(skel);
}
1369 static int switch_netns(void)
1371 static const char * const setup_script[] = {
1372 "ip -6 addr add dev lo " EXT_IP6 "/128",
1373 "ip -6 addr add dev lo " INT_IP6 "/128",
1374 "ip link set dev lo up",
1377 const char * const *cmd;
1380 err = unshare(CLONE_NEWNET);
1381 if (CHECK(err, "unshare", "failed\n")) {
1382 log_err("unshare(CLONE_NEWNET)");
1386 for (cmd = setup_script; *cmd; cmd++) {
1388 if (CHECK(err, "system", "failed\n")) {
1389 log_err("system(%s)", *cmd);
/*
 * Test entry point: switch to a dedicated network namespace, load the BPF
 * skeleton, run all test groups and release the skeleton.
 */
void test_sk_lookup(void)
{
	struct test_sk_lookup *skel;

	if (switch_netns())
		return;

	skel = test_sk_lookup__open_and_load();
	if (CHECK(!skel, "skel open_and_load", "failed\n"))
		return;

	run_tests(skel);

	test_sk_lookup__destroy(skel);
}