reuseport_dualstack.c 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209
/*
 * It is possible to use SO_REUSEPORT to open multiple sockets bound to
 * equivalent local addresses using AF_INET and AF_INET6 at the same time. If
 * the AF_INET6 socket has IPV6_V6ONLY set, it's clear which socket should
 * receive a given incoming packet. However, when it is not set, incoming v4
 * packets should prefer the AF_INET socket(s). This behavior was defined with
 * the original SO_REUSEPORT implementation, but broke with commit
 * e32ea7e74727 ("soreuseport: fast reuseport UDP socket selection").
 * This test creates these mixed AF_INET/AF_INET6 sockets and asserts the
 * AF_INET preference for v4 packets.
 */
  12. #define _GNU_SOURCE
  13. #include <arpa/inet.h>
  14. #include <errno.h>
  15. #include <error.h>
  16. #include <linux/in.h>
  17. #include <linux/unistd.h>
  18. #include <stdio.h>
  19. #include <stdlib.h>
  20. #include <string.h>
  21. #include <sys/epoll.h>
  22. #include <sys/types.h>
  23. #include <sys/socket.h>
  24. #include <unistd.h>
/* Port (host byte order) that the receive sockets bind to and the sender targets. */
static const int PORT = 8888;
  26. static void build_rcv_fd(int family, int proto, int *rcv_fds, int count)
  27. {
  28. struct sockaddr_storage addr;
  29. struct sockaddr_in *addr4;
  30. struct sockaddr_in6 *addr6;
  31. int opt, i;
  32. switch (family) {
  33. case AF_INET:
  34. addr4 = (struct sockaddr_in *)&addr;
  35. addr4->sin_family = AF_INET;
  36. addr4->sin_addr.s_addr = htonl(INADDR_ANY);
  37. addr4->sin_port = htons(PORT);
  38. break;
  39. case AF_INET6:
  40. addr6 = (struct sockaddr_in6 *)&addr;
  41. addr6->sin6_family = AF_INET6;
  42. addr6->sin6_addr = in6addr_any;
  43. addr6->sin6_port = htons(PORT);
  44. break;
  45. default:
  46. error(1, 0, "Unsupported family %d", family);
  47. }
  48. for (i = 0; i < count; ++i) {
  49. rcv_fds[i] = socket(family, proto, 0);
  50. if (rcv_fds[i] < 0)
  51. error(1, errno, "failed to create receive socket");
  52. opt = 1;
  53. if (setsockopt(rcv_fds[i], SOL_SOCKET, SO_REUSEPORT, &opt,
  54. sizeof(opt)))
  55. error(1, errno, "failed to set SO_REUSEPORT");
  56. if (bind(rcv_fds[i], (struct sockaddr *)&addr, sizeof(addr)))
  57. error(1, errno, "failed to bind receive socket");
  58. if (proto == SOCK_STREAM && listen(rcv_fds[i], 10))
  59. error(1, errno, "failed to listen on receive port");
  60. }
  61. }
  62. static void send_from_v4(int proto)
  63. {
  64. struct sockaddr_in saddr, daddr;
  65. int fd;
  66. saddr.sin_family = AF_INET;
  67. saddr.sin_addr.s_addr = htonl(INADDR_ANY);
  68. saddr.sin_port = 0;
  69. daddr.sin_family = AF_INET;
  70. daddr.sin_addr.s_addr = htonl(INADDR_LOOPBACK);
  71. daddr.sin_port = htons(PORT);
  72. fd = socket(AF_INET, proto, 0);
  73. if (fd < 0)
  74. error(1, errno, "failed to create send socket");
  75. if (bind(fd, (struct sockaddr *)&saddr, sizeof(saddr)))
  76. error(1, errno, "failed to bind send socket");
  77. if (connect(fd, (struct sockaddr *)&daddr, sizeof(daddr)))
  78. error(1, errno, "failed to connect send socket");
  79. if (send(fd, "a", 1, 0) < 0)
  80. error(1, errno, "failed to send message");
  81. close(fd);
  82. }
  83. static int receive_once(int epfd, int proto)
  84. {
  85. struct epoll_event ev;
  86. int i, fd;
  87. char buf[8];
  88. i = epoll_wait(epfd, &ev, 1, -1);
  89. if (i < 0)
  90. error(1, errno, "epoll_wait failed");
  91. if (proto == SOCK_STREAM) {
  92. fd = accept(ev.data.fd, NULL, NULL);
  93. if (fd < 0)
  94. error(1, errno, "failed to accept");
  95. i = recv(fd, buf, sizeof(buf), 0);
  96. close(fd);
  97. } else {
  98. i = recv(ev.data.fd, buf, sizeof(buf), 0);
  99. }
  100. if (i < 0)
  101. error(1, errno, "failed to recv");
  102. return ev.data.fd;
  103. }
  104. static void test(int *rcv_fds, int count, int proto)
  105. {
  106. struct epoll_event ev;
  107. int epfd, i, test_fd;
  108. uint16_t test_family;
  109. socklen_t len;
  110. epfd = epoll_create(1);
  111. if (epfd < 0)
  112. error(1, errno, "failed to create epoll");
  113. ev.events = EPOLLIN;
  114. for (i = 0; i < count; ++i) {
  115. ev.data.fd = rcv_fds[i];
  116. if (epoll_ctl(epfd, EPOLL_CTL_ADD, rcv_fds[i], &ev))
  117. error(1, errno, "failed to register sock epoll");
  118. }
  119. send_from_v4(proto);
  120. test_fd = receive_once(epfd, proto);
  121. if (getsockopt(test_fd, SOL_SOCKET, SO_DOMAIN, &test_family, &len))
  122. error(1, errno, "failed to read socket domain");
  123. if (test_family != AF_INET)
  124. error(1, 0, "expected to receive on v4 socket but got v6 (%d)",
  125. test_family);
  126. close(epfd);
  127. }
  128. int main(void)
  129. {
  130. int rcv_fds[32], i;
  131. fprintf(stderr, "---- UDP IPv4 created before IPv6 ----\n");
  132. build_rcv_fd(AF_INET, SOCK_DGRAM, rcv_fds, 5);
  133. build_rcv_fd(AF_INET6, SOCK_DGRAM, &(rcv_fds[5]), 5);
  134. test(rcv_fds, 10, SOCK_DGRAM);
  135. for (i = 0; i < 10; ++i)
  136. close(rcv_fds[i]);
  137. fprintf(stderr, "---- UDP IPv6 created before IPv4 ----\n");
  138. build_rcv_fd(AF_INET6, SOCK_DGRAM, rcv_fds, 5);
  139. build_rcv_fd(AF_INET, SOCK_DGRAM, &(rcv_fds[5]), 5);
  140. test(rcv_fds, 10, SOCK_DGRAM);
  141. for (i = 0; i < 10; ++i)
  142. close(rcv_fds[i]);
  143. /* NOTE: UDP socket lookups traverse a different code path when there
  144. * are > 10 sockets in a group.
  145. */
  146. fprintf(stderr, "---- UDP IPv4 created before IPv6 (large) ----\n");
  147. build_rcv_fd(AF_INET, SOCK_DGRAM, rcv_fds, 16);
  148. build_rcv_fd(AF_INET6, SOCK_DGRAM, &(rcv_fds[16]), 16);
  149. test(rcv_fds, 32, SOCK_DGRAM);
  150. for (i = 0; i < 32; ++i)
  151. close(rcv_fds[i]);
  152. fprintf(stderr, "---- UDP IPv6 created before IPv4 (large) ----\n");
  153. build_rcv_fd(AF_INET6, SOCK_DGRAM, rcv_fds, 16);
  154. build_rcv_fd(AF_INET, SOCK_DGRAM, &(rcv_fds[16]), 16);
  155. test(rcv_fds, 32, SOCK_DGRAM);
  156. for (i = 0; i < 32; ++i)
  157. close(rcv_fds[i]);
  158. fprintf(stderr, "---- TCP IPv4 created before IPv6 ----\n");
  159. build_rcv_fd(AF_INET, SOCK_STREAM, rcv_fds, 5);
  160. build_rcv_fd(AF_INET6, SOCK_STREAM, &(rcv_fds[5]), 5);
  161. test(rcv_fds, 10, SOCK_STREAM);
  162. for (i = 0; i < 10; ++i)
  163. close(rcv_fds[i]);
  164. fprintf(stderr, "---- TCP IPv6 created before IPv4 ----\n");
  165. build_rcv_fd(AF_INET6, SOCK_STREAM, rcv_fds, 5);
  166. build_rcv_fd(AF_INET, SOCK_STREAM, &(rcv_fds[5]), 5);
  167. test(rcv_fds, 10, SOCK_STREAM);
  168. for (i = 0; i < 10; ++i)
  169. close(rcv_fds[i]);
  170. fprintf(stderr, "SUCCESS\n");
  171. return 0;
  172. }