rst.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * The test checks that both active and passive reset have correct TCP-AO
  4. * signature. An "active" reset (abort) here is procured from closing
  5. * listen() socket with non-accepted connections in the queue:
  6. * inet_csk_listen_stop() => inet_child_forget() =>
  7. * => tcp_disconnect() => tcp_send_active_reset()
  8. *
  9. * The passive reset is quite hard to get on established TCP connections.
  10. * It could be procured from non-established states, but the synchronization
  11. * part from userspace in order to reliably get RST seems uneasy.
  12. * So, instead it's procured by corrupting SEQ number on TIMED-WAIT state.
  13. *
  14. * It's important to test both passive and active RST as they go through
  15. * different code-paths:
  16. * - tcp_send_active_reset() makes no-data skb, sends it with tcp_transmit_skb()
  17. * - tcp_v*_send_reset() create their reply skbs and send them with
  18. * ip_send_unicast_reply()
  19. *
  20. * In both cases TCP-AO signatures have to be correct, which is verified by
  21. * (1) checking that the TCP-AO connection was reset and (2) TCP-AO counters.
  22. *
  23. * Author: Dmitry Safonov <dima@arista.com>
  24. */
  25. #include <inttypes.h>
  26. #include "../../../../include/linux/kernel.h"
  27. #include "aolib.h"
  28. const size_t quota = 1000;
  29. const size_t packet_sz = 100;
  30. /*
  31. * Backlog == 0 means 1 connection in queue, see:
  32. * commit 64a146513f8f ("[NET]: Revert incorrect accept queue...")
  33. */
  34. const unsigned int backlog;
  35. static void netstats_check(struct netstat *before, struct netstat *after,
  36. char *msg)
  37. {
  38. uint64_t before_cnt, after_cnt;
  39. before_cnt = netstat_get(before, "TCPAORequired", NULL);
  40. after_cnt = netstat_get(after, "TCPAORequired", NULL);
  41. if (after_cnt > before_cnt)
  42. test_fail("Segments without AO sign (%s): %" PRIu64 " => %" PRIu64,
  43. msg, before_cnt, after_cnt);
  44. else
  45. test_ok("No segments without AO sign (%s)", msg);
  46. before_cnt = netstat_get(before, "TCPAOGood", NULL);
  47. after_cnt = netstat_get(after, "TCPAOGood", NULL);
  48. if (after_cnt <= before_cnt)
  49. test_fail("Signed AO segments (%s): %" PRIu64 " => %" PRIu64,
  50. msg, before_cnt, after_cnt);
  51. else
  52. test_ok("Signed AO segments (%s): %" PRIu64 " => %" PRIu64,
  53. msg, before_cnt, after_cnt);
  54. before_cnt = netstat_get(before, "TCPAOBad", NULL);
  55. after_cnt = netstat_get(after, "TCPAOBad", NULL);
  56. if (after_cnt > before_cnt)
  57. test_fail("Segments with bad AO sign (%s): %" PRIu64 " => %" PRIu64,
  58. msg, before_cnt, after_cnt);
  59. else
  60. test_ok("No segments with bad AO sign (%s)", msg);
  61. }
  62. /*
  63. * Another way to send RST, but not through tcp_v{4,6}_send_reset()
  64. * is tcp_send_active_reset(), that is not in reply to inbound segment,
  65. * but rather active send. It uses tcp_transmit_skb(), so that should
  66. * work, but as it also sends RST - nice that it can be covered as well.
  67. */
  68. static void close_forced(int sk)
  69. {
  70. struct linger sl;
  71. sl.l_onoff = 1;
  72. sl.l_linger = 0;
  73. if (setsockopt(sk, SOL_SOCKET, SO_LINGER, &sl, sizeof(sl)))
  74. test_error("setsockopt(SO_LINGER)");
  75. close(sk);
  76. }
  77. static void test_server_active_rst(unsigned int port)
  78. {
  79. struct tcp_counters cnt1, cnt2;
  80. ssize_t bytes;
  81. int sk, lsk;
  82. lsk = test_listen_socket(this_ip_addr, port, backlog);
  83. if (test_add_key(lsk, DEFAULT_TEST_PASSWORD, this_ip_dest, -1, 100, 100))
  84. test_error("setsockopt(TCP_AO_ADD_KEY)");
  85. if (test_get_tcp_counters(lsk, &cnt1))
  86. test_error("test_get_tcp_counters()");
  87. synchronize_threads(); /* 1: MKT added */
  88. if (test_wait_fd(lsk, TEST_TIMEOUT_SEC, 0))
  89. test_error("test_wait_fd()");
  90. sk = accept(lsk, NULL, NULL);
  91. if (sk < 0)
  92. test_error("accept()");
  93. synchronize_threads(); /* 2: connection accept()ed, another queued */
  94. if (test_get_tcp_counters(lsk, &cnt2))
  95. test_error("test_get_tcp_counters()");
  96. synchronize_threads(); /* 3: close listen socket */
  97. close(lsk);
  98. bytes = test_server_run(sk, quota, 0);
  99. if (bytes != quota)
  100. test_error("servered only %zd bytes", bytes);
  101. else
  102. test_ok("servered %zd bytes", bytes);
  103. synchronize_threads(); /* 4: finishing up */
  104. close_forced(sk);
  105. synchronize_threads(); /* 5: closed active sk */
  106. synchronize_threads(); /* 6: counters checks */
  107. if (test_assert_counters("active RST server", &cnt1, &cnt2, TEST_CNT_GOOD))
  108. test_fail("MKT counters (server) have not only good packets");
  109. else
  110. test_ok("MKT counters are good on server");
  111. }
  112. static void test_server_passive_rst(unsigned int port)
  113. {
  114. struct tcp_counters cnt1, cnt2;
  115. int sk, lsk;
  116. ssize_t bytes;
  117. lsk = test_listen_socket(this_ip_addr, port, 1);
  118. if (test_add_key(lsk, DEFAULT_TEST_PASSWORD, this_ip_dest, -1, 100, 100))
  119. test_error("setsockopt(TCP_AO_ADD_KEY)");
  120. synchronize_threads(); /* 1: MKT added => connect() */
  121. if (test_wait_fd(lsk, TEST_TIMEOUT_SEC, 0))
  122. test_error("test_wait_fd()");
  123. sk = accept(lsk, NULL, NULL);
  124. if (sk < 0)
  125. test_error("accept()");
  126. synchronize_threads(); /* 2: accepted => send data */
  127. close(lsk);
  128. if (test_get_tcp_counters(sk, &cnt1))
  129. test_error("test_get_tcp_counters()");
  130. bytes = test_server_run(sk, quota, TEST_TIMEOUT_SEC);
  131. if (bytes != quota) {
  132. if (bytes > 0)
  133. test_fail("server served: %zd", bytes);
  134. else
  135. test_fail("server returned %zd", bytes);
  136. }
  137. synchronize_threads(); /* 3: checkpoint the client */
  138. synchronize_threads(); /* 4: close the server, creating twsk */
  139. if (test_get_tcp_counters(sk, &cnt2))
  140. test_error("test_get_tcp_counters()");
  141. close(sk);
  142. synchronize_threads(); /* 5: restore the socket, send more data */
  143. test_assert_counters("passive RST server", &cnt1, &cnt2, TEST_CNT_GOOD);
  144. synchronize_threads(); /* 6: server exits */
  145. }
  146. static void *server_fn(void *arg)
  147. {
  148. struct netstat *ns_before, *ns_after;
  149. unsigned int port = test_server_port;
  150. ns_before = netstat_read();
  151. test_server_active_rst(port++);
  152. test_server_passive_rst(port++);
  153. ns_after = netstat_read();
  154. netstats_check(ns_before, ns_after, "server");
  155. netstat_free(ns_after);
  156. netstat_free(ns_before);
  157. synchronize_threads(); /* exit */
  158. synchronize_threads(); /* don't race to exit() - client exits */
  159. return NULL;
  160. }
  161. static int test_wait_fds(int sk[], size_t nr, bool is_writable[],
  162. ssize_t wait_for, time_t sec)
  163. {
  164. struct timeval tv = { .tv_sec = sec };
  165. struct timeval *ptv = NULL;
  166. fd_set left;
  167. size_t i;
  168. int ret;
  169. FD_ZERO(&left);
  170. for (i = 0; i < nr; i++) {
  171. FD_SET(sk[i], &left);
  172. if (is_writable)
  173. is_writable[i] = false;
  174. }
  175. if (sec)
  176. ptv = &tv;
  177. do {
  178. bool is_empty = true;
  179. fd_set fds, efds;
  180. int nfd = 0;
  181. FD_ZERO(&fds);
  182. FD_ZERO(&efds);
  183. for (i = 0; i < nr; i++) {
  184. if (!FD_ISSET(sk[i], &left))
  185. continue;
  186. if (sk[i] > nfd)
  187. nfd = sk[i];
  188. FD_SET(sk[i], &fds);
  189. FD_SET(sk[i], &efds);
  190. is_empty = false;
  191. }
  192. if (is_empty)
  193. return -ENOENT;
  194. errno = 0;
  195. ret = select(nfd + 1, NULL, &fds, &efds, ptv);
  196. if (ret < 0)
  197. return -errno;
  198. if (!ret)
  199. return -ETIMEDOUT;
  200. for (i = 0; i < nr; i++) {
  201. if (FD_ISSET(sk[i], &fds)) {
  202. if (is_writable)
  203. is_writable[i] = true;
  204. FD_CLR(sk[i], &left);
  205. wait_for--;
  206. continue;
  207. }
  208. if (FD_ISSET(sk[i], &efds)) {
  209. FD_CLR(sk[i], &left);
  210. wait_for--;
  211. }
  212. }
  213. } while (wait_for > 0);
  214. return 0;
  215. }
  216. static void test_client_active_rst(unsigned int port)
  217. {
  218. int i, sk[3], err;
  219. bool is_writable[ARRAY_SIZE(sk)] = {false};
  220. unsigned int last = ARRAY_SIZE(sk) - 1;
  221. for (i = 0; i < ARRAY_SIZE(sk); i++) {
  222. sk[i] = socket(test_family, SOCK_STREAM, IPPROTO_TCP);
  223. if (sk[i] < 0)
  224. test_error("socket()");
  225. if (test_add_key(sk[i], DEFAULT_TEST_PASSWORD,
  226. this_ip_dest, -1, 100, 100))
  227. test_error("setsockopt(TCP_AO_ADD_KEY)");
  228. }
  229. synchronize_threads(); /* 1: MKT added */
  230. for (i = 0; i < last; i++) {
  231. err = _test_connect_socket(sk[i], this_ip_dest, port, i != 0);
  232. if (err < 0)
  233. test_error("failed to connect()");
  234. }
  235. synchronize_threads(); /* 2: two connections: one accept()ed, another queued */
  236. err = test_wait_fds(sk, last, is_writable, last, TEST_TIMEOUT_SEC);
  237. if (err < 0)
  238. test_error("test_wait_fds(): %d", err);
  239. /* async connect() with third sk to get into request_sock_queue */
  240. err = _test_connect_socket(sk[last], this_ip_dest, port, 1);
  241. if (err < 0)
  242. test_error("failed to connect()");
  243. synchronize_threads(); /* 3: close listen socket */
  244. if (test_client_verify(sk[0], packet_sz, quota / packet_sz))
  245. test_fail("Failed to send data on connected socket");
  246. else
  247. test_ok("Verified established tcp connection");
  248. synchronize_threads(); /* 4: finishing up */
  249. synchronize_threads(); /* 5: closed active sk */
  250. /*
  251. * Wait for 2 connections: one accepted, another in the accept queue,
  252. * the one in request_sock_queue won't get fully established, so
  253. * doesn't receive an active RST, see inet_csk_listen_stop().
  254. */
  255. err = test_wait_fds(sk, last, NULL, last, TEST_TIMEOUT_SEC);
  256. if (err < 0)
  257. test_error("select(): %d", err);
  258. for (i = 0; i < ARRAY_SIZE(sk); i++) {
  259. socklen_t slen = sizeof(err);
  260. if (getsockopt(sk[i], SOL_SOCKET, SO_ERROR, &err, &slen))
  261. test_error("getsockopt()");
  262. if (is_writable[i] && err != ECONNRESET) {
  263. test_fail("sk[%d] = %d, err = %d, connection wasn't reset",
  264. i, sk[i], err);
  265. } else {
  266. test_ok("sk[%d] = %d%s", i, sk[i],
  267. is_writable[i] ? ", connection was reset" : "");
  268. }
  269. }
  270. synchronize_threads(); /* 6: counters checks */
  271. }
  272. static void test_client_passive_rst(unsigned int port)
  273. {
  274. struct tcp_counters cnt1, cnt2;
  275. struct tcp_ao_repair ao_img;
  276. struct tcp_sock_state img;
  277. sockaddr_af saddr;
  278. int sk, err;
  279. sk = socket(test_family, SOCK_STREAM, IPPROTO_TCP);
  280. if (sk < 0)
  281. test_error("socket()");
  282. if (test_add_key(sk, DEFAULT_TEST_PASSWORD, this_ip_dest, -1, 100, 100))
  283. test_error("setsockopt(TCP_AO_ADD_KEY)");
  284. synchronize_threads(); /* 1: MKT added => connect() */
  285. if (test_connect_socket(sk, this_ip_dest, port) <= 0)
  286. test_error("failed to connect()");
  287. synchronize_threads(); /* 2: accepted => send data */
  288. if (test_client_verify(sk, packet_sz, quota / packet_sz))
  289. test_fail("Failed to send data on connected socket");
  290. else
  291. test_ok("Verified established tcp connection");
  292. synchronize_threads(); /* 3: checkpoint the client */
  293. test_enable_repair(sk);
  294. test_sock_checkpoint(sk, &img, &saddr);
  295. test_ao_checkpoint(sk, &ao_img);
  296. test_disable_repair(sk);
  297. synchronize_threads(); /* 4: close the server, creating twsk */
  298. /*
  299. * The "corruption" in SEQ has to be small enough to fit into TCP
  300. * window, see tcp_timewait_state_process() for out-of-window
  301. * segments.
  302. */
  303. img.out.seq += 5; /* 5 is more noticeable in tcpdump than 1 */
  304. /*
  305. * FIXME: This is kind-of ugly and dirty, but it works.
  306. *
  307. * At this moment, the server has close'ed(sk).
  308. * The passive RST that is being targeted here is new data after
  309. * half-duplex close, see tcp_timewait_state_process() => TCP_TW_RST
  310. *
  311. * What is needed here is:
  312. * (1) wait for FIN from the server
  313. * (2) make sure that the ACK from the client went out
  314. * (3) make sure that the ACK was received and processed by the server
  315. *
  316. * Otherwise, the data that will be sent from "repaired" socket
  317. * post SEQ corruption may get to the server before it's in
  318. * TCP_FIN_WAIT2.
  319. *
  320. * (1) is easy with select()/poll()
  321. * (2) is possible by polling tcpi_state from TCP_INFO
  322. * (3) is quite complex: as server's socket was already closed,
  323. * probably the way to do it would be tcp-diag.
  324. */
  325. sleep(TEST_RETRANSMIT_SEC);
  326. synchronize_threads(); /* 5: restore the socket, send more data */
  327. test_kill_sk(sk);
  328. sk = socket(test_family, SOCK_STREAM, IPPROTO_TCP);
  329. if (sk < 0)
  330. test_error("socket()");
  331. test_enable_repair(sk);
  332. test_sock_restore(sk, &img, &saddr, this_ip_dest, port);
  333. if (test_add_repaired_key(sk, DEFAULT_TEST_PASSWORD, 0, this_ip_dest, -1, 100, 100))
  334. test_error("setsockopt(TCP_AO_ADD_KEY)");
  335. test_ao_restore(sk, &ao_img);
  336. if (test_get_tcp_counters(sk, &cnt1))
  337. test_error("test_get_tcp_counters()");
  338. test_disable_repair(sk);
  339. test_sock_state_free(&img);
  340. /*
  341. * This is how "passive reset" is acquired in this test from TCP_TW_RST:
  342. *
  343. * IP 10.0.254.1.7011 > 10.0.1.1.59772: Flags [P.], seq 901:1001, ack 1001, win 249,
  344. * options [tcp-ao keyid 100 rnextkeyid 100 mac 0x10217d6c36a22379086ef3b1], length 100
  345. * IP 10.0.254.1.7011 > 10.0.1.1.59772: Flags [F.], seq 1001, ack 1001, win 249,
  346. * options [tcp-ao keyid 100 rnextkeyid 100 mac 0x104ffc99b98c10a5298cc268], length 0
  347. * IP 10.0.1.1.59772 > 10.0.254.1.7011: Flags [.], ack 1002, win 251,
  348. * options [tcp-ao keyid 100 rnextkeyid 100 mac 0xe496dd4f7f5a8a66873c6f93,nop,nop,sack 1 {1001:1002}], length 0
  349. * IP 10.0.1.1.59772 > 10.0.254.1.7011: Flags [P.], seq 1006:1106, ack 1001, win 251,
  350. * options [tcp-ao keyid 100 rnextkeyid 100 mac 0x1b5f3330fb23fbcd0c77d0ca], length 100
  351. * IP 10.0.254.1.7011 > 10.0.1.1.59772: Flags [R], seq 3215596252, win 0,
  352. * options [tcp-ao keyid 100 rnextkeyid 100 mac 0x0bcfbbf497bce844312304b2], length 0
  353. */
  354. err = test_client_verify(sk, packet_sz, quota / packet_sz);
  355. /* Make sure that the connection was reset, not timeouted */
  356. if (err && err == -ECONNRESET)
  357. test_ok("client sock was passively reset post-seq-adjust");
  358. else if (err)
  359. test_fail("client sock was not reset post-seq-adjust: %d", err);
  360. else
  361. test_fail("client sock is yet connected post-seq-adjust");
  362. if (test_get_tcp_counters(sk, &cnt2))
  363. test_error("test_get_tcp_counters()");
  364. synchronize_threads(); /* 6: server exits */
  365. close(sk);
  366. test_assert_counters("client passive RST", &cnt1, &cnt2, TEST_CNT_GOOD);
  367. }
  368. static void *client_fn(void *arg)
  369. {
  370. struct netstat *ns_before, *ns_after;
  371. unsigned int port = test_server_port;
  372. ns_before = netstat_read();
  373. test_client_active_rst(port++);
  374. test_client_passive_rst(port++);
  375. ns_after = netstat_read();
  376. netstats_check(ns_before, ns_after, "client");
  377. netstat_free(ns_after);
  378. netstat_free(ns_before);
  379. synchronize_threads(); /* exit */
  380. return NULL;
  381. }
  382. int main(int argc, char *argv[])
  383. {
  384. test_init(15, server_fn, client_fn);
  385. return 0;
  386. }