NetworkTask.cpp 29 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <Kernel/Debug.h>
  7. #include <Kernel/Locking/Mutex.h>
  8. #include <Kernel/Locking/MutexProtected.h>
  9. #include <Kernel/Net/ARP.h>
  10. #include <Kernel/Net/EtherType.h>
  11. #include <Kernel/Net/EthernetFrameHeader.h>
  12. #include <Kernel/Net/ICMP.h>
  13. #include <Kernel/Net/IPv4.h>
  14. #include <Kernel/Net/IPv4Socket.h>
  15. #include <Kernel/Net/LoopbackAdapter.h>
  16. #include <Kernel/Net/NetworkTask.h>
  17. #include <Kernel/Net/NetworkingManagement.h>
  18. #include <Kernel/Net/Routing.h>
  19. #include <Kernel/Net/TCP.h>
  20. #include <Kernel/Net/TCPSocket.h>
  21. #include <Kernel/Net/UDP.h>
  22. #include <Kernel/Net/UDPSocket.h>
  23. #include <Kernel/Process.h>
  24. namespace Kernel {
  25. static void handle_arp(EthernetFrameHeader const&, size_t frame_size);
  26. static void handle_ipv4(EthernetFrameHeader const&, size_t frame_size, Time const& packet_timestamp);
  27. static void handle_icmp(EthernetFrameHeader const&, IPv4Packet const&, Time const& packet_timestamp);
  28. static void handle_udp(IPv4Packet const&, Time const& packet_timestamp);
  29. static void handle_tcp(IPv4Packet const&, Time const& packet_timestamp);
  30. static void send_delayed_tcp_ack(TCPSocket& socket);
  31. static void send_tcp_rst(IPv4Packet const& ipv4_packet, TCPPacket const& tcp_packet, LockRefPtr<NetworkAdapter> adapter);
  32. static void flush_delayed_tcp_acks();
  33. static void retransmit_tcp_packets();
  34. static Thread* network_task = nullptr;
  35. static HashTable<NonnullRefPtr<TCPSocket>>* delayed_ack_sockets;
  36. [[noreturn]] static void NetworkTask_main(void*);
  37. void NetworkTask::spawn()
  38. {
  39. auto name = KString::try_create("Network Task"sv);
  40. if (name.is_error())
  41. TODO();
  42. auto [_, first_thread] = MUST(Process::create_kernel_process(name.release_value(), NetworkTask_main, nullptr));
  43. network_task = first_thread;
  44. }
  45. bool NetworkTask::is_current()
  46. {
  47. return Thread::current() == network_task;
  48. }
  49. void NetworkTask_main(void*)
  50. {
  51. delayed_ack_sockets = new HashTable<NonnullRefPtr<TCPSocket>>;
  52. WaitQueue packet_wait_queue;
  53. int pending_packets = 0;
  54. NetworkingManagement::the().for_each([&](auto& adapter) {
  55. dmesgln("NetworkTask: {} network adapter found: hw={}", adapter.class_name(), adapter.mac_address().to_string());
  56. if (adapter.class_name() == "LoopbackAdapter"sv) {
  57. adapter.set_ipv4_address({ 127, 0, 0, 1 });
  58. adapter.set_ipv4_netmask({ 255, 0, 0, 0 });
  59. }
  60. adapter.on_receive = [&]() {
  61. pending_packets++;
  62. packet_wait_queue.wake_all();
  63. };
  64. });
  65. auto dequeue_packet = [&pending_packets](u8* buffer, size_t buffer_size, Time& packet_timestamp) -> size_t {
  66. if (pending_packets == 0)
  67. return 0;
  68. size_t packet_size = 0;
  69. NetworkingManagement::the().for_each([&](auto& adapter) {
  70. if (packet_size || !adapter.has_queued_packets())
  71. return;
  72. packet_size = adapter.dequeue_packet(buffer, buffer_size, packet_timestamp);
  73. pending_packets--;
  74. dbgln_if(NETWORK_TASK_DEBUG, "NetworkTask: Dequeued packet from {} ({} bytes)", adapter.name(), packet_size);
  75. });
  76. return packet_size;
  77. };
  78. size_t buffer_size = 64 * KiB;
  79. auto region_or_error = MM.allocate_kernel_region(buffer_size, "Kernel Packet Buffer"sv, Memory::Region::Access::ReadWrite);
  80. if (region_or_error.is_error())
  81. TODO();
  82. auto buffer_region = region_or_error.release_value();
  83. auto buffer = (u8*)buffer_region->vaddr().get();
  84. Time packet_timestamp;
  85. for (;;) {
  86. flush_delayed_tcp_acks();
  87. retransmit_tcp_packets();
  88. size_t packet_size = dequeue_packet(buffer, buffer_size, packet_timestamp);
  89. if (!packet_size) {
  90. auto timeout_time = Time::from_milliseconds(500);
  91. auto timeout = Thread::BlockTimeout { false, &timeout_time };
  92. [[maybe_unused]] auto result = packet_wait_queue.wait_on(timeout, "NetworkTask"sv);
  93. continue;
  94. }
  95. if (packet_size < sizeof(EthernetFrameHeader)) {
  96. dbgln("NetworkTask: Packet is too small to be an Ethernet packet! ({})", packet_size);
  97. continue;
  98. }
  99. auto& eth = *(EthernetFrameHeader const*)buffer;
  100. dbgln_if(ETHERNET_DEBUG, "NetworkTask: From {} to {}, ether_type={:#04x}, packet_size={}", eth.source().to_string(), eth.destination().to_string(), eth.ether_type(), packet_size);
  101. switch (eth.ether_type()) {
  102. case EtherType::ARP:
  103. handle_arp(eth, packet_size);
  104. break;
  105. case EtherType::IPv4:
  106. handle_ipv4(eth, packet_size, packet_timestamp);
  107. break;
  108. case EtherType::IPv6:
  109. // ignore
  110. break;
  111. default:
  112. dbgln_if(ETHERNET_DEBUG, "NetworkTask: Unknown ethernet type {:#04x}", eth.ether_type());
  113. }
  114. }
  115. }
  116. void handle_arp(EthernetFrameHeader const& eth, size_t frame_size)
  117. {
  118. constexpr size_t minimum_arp_frame_size = sizeof(EthernetFrameHeader) + sizeof(ARPPacket);
  119. if (frame_size < minimum_arp_frame_size) {
  120. dbgln("handle_arp: Frame too small ({}, need {})", frame_size, minimum_arp_frame_size);
  121. return;
  122. }
  123. auto& packet = *static_cast<ARPPacket const*>(eth.payload());
  124. if (packet.hardware_type() != 1 || packet.hardware_address_length() != sizeof(MACAddress)) {
  125. dbgln("handle_arp: Hardware type not ethernet ({:#04x}, len={})", packet.hardware_type(), packet.hardware_address_length());
  126. return;
  127. }
  128. if (packet.protocol_type() != EtherType::IPv4 || packet.protocol_address_length() != sizeof(IPv4Address)) {
  129. dbgln("handle_arp: Protocol type not IPv4 ({:#04x}, len={})", packet.protocol_type(), packet.protocol_address_length());
  130. return;
  131. }
  132. dbgln_if(ARP_DEBUG, "handle_arp: operation={:#04x}, sender={}/{}, target={}/{}",
  133. packet.operation(),
  134. packet.sender_hardware_address().to_string(),
  135. packet.sender_protocol_address().to_string(),
  136. packet.target_hardware_address().to_string(),
  137. packet.target_protocol_address().to_string());
  138. if (!packet.sender_hardware_address().is_zero() && !packet.sender_protocol_address().is_zero()) {
  139. // Someone has this IPv4 address. I guess we can try to remember that.
  140. // FIXME: Protect against ARP spamming.
  141. update_arp_table(packet.sender_protocol_address(), packet.sender_hardware_address(), UpdateTable::Set);
  142. }
  143. if (packet.operation() == ARPOperation::Request) {
  144. // Who has this IP address?
  145. if (auto adapter = NetworkingManagement::the().from_ipv4_address(packet.target_protocol_address())) {
  146. // We do!
  147. dbgln("handle_arp: Responding to ARP request for my IPv4 address ({})", adapter->ipv4_address());
  148. ARPPacket response;
  149. response.set_operation(ARPOperation::Response);
  150. response.set_target_hardware_address(packet.sender_hardware_address());
  151. response.set_target_protocol_address(packet.sender_protocol_address());
  152. response.set_sender_hardware_address(adapter->mac_address());
  153. response.set_sender_protocol_address(adapter->ipv4_address());
  154. adapter->send(packet.sender_hardware_address(), response);
  155. }
  156. return;
  157. }
  158. }
  159. void handle_ipv4(EthernetFrameHeader const& eth, size_t frame_size, Time const& packet_timestamp)
  160. {
  161. constexpr size_t minimum_ipv4_frame_size = sizeof(EthernetFrameHeader) + sizeof(IPv4Packet);
  162. if (frame_size < minimum_ipv4_frame_size) {
  163. dbgln("handle_ipv4: Frame too small ({}, need {})", frame_size, minimum_ipv4_frame_size);
  164. return;
  165. }
  166. auto& packet = *static_cast<IPv4Packet const*>(eth.payload());
  167. if (packet.length() < sizeof(IPv4Packet)) {
  168. dbgln("handle_ipv4: IPv4 packet too short ({}, need {})", packet.length(), sizeof(IPv4Packet));
  169. return;
  170. }
  171. size_t actual_ipv4_packet_length = frame_size - sizeof(EthernetFrameHeader);
  172. if (packet.length() > actual_ipv4_packet_length) {
  173. dbgln("handle_ipv4: IPv4 packet claims to be longer than it is ({}, actually {})", packet.length(), actual_ipv4_packet_length);
  174. return;
  175. }
  176. dbgln_if(IPV4_DEBUG, "handle_ipv4: source={}, destination={}", packet.source(), packet.destination());
  177. NetworkingManagement::the().for_each([&](auto& adapter) {
  178. if (adapter.ipv4_address().is_zero() || !adapter.link_up())
  179. return;
  180. auto my_net = adapter.ipv4_address().to_u32() & adapter.ipv4_netmask().to_u32();
  181. auto their_net = packet.source().to_u32() & adapter.ipv4_netmask().to_u32();
  182. if (my_net == their_net)
  183. update_arp_table(packet.source(), eth.source(), UpdateTable::Set);
  184. });
  185. switch ((IPv4Protocol)packet.protocol()) {
  186. case IPv4Protocol::ICMP:
  187. return handle_icmp(eth, packet, packet_timestamp);
  188. case IPv4Protocol::UDP:
  189. return handle_udp(packet, packet_timestamp);
  190. case IPv4Protocol::TCP:
  191. return handle_tcp(packet, packet_timestamp);
  192. default:
  193. dbgln_if(IPV4_DEBUG, "handle_ipv4: Unhandled protocol {:#02x}", packet.protocol());
  194. break;
  195. }
  196. }
  197. void handle_icmp(EthernetFrameHeader const& eth, IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  198. {
  199. auto& icmp_header = *static_cast<ICMPHeader const*>(ipv4_packet.payload());
  200. dbgln_if(ICMP_DEBUG, "handle_icmp: source={}, destination={}, type={:#02x}, code={:#02x}", ipv4_packet.source().to_string(), ipv4_packet.destination().to_string(), icmp_header.type(), icmp_header.code());
  201. {
  202. Vector<NonnullRefPtr<IPv4Socket>> icmp_sockets;
  203. IPv4Socket::all_sockets().with_exclusive([&](auto& sockets) {
  204. for (auto& socket : sockets) {
  205. if (socket.protocol() == (unsigned)IPv4Protocol::ICMP)
  206. icmp_sockets.append(socket);
  207. }
  208. });
  209. for (auto& socket : icmp_sockets)
  210. socket->did_receive(ipv4_packet.source(), 0, { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  211. }
  212. auto adapter = NetworkingManagement::the().from_ipv4_address(ipv4_packet.destination());
  213. if (!adapter)
  214. return;
  215. if (icmp_header.type() == ICMPType::EchoRequest) {
  216. auto& request = reinterpret_cast<ICMPEchoPacket const&>(icmp_header);
  217. dbgln("handle_icmp: EchoRequest from {}: id={}, seq={}", ipv4_packet.source(), (u16)request.identifier, (u16)request.sequence_number);
  218. size_t icmp_packet_size = ipv4_packet.payload_size();
  219. if (icmp_packet_size < sizeof(ICMPEchoPacket)) {
  220. dbgln("handle_icmp: EchoRequest packet is too small, ignoring.");
  221. return;
  222. }
  223. auto ipv4_payload_offset = adapter->ipv4_payload_offset();
  224. auto packet = adapter->acquire_packet_buffer(ipv4_payload_offset + icmp_packet_size);
  225. if (!packet) {
  226. dbgln("Could not allocate packet buffer while sending ICMP packet");
  227. return;
  228. }
  229. adapter->fill_in_ipv4_header(*packet, adapter->ipv4_address(), eth.source(), ipv4_packet.source(), IPv4Protocol::ICMP, icmp_packet_size, 0, 64);
  230. memset(packet->buffer->data() + ipv4_payload_offset, 0, sizeof(ICMPEchoPacket));
  231. auto& response = *(ICMPEchoPacket*)(packet->buffer->data() + ipv4_payload_offset);
  232. response.header.set_type(ICMPType::EchoReply);
  233. response.header.set_code(0);
  234. response.identifier = request.identifier;
  235. response.sequence_number = request.sequence_number;
  236. if (size_t icmp_payload_size = icmp_packet_size - sizeof(ICMPEchoPacket))
  237. memcpy(response.payload(), request.payload(), icmp_payload_size);
  238. response.header.set_checksum(internet_checksum(&response, icmp_packet_size));
  239. // FIXME: What is the right TTL value here? Is 64 ok? Should we use the same TTL as the echo request?
  240. adapter->send_packet(packet->bytes());
  241. adapter->release_packet_buffer(*packet);
  242. }
  243. }
  244. void handle_udp(IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  245. {
  246. if (ipv4_packet.payload_size() < sizeof(UDPPacket)) {
  247. dbgln("handle_udp: Packet too small ({}, need {})", ipv4_packet.payload_size(), sizeof(UDPPacket));
  248. return;
  249. }
  250. auto& udp_packet = *static_cast<UDPPacket const*>(ipv4_packet.payload());
  251. dbgln_if(UDP_DEBUG, "handle_udp: source={}:{}, destination={}:{}, length={}",
  252. ipv4_packet.source(), udp_packet.source_port(),
  253. ipv4_packet.destination(), udp_packet.destination_port(),
  254. udp_packet.length());
  255. auto socket = UDPSocket::from_port(udp_packet.destination_port());
  256. if (!socket) {
  257. dbgln_if(UDP_DEBUG, "handle_udp: No local UDP socket for {}:{}", ipv4_packet.destination(), udp_packet.destination_port());
  258. return;
  259. }
  260. VERIFY(socket->type() == SOCK_DGRAM);
  261. VERIFY(socket->local_port() == udp_packet.destination_port());
  262. auto& destination = ipv4_packet.destination();
  263. if (destination == IPv4Address(255, 255, 255, 255) || NetworkingManagement::the().from_ipv4_address(destination) || socket->multicast_memberships().contains_slow(destination))
  264. socket->did_receive(ipv4_packet.source(), udp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  265. }
  266. void send_delayed_tcp_ack(TCPSocket& socket)
  267. {
  268. VERIFY(socket.mutex().is_locked());
  269. if (!socket.should_delay_next_ack()) {
  270. [[maybe_unused]] auto result = socket.send_ack();
  271. return;
  272. }
  273. delayed_ack_sockets->set(move(socket));
  274. }
  275. void flush_delayed_tcp_acks()
  276. {
  277. Vector<NonnullRefPtr<TCPSocket>, 32> remaining_sockets;
  278. for (auto& socket : *delayed_ack_sockets) {
  279. MutexLocker locker(socket->mutex());
  280. if (socket->should_delay_next_ack()) {
  281. MUST(remaining_sockets.try_append(*socket));
  282. continue;
  283. }
  284. [[maybe_unused]] auto result = socket->send_ack();
  285. }
  286. if (remaining_sockets.size() != delayed_ack_sockets->size()) {
  287. delayed_ack_sockets->clear();
  288. if (remaining_sockets.size() > 0)
  289. dbgln("flush_delayed_tcp_acks: {} sockets remaining", remaining_sockets.size());
  290. for (auto&& socket : remaining_sockets)
  291. delayed_ack_sockets->set(move(socket));
  292. }
  293. }
  294. void send_tcp_rst(IPv4Packet const& ipv4_packet, TCPPacket const& tcp_packet, LockRefPtr<NetworkAdapter> adapter)
  295. {
  296. auto routing_decision = route_to(ipv4_packet.source(), ipv4_packet.destination(), adapter);
  297. if (routing_decision.is_zero())
  298. return;
  299. auto ipv4_payload_offset = routing_decision.adapter->ipv4_payload_offset();
  300. const size_t options_size = 0;
  301. const size_t tcp_header_size = sizeof(TCPPacket) + options_size;
  302. const size_t buffer_size = ipv4_payload_offset + tcp_header_size;
  303. auto packet = routing_decision.adapter->acquire_packet_buffer(buffer_size);
  304. if (!packet)
  305. return;
  306. routing_decision.adapter->fill_in_ipv4_header(*packet, ipv4_packet.destination(),
  307. routing_decision.next_hop, ipv4_packet.source(), IPv4Protocol::TCP,
  308. buffer_size - ipv4_payload_offset, 0, 64);
  309. auto& rst_packet = *(TCPPacket*)(packet->buffer->data() + ipv4_payload_offset);
  310. rst_packet = {};
  311. rst_packet.set_source_port(tcp_packet.destination_port());
  312. rst_packet.set_destination_port(tcp_packet.source_port());
  313. rst_packet.set_window_size(0);
  314. rst_packet.set_sequence_number(0);
  315. rst_packet.set_ack_number(tcp_packet.sequence_number() + 1);
  316. rst_packet.set_data_offset(tcp_header_size / sizeof(u32));
  317. rst_packet.set_flags(TCPFlags::RST | TCPFlags::ACK);
  318. rst_packet.set_checksum(TCPSocket::compute_tcp_checksum(ipv4_packet.source(), ipv4_packet.destination(), rst_packet, 0));
  319. routing_decision.adapter->send_packet(packet->bytes());
  320. routing_decision.adapter->release_packet_buffer(*packet);
  321. }
  322. void handle_tcp(IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  323. {
  324. if (ipv4_packet.payload_size() < sizeof(TCPPacket)) {
  325. dbgln("handle_tcp: IPv4 payload is too small to be a TCP packet ({}, need {})", ipv4_packet.payload_size(), sizeof(TCPPacket));
  326. return;
  327. }
  328. auto& tcp_packet = *static_cast<TCPPacket const*>(ipv4_packet.payload());
  329. size_t minimum_tcp_header_size = 5 * sizeof(u32);
  330. size_t maximum_tcp_header_size = 15 * sizeof(u32);
  331. if (tcp_packet.header_size() < minimum_tcp_header_size || tcp_packet.header_size() > maximum_tcp_header_size) {
  332. dbgln("handle_tcp: TCP packet header has invalid size {}", tcp_packet.header_size());
  333. }
  334. if (ipv4_packet.payload_size() < tcp_packet.header_size()) {
  335. dbgln("handle_tcp: IPv4 payload is smaller than TCP header claims ({}, supposedly {})", ipv4_packet.payload_size(), tcp_packet.header_size());
  336. return;
  337. }
  338. size_t payload_size = ipv4_packet.payload_size() - tcp_packet.header_size();
  339. dbgln_if(TCP_DEBUG, "handle_tcp: source={}:{}, destination={}:{}, seq_no={}, ack_no={}, flags={:#04x} ({}{}{}{}), window_size={}, payload_size={}",
  340. ipv4_packet.source().to_string(),
  341. tcp_packet.source_port(),
  342. ipv4_packet.destination().to_string(),
  343. tcp_packet.destination_port(),
  344. tcp_packet.sequence_number(),
  345. tcp_packet.ack_number(),
  346. tcp_packet.flags(),
  347. tcp_packet.has_syn() ? "SYN " : "",
  348. tcp_packet.has_ack() ? "ACK " : "",
  349. tcp_packet.has_fin() ? "FIN " : "",
  350. tcp_packet.has_rst() ? "RST " : "",
  351. tcp_packet.window_size(),
  352. payload_size);
  353. auto adapter = NetworkingManagement::the().from_ipv4_address(ipv4_packet.destination());
  354. if (!adapter) {
  355. dbgln("handle_tcp: this packet is not for me, it's for {}", ipv4_packet.destination());
  356. return;
  357. }
  358. IPv4SocketTuple tuple(ipv4_packet.destination(), tcp_packet.destination_port(), ipv4_packet.source(), tcp_packet.source_port());
  359. dbgln_if(TCP_DEBUG, "handle_tcp: looking for socket; tuple={}", tuple.to_string());
  360. auto socket = TCPSocket::from_tuple(tuple);
  361. if (!socket) {
  362. if (!tcp_packet.has_rst()) {
  363. dbgln("handle_tcp: No TCP socket for tuple {}. Sending RST.", tuple.to_string());
  364. send_tcp_rst(ipv4_packet, tcp_packet, adapter);
  365. }
  366. return;
  367. }
  368. MutexLocker locker(socket->mutex());
  369. VERIFY(socket->type() == SOCK_STREAM);
  370. VERIFY(socket->local_port() == tcp_packet.destination_port());
  371. dbgln_if(TCP_DEBUG, "handle_tcp: got socket {}; state={}", socket->tuple().to_string(), TCPSocket::to_string(socket->state()));
  372. socket->receive_tcp_packet(tcp_packet, ipv4_packet.payload_size());
  373. switch (socket->state()) {
  374. case TCPSocket::State::Closed:
  375. dbgln("handle_tcp: unexpected flags in Closed state ({:x})", tcp_packet.flags());
  376. // TODO: we may want to send an RST here, maybe as a configurable option
  377. return;
  378. case TCPSocket::State::TimeWait:
  379. dbgln("handle_tcp: unexpected flags in TimeWait state ({:x})", tcp_packet.flags());
  380. (void)socket->send_tcp_packet(TCPFlags::RST);
  381. socket->set_state(TCPSocket::State::Closed);
  382. return;
  383. case TCPSocket::State::Listen:
  384. switch (tcp_packet.flags()) {
  385. case TCPFlags::SYN: {
  386. dbgln_if(TCP_DEBUG, "handle_tcp: incoming connection");
  387. auto& local_address = ipv4_packet.destination();
  388. auto& peer_address = ipv4_packet.source();
  389. auto client_or_error = socket->try_create_client(local_address, tcp_packet.destination_port(), peer_address, tcp_packet.source_port());
  390. if (client_or_error.is_error()) {
  391. dmesgln("handle_tcp: couldn't create client socket: {}", client_or_error.error());
  392. return;
  393. }
  394. auto client = client_or_error.release_value();
  395. MutexLocker locker(client->mutex());
  396. dbgln_if(TCP_DEBUG, "handle_tcp: created new client socket with tuple {}", client->tuple().to_string());
  397. client->set_sequence_number(1000);
  398. client->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  399. [[maybe_unused]] auto rc2 = client->send_tcp_packet(TCPFlags::SYN | TCPFlags::ACK);
  400. client->set_state(TCPSocket::State::SynReceived);
  401. return;
  402. }
  403. default:
  404. dbgln("handle_tcp: unexpected flags in Listen state ({:x})", tcp_packet.flags());
  405. // socket->send_tcp_packet(TCPFlags::RST);
  406. return;
  407. }
  408. case TCPSocket::State::SynSent:
  409. switch (tcp_packet.flags()) {
  410. case TCPFlags::SYN:
  411. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  412. (void)socket->send_tcp_packet(TCPFlags::SYN | TCPFlags::ACK);
  413. socket->set_state(TCPSocket::State::SynReceived);
  414. return;
  415. case TCPFlags::ACK | TCPFlags::SYN:
  416. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  417. (void)socket->send_ack(true);
  418. socket->set_state(TCPSocket::State::Established);
  419. socket->set_setup_state(Socket::SetupState::Completed);
  420. socket->set_connected(true);
  421. return;
  422. case TCPFlags::ACK | TCPFlags::FIN:
  423. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  424. send_delayed_tcp_ack(*socket);
  425. socket->set_state(TCPSocket::State::Closed);
  426. socket->set_error(TCPSocket::Error::FINDuringConnect);
  427. socket->set_setup_state(Socket::SetupState::Completed);
  428. return;
  429. case TCPFlags::ACK | TCPFlags::RST:
  430. socket->set_state(TCPSocket::State::Closed);
  431. socket->set_error(TCPSocket::Error::RSTDuringConnect);
  432. socket->set_setup_state(Socket::SetupState::Completed);
  433. return;
  434. default:
  435. dbgln("handle_tcp: unexpected flags in SynSent state ({:x})", tcp_packet.flags());
  436. (void)socket->send_tcp_packet(TCPFlags::RST);
  437. socket->set_state(TCPSocket::State::Closed);
  438. socket->set_error(TCPSocket::Error::UnexpectedFlagsDuringConnect);
  439. socket->set_setup_state(Socket::SetupState::Completed);
  440. return;
  441. }
  442. case TCPSocket::State::SynReceived:
  443. switch (tcp_packet.flags()) {
  444. case TCPFlags::ACK:
  445. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  446. switch (socket->direction()) {
  447. case TCPSocket::Direction::Incoming:
  448. if (!socket->has_originator()) {
  449. dbgln("handle_tcp: connection doesn't have an originating socket; maybe it went away?");
  450. (void)socket->send_tcp_packet(TCPFlags::RST);
  451. socket->set_state(TCPSocket::State::Closed);
  452. return;
  453. }
  454. socket->set_state(TCPSocket::State::Established);
  455. socket->set_setup_state(Socket::SetupState::Completed);
  456. socket->release_to_originator();
  457. return;
  458. case TCPSocket::Direction::Outgoing:
  459. socket->set_state(TCPSocket::State::Established);
  460. socket->set_setup_state(Socket::SetupState::Completed);
  461. socket->set_connected(true);
  462. return;
  463. default:
  464. dbgln("handle_tcp: got ACK in SynReceived state but direction is invalid ({})", TCPSocket::to_string(socket->direction()));
  465. (void)socket->send_tcp_packet(TCPFlags::RST);
  466. socket->set_state(TCPSocket::State::Closed);
  467. return;
  468. }
  469. VERIFY_NOT_REACHED();
  470. case TCPFlags::SYN:
  471. dbgln("handle_tcp: ignoring SYN for partially established connection");
  472. return;
  473. default:
  474. dbgln("handle_tcp: unexpected flags in SynReceived state ({:x})", tcp_packet.flags());
  475. (void)socket->send_tcp_packet(TCPFlags::RST);
  476. socket->set_state(TCPSocket::State::Closed);
  477. return;
  478. }
  479. case TCPSocket::State::CloseWait:
  480. switch (tcp_packet.flags()) {
  481. default:
  482. dbgln("handle_tcp: unexpected flags in CloseWait state ({:x})", tcp_packet.flags());
  483. (void)socket->send_tcp_packet(TCPFlags::RST);
  484. socket->set_state(TCPSocket::State::Closed);
  485. return;
  486. }
  487. case TCPSocket::State::LastAck:
  488. switch (tcp_packet.flags()) {
  489. case TCPFlags::ACK:
  490. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  491. socket->set_state(TCPSocket::State::Closed);
  492. return;
  493. default:
  494. dbgln("handle_tcp: unexpected flags in LastAck state ({:x})", tcp_packet.flags());
  495. (void)socket->send_tcp_packet(TCPFlags::RST);
  496. socket->set_state(TCPSocket::State::Closed);
  497. return;
  498. }
  499. case TCPSocket::State::FinWait1:
  500. switch (tcp_packet.flags()) {
  501. case TCPFlags::ACK:
  502. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  503. socket->set_state(TCPSocket::State::FinWait2);
  504. return;
  505. case TCPFlags::FIN:
  506. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  507. socket->set_state(TCPSocket::State::Closing);
  508. (void)socket->send_ack(true);
  509. return;
  510. case TCPFlags::FIN | TCPFlags::ACK:
  511. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  512. socket->set_state(TCPSocket::State::TimeWait);
  513. (void)socket->send_ack(true);
  514. return;
  515. default:
  516. dbgln("handle_tcp: unexpected flags in FinWait1 state ({:x})", tcp_packet.flags());
  517. (void)socket->send_tcp_packet(TCPFlags::RST);
  518. socket->set_state(TCPSocket::State::Closed);
  519. return;
  520. }
  521. case TCPSocket::State::FinWait2:
  522. switch (tcp_packet.flags()) {
  523. case TCPFlags::FIN:
  524. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  525. socket->set_state(TCPSocket::State::TimeWait);
  526. (void)socket->send_ack(true);
  527. return;
  528. case TCPFlags::ACK | TCPFlags::RST:
  529. // FIXME: Verify that this transition is legitimate.
  530. socket->set_state(TCPSocket::State::Closed);
  531. return;
  532. default:
  533. dbgln("handle_tcp: unexpected flags in FinWait2 state ({:x})", tcp_packet.flags());
  534. (void)socket->send_tcp_packet(TCPFlags::RST);
  535. socket->set_state(TCPSocket::State::Closed);
  536. return;
  537. }
  538. case TCPSocket::State::Closing:
  539. switch (tcp_packet.flags()) {
  540. case TCPFlags::ACK:
  541. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  542. socket->set_state(TCPSocket::State::TimeWait);
  543. return;
  544. default:
  545. dbgln("handle_tcp: unexpected flags in Closing state ({:x})", tcp_packet.flags());
  546. (void)socket->send_tcp_packet(TCPFlags::RST);
  547. socket->set_state(TCPSocket::State::Closed);
  548. return;
  549. }
  550. case TCPSocket::State::Established:
  551. if (tcp_packet.has_rst()) {
  552. socket->set_state(TCPSocket::State::Closed);
  553. return;
  554. }
  555. if (tcp_packet.sequence_number() != socket->ack_number()) {
  556. dbgln_if(TCP_DEBUG, "Discarding out of order packet: seq {} vs. ack {}", tcp_packet.sequence_number(), socket->ack_number());
  557. if (socket->duplicate_acks() < TCPSocket::maximum_duplicate_acks) {
  558. dbgln_if(TCP_DEBUG, "Sending ACK with same ack number to trigger fast retransmission");
  559. socket->set_duplicate_acks(socket->duplicate_acks() + 1);
  560. [[maybe_unused]] auto result = socket->send_ack(true);
  561. }
  562. return;
  563. }
  564. socket->set_duplicate_acks(0);
  565. if (tcp_packet.has_fin()) {
  566. if (payload_size != 0)
  567. socket->did_receive(ipv4_packet.source(), tcp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  568. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  569. send_delayed_tcp_ack(*socket);
  570. socket->set_state(TCPSocket::State::CloseWait);
  571. socket->set_connected(false);
  572. return;
  573. }
  574. if (payload_size) {
  575. if (socket->did_receive(ipv4_packet.source(), tcp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp)) {
  576. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  577. dbgln_if(TCP_DEBUG, "Got packet with ack_no={}, seq_no={}, payload_size={}, acking it with new ack_no={}, seq_no={}",
  578. tcp_packet.ack_number(), tcp_packet.sequence_number(), payload_size, socket->ack_number(), socket->sequence_number());
  579. send_delayed_tcp_ack(*socket);
  580. }
  581. }
  582. }
  583. }
  584. void retransmit_tcp_packets()
  585. {
  586. // We must keep the sockets alive until after we've unlocked the hash table
  587. // in case retransmit_packets() realizes that it wants to close the socket.
  588. Vector<NonnullRefPtr<TCPSocket>, 16> sockets;
  589. TCPSocket::sockets_for_retransmit().for_each_shared([&](auto const& socket) {
  590. // We ignore allocation failures above the first 16 guaranteed socket slots, as
  591. // we will just retransmit their packets the next time around
  592. (void)sockets.try_append(socket);
  593. });
  594. for (auto& socket : sockets) {
  595. MutexLocker socket_locker(socket->mutex());
  596. socket->retransmit_packets();
  597. }
  598. }
  599. }