NetworkTask.cpp 29 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <Kernel/Debug.h>
  7. #include <Kernel/Locking/Mutex.h>
  8. #include <Kernel/Locking/MutexProtected.h>
  9. #include <Kernel/Net/ARP.h>
  10. #include <Kernel/Net/EtherType.h>
  11. #include <Kernel/Net/EthernetFrameHeader.h>
  12. #include <Kernel/Net/ICMP.h>
  13. #include <Kernel/Net/IPv4.h>
  14. #include <Kernel/Net/IPv4Socket.h>
  15. #include <Kernel/Net/LoopbackAdapter.h>
  16. #include <Kernel/Net/NetworkTask.h>
  17. #include <Kernel/Net/NetworkingManagement.h>
  18. #include <Kernel/Net/Routing.h>
  19. #include <Kernel/Net/TCP.h>
  20. #include <Kernel/Net/TCPSocket.h>
  21. #include <Kernel/Net/UDP.h>
  22. #include <Kernel/Net/UDPSocket.h>
  23. #include <Kernel/Process.h>
  24. namespace Kernel {
  25. static void handle_arp(EthernetFrameHeader const&, size_t frame_size);
  26. static void handle_ipv4(EthernetFrameHeader const&, size_t frame_size, Time const& packet_timestamp);
  27. static void handle_icmp(EthernetFrameHeader const&, IPv4Packet const&, Time const& packet_timestamp);
  28. static void handle_udp(IPv4Packet const&, Time const& packet_timestamp);
  29. static void handle_tcp(IPv4Packet const&, Time const& packet_timestamp);
  30. static void send_delayed_tcp_ack(RefPtr<TCPSocket> socket);
  31. static void send_tcp_rst(IPv4Packet const& ipv4_packet, TCPPacket const& tcp_packet, RefPtr<NetworkAdapter> adapter);
  32. static void flush_delayed_tcp_acks();
  33. static void retransmit_tcp_packets();
  34. static Thread* network_task = nullptr;
  35. static HashTable<RefPtr<TCPSocket>>* delayed_ack_sockets;
  36. [[noreturn]] static void NetworkTask_main(void*);
  37. void NetworkTask::spawn()
  38. {
  39. RefPtr<Thread> thread;
  40. auto name = KString::try_create("NetworkTask");
  41. if (name.is_error())
  42. TODO();
  43. Process::create_kernel_process(thread, name.release_value(), NetworkTask_main, nullptr);
  44. network_task = thread;
  45. }
  46. bool NetworkTask::is_current()
  47. {
  48. return Thread::current() == network_task;
  49. }
  50. void NetworkTask_main(void*)
  51. {
  52. delayed_ack_sockets = new HashTable<RefPtr<TCPSocket>>;
  53. WaitQueue packet_wait_queue;
  54. int pending_packets = 0;
  55. NetworkingManagement::the().for_each([&](auto& adapter) {
  56. dmesgln("NetworkTask: {} network adapter found: hw={}", adapter.class_name(), adapter.mac_address().to_string());
  57. if (adapter.class_name() == "LoopbackAdapter"sv) {
  58. adapter.set_ipv4_address({ 127, 0, 0, 1 });
  59. adapter.set_ipv4_netmask({ 255, 0, 0, 0 });
  60. adapter.set_ipv4_gateway({ 0, 0, 0, 0 });
  61. }
  62. adapter.on_receive = [&]() {
  63. pending_packets++;
  64. packet_wait_queue.wake_all();
  65. };
  66. });
  67. auto dequeue_packet = [&pending_packets](u8* buffer, size_t buffer_size, Time& packet_timestamp) -> size_t {
  68. if (pending_packets == 0)
  69. return 0;
  70. size_t packet_size = 0;
  71. NetworkingManagement::the().for_each([&](auto& adapter) {
  72. if (packet_size || !adapter.has_queued_packets())
  73. return;
  74. packet_size = adapter.dequeue_packet(buffer, buffer_size, packet_timestamp);
  75. pending_packets--;
  76. dbgln_if(NETWORK_TASK_DEBUG, "NetworkTask: Dequeued packet from {} ({} bytes)", adapter.name(), packet_size);
  77. });
  78. return packet_size;
  79. };
  80. size_t buffer_size = 64 * KiB;
  81. auto region_or_error = MM.allocate_kernel_region(buffer_size, "Kernel Packet Buffer", Memory::Region::Access::ReadWrite);
  82. if (region_or_error.is_error())
  83. TODO();
  84. auto buffer_region = region_or_error.release_value();
  85. auto buffer = (u8*)buffer_region->vaddr().get();
  86. Time packet_timestamp;
  87. for (;;) {
  88. flush_delayed_tcp_acks();
  89. retransmit_tcp_packets();
  90. size_t packet_size = dequeue_packet(buffer, buffer_size, packet_timestamp);
  91. if (!packet_size) {
  92. auto timeout_time = Time::from_milliseconds(500);
  93. auto timeout = Thread::BlockTimeout { false, &timeout_time };
  94. [[maybe_unused]] auto result = packet_wait_queue.wait_on(timeout, "NetworkTask");
  95. continue;
  96. }
  97. if (packet_size < sizeof(EthernetFrameHeader)) {
  98. dbgln("NetworkTask: Packet is too small to be an Ethernet packet! ({})", packet_size);
  99. continue;
  100. }
  101. auto& eth = *(EthernetFrameHeader const*)buffer;
  102. dbgln_if(ETHERNET_DEBUG, "NetworkTask: From {} to {}, ether_type={:#04x}, packet_size={}", eth.source().to_string(), eth.destination().to_string(), eth.ether_type(), packet_size);
  103. switch (eth.ether_type()) {
  104. case EtherType::ARP:
  105. handle_arp(eth, packet_size);
  106. break;
  107. case EtherType::IPv4:
  108. handle_ipv4(eth, packet_size, packet_timestamp);
  109. break;
  110. case EtherType::IPv6:
  111. // ignore
  112. break;
  113. default:
  114. dbgln_if(ETHERNET_DEBUG, "NetworkTask: Unknown ethernet type {:#04x}", eth.ether_type());
  115. }
  116. }
  117. }
  118. void handle_arp(EthernetFrameHeader const& eth, size_t frame_size)
  119. {
  120. constexpr size_t minimum_arp_frame_size = sizeof(EthernetFrameHeader) + sizeof(ARPPacket);
  121. if (frame_size < minimum_arp_frame_size) {
  122. dbgln("handle_arp: Frame too small ({}, need {})", frame_size, minimum_arp_frame_size);
  123. return;
  124. }
  125. auto& packet = *static_cast<ARPPacket const*>(eth.payload());
  126. if (packet.hardware_type() != 1 || packet.hardware_address_length() != sizeof(MACAddress)) {
  127. dbgln("handle_arp: Hardware type not ethernet ({:#04x}, len={})", packet.hardware_type(), packet.hardware_address_length());
  128. return;
  129. }
  130. if (packet.protocol_type() != EtherType::IPv4 || packet.protocol_address_length() != sizeof(IPv4Address)) {
  131. dbgln("handle_arp: Protocol type not IPv4 ({:#04x}, len={})", packet.protocol_type(), packet.protocol_address_length());
  132. return;
  133. }
  134. dbgln_if(ARP_DEBUG, "handle_arp: operation={:#04x}, sender={}/{}, target={}/{}",
  135. packet.operation(),
  136. packet.sender_hardware_address().to_string(),
  137. packet.sender_protocol_address().to_string(),
  138. packet.target_hardware_address().to_string(),
  139. packet.target_protocol_address().to_string());
  140. if (!packet.sender_hardware_address().is_zero() && !packet.sender_protocol_address().is_zero()) {
  141. // Someone has this IPv4 address. I guess we can try to remember that.
  142. // FIXME: Protect against ARP spamming.
  143. update_arp_table(packet.sender_protocol_address(), packet.sender_hardware_address(), UpdateArp::Set);
  144. }
  145. if (packet.operation() == ARPOperation::Request) {
  146. // Who has this IP address?
  147. if (auto adapter = NetworkingManagement::the().from_ipv4_address(packet.target_protocol_address())) {
  148. // We do!
  149. dbgln("handle_arp: Responding to ARP request for my IPv4 address ({})", adapter->ipv4_address());
  150. ARPPacket response;
  151. response.set_operation(ARPOperation::Response);
  152. response.set_target_hardware_address(packet.sender_hardware_address());
  153. response.set_target_protocol_address(packet.sender_protocol_address());
  154. response.set_sender_hardware_address(adapter->mac_address());
  155. response.set_sender_protocol_address(adapter->ipv4_address());
  156. adapter->send(packet.sender_hardware_address(), response);
  157. }
  158. return;
  159. }
  160. }
  161. void handle_ipv4(EthernetFrameHeader const& eth, size_t frame_size, Time const& packet_timestamp)
  162. {
  163. constexpr size_t minimum_ipv4_frame_size = sizeof(EthernetFrameHeader) + sizeof(IPv4Packet);
  164. if (frame_size < minimum_ipv4_frame_size) {
  165. dbgln("handle_ipv4: Frame too small ({}, need {})", frame_size, minimum_ipv4_frame_size);
  166. return;
  167. }
  168. auto& packet = *static_cast<IPv4Packet const*>(eth.payload());
  169. if (packet.length() < sizeof(IPv4Packet)) {
  170. dbgln("handle_ipv4: IPv4 packet too short ({}, need {})", packet.length(), sizeof(IPv4Packet));
  171. return;
  172. }
  173. size_t actual_ipv4_packet_length = frame_size - sizeof(EthernetFrameHeader);
  174. if (packet.length() > actual_ipv4_packet_length) {
  175. dbgln("handle_ipv4: IPv4 packet claims to be longer than it is ({}, actually {})", packet.length(), actual_ipv4_packet_length);
  176. return;
  177. }
  178. dbgln_if(IPV4_DEBUG, "handle_ipv4: source={}, destination={}", packet.source(), packet.destination());
  179. NetworkingManagement::the().for_each([&](auto& adapter) {
  180. if (adapter.link_up()) {
  181. auto my_net = adapter.ipv4_address().to_u32() & adapter.ipv4_netmask().to_u32();
  182. auto their_net = packet.source().to_u32() & adapter.ipv4_netmask().to_u32();
  183. if (my_net == their_net)
  184. update_arp_table(packet.source(), eth.source(), UpdateArp::Set);
  185. }
  186. });
  187. switch ((IPv4Protocol)packet.protocol()) {
  188. case IPv4Protocol::ICMP:
  189. return handle_icmp(eth, packet, packet_timestamp);
  190. case IPv4Protocol::UDP:
  191. return handle_udp(packet, packet_timestamp);
  192. case IPv4Protocol::TCP:
  193. return handle_tcp(packet, packet_timestamp);
  194. default:
  195. dbgln_if(IPV4_DEBUG, "handle_ipv4: Unhandled protocol {:#02x}", packet.protocol());
  196. break;
  197. }
  198. }
  199. void handle_icmp(EthernetFrameHeader const& eth, IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  200. {
  201. auto& icmp_header = *static_cast<ICMPHeader const*>(ipv4_packet.payload());
  202. dbgln_if(ICMP_DEBUG, "handle_icmp: source={}, destination={}, type={:#02x}, code={:#02x}", ipv4_packet.source().to_string(), ipv4_packet.destination().to_string(), icmp_header.type(), icmp_header.code());
  203. {
  204. NonnullRefPtrVector<IPv4Socket> icmp_sockets;
  205. IPv4Socket::all_sockets().with_exclusive([&](auto& sockets) {
  206. for (auto& socket : sockets) {
  207. if (socket.protocol() == (unsigned)IPv4Protocol::ICMP)
  208. icmp_sockets.append(socket);
  209. }
  210. });
  211. for (auto& socket : icmp_sockets)
  212. socket.did_receive(ipv4_packet.source(), 0, { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  213. }
  214. auto adapter = NetworkingManagement::the().from_ipv4_address(ipv4_packet.destination());
  215. if (!adapter)
  216. return;
  217. if (icmp_header.type() == ICMPType::EchoRequest) {
  218. auto& request = reinterpret_cast<ICMPEchoPacket const&>(icmp_header);
  219. dbgln("handle_icmp: EchoRequest from {}: id={}, seq={}", ipv4_packet.source(), (u16)request.identifier, (u16)request.sequence_number);
  220. size_t icmp_packet_size = ipv4_packet.payload_size();
  221. if (icmp_packet_size < sizeof(ICMPEchoPacket)) {
  222. dbgln("handle_icmp: EchoRequest packet is too small, ignoring.");
  223. return;
  224. }
  225. auto ipv4_payload_offset = adapter->ipv4_payload_offset();
  226. auto packet = adapter->acquire_packet_buffer(ipv4_payload_offset + icmp_packet_size);
  227. if (!packet) {
  228. dbgln("Could not allocate packet buffer while sending ICMP packet");
  229. return;
  230. }
  231. adapter->fill_in_ipv4_header(*packet, adapter->ipv4_address(), eth.source(), ipv4_packet.source(), IPv4Protocol::ICMP, icmp_packet_size, 0, 64);
  232. memset(packet->buffer->data() + ipv4_payload_offset, 0, sizeof(ICMPEchoPacket));
  233. auto& response = *(ICMPEchoPacket*)(packet->buffer->data() + ipv4_payload_offset);
  234. response.header.set_type(ICMPType::EchoReply);
  235. response.header.set_code(0);
  236. response.identifier = request.identifier;
  237. response.sequence_number = request.sequence_number;
  238. if (size_t icmp_payload_size = icmp_packet_size - sizeof(ICMPEchoPacket))
  239. memcpy(response.payload(), request.payload(), icmp_payload_size);
  240. response.header.set_checksum(internet_checksum(&response, icmp_packet_size));
  241. // FIXME: What is the right TTL value here? Is 64 ok? Should we use the same TTL as the echo request?
  242. adapter->send_packet(packet->bytes());
  243. adapter->release_packet_buffer(*packet);
  244. }
  245. }
  246. void handle_udp(IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  247. {
  248. if (ipv4_packet.payload_size() < sizeof(UDPPacket)) {
  249. dbgln("handle_udp: Packet too small ({}, need {})", ipv4_packet.payload_size(), sizeof(UDPPacket));
  250. return;
  251. }
  252. auto& udp_packet = *static_cast<UDPPacket const*>(ipv4_packet.payload());
  253. dbgln_if(UDP_DEBUG, "handle_udp: source={}:{}, destination={}:{}, length={}",
  254. ipv4_packet.source(), udp_packet.source_port(),
  255. ipv4_packet.destination(), udp_packet.destination_port(),
  256. udp_packet.length());
  257. auto socket = UDPSocket::from_port(udp_packet.destination_port());
  258. if (!socket) {
  259. dbgln_if(UDP_DEBUG, "handle_udp: No local UDP socket for {}:{}", ipv4_packet.destination(), udp_packet.destination_port());
  260. return;
  261. }
  262. VERIFY(socket->type() == SOCK_DGRAM);
  263. VERIFY(socket->local_port() == udp_packet.destination_port());
  264. auto& destination = ipv4_packet.destination();
  265. if (destination == IPv4Address(255, 255, 255, 255) || NetworkingManagement::the().from_ipv4_address(destination) || socket->multicast_memberships().contains_slow(destination))
  266. socket->did_receive(ipv4_packet.source(), udp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  267. }
  268. void send_delayed_tcp_ack(RefPtr<TCPSocket> socket)
  269. {
  270. VERIFY(socket->mutex().is_locked());
  271. if (!socket->should_delay_next_ack()) {
  272. [[maybe_unused]] auto result = socket->send_ack();
  273. return;
  274. }
  275. delayed_ack_sockets->set(move(socket));
  276. }
  277. void flush_delayed_tcp_acks()
  278. {
  279. Vector<RefPtr<TCPSocket>, 32> remaining_sockets;
  280. for (auto& socket : *delayed_ack_sockets) {
  281. MutexLocker locker(socket->mutex());
  282. if (socket->should_delay_next_ack()) {
  283. remaining_sockets.append(socket);
  284. continue;
  285. }
  286. [[maybe_unused]] auto result = socket->send_ack();
  287. }
  288. if (remaining_sockets.size() != delayed_ack_sockets->size()) {
  289. delayed_ack_sockets->clear();
  290. if (remaining_sockets.size() > 0)
  291. dbgln("flush_delayed_tcp_acks: {} sockets remaining", remaining_sockets.size());
  292. for (auto&& socket : remaining_sockets)
  293. delayed_ack_sockets->set(move(socket));
  294. }
  295. }
  296. void send_tcp_rst(IPv4Packet const& ipv4_packet, TCPPacket const& tcp_packet, RefPtr<NetworkAdapter> adapter)
  297. {
  298. auto routing_decision = route_to(ipv4_packet.source(), ipv4_packet.destination(), adapter);
  299. if (routing_decision.is_zero())
  300. return;
  301. auto ipv4_payload_offset = routing_decision.adapter->ipv4_payload_offset();
  302. const size_t options_size = 0;
  303. const size_t tcp_header_size = sizeof(TCPPacket) + options_size;
  304. const size_t buffer_size = ipv4_payload_offset + tcp_header_size;
  305. auto packet = routing_decision.adapter->acquire_packet_buffer(buffer_size);
  306. if (!packet)
  307. return;
  308. routing_decision.adapter->fill_in_ipv4_header(*packet, ipv4_packet.destination(),
  309. routing_decision.next_hop, ipv4_packet.source(), IPv4Protocol::TCP,
  310. buffer_size - ipv4_payload_offset, 0, 64);
  311. auto& rst_packet = *(TCPPacket*)(packet->buffer->data() + ipv4_payload_offset);
  312. rst_packet = {};
  313. rst_packet.set_source_port(tcp_packet.destination_port());
  314. rst_packet.set_destination_port(tcp_packet.source_port());
  315. rst_packet.set_window_size(0);
  316. rst_packet.set_sequence_number(0);
  317. rst_packet.set_ack_number(tcp_packet.sequence_number() + 1);
  318. rst_packet.set_data_offset(tcp_header_size / sizeof(u32));
  319. rst_packet.set_flags(TCPFlags::RST | TCPFlags::ACK);
  320. rst_packet.set_checksum(TCPSocket::compute_tcp_checksum(ipv4_packet.source(), ipv4_packet.destination(), rst_packet, 0));
  321. routing_decision.adapter->send_packet(packet->bytes());
  322. routing_decision.adapter->release_packet_buffer(*packet);
  323. }
  324. void handle_tcp(IPv4Packet const& ipv4_packet, Time const& packet_timestamp)
  325. {
  326. if (ipv4_packet.payload_size() < sizeof(TCPPacket)) {
  327. dbgln("handle_tcp: IPv4 payload is too small to be a TCP packet ({}, need {})", ipv4_packet.payload_size(), sizeof(TCPPacket));
  328. return;
  329. }
  330. auto& tcp_packet = *static_cast<TCPPacket const*>(ipv4_packet.payload());
  331. size_t minimum_tcp_header_size = 5 * sizeof(u32);
  332. size_t maximum_tcp_header_size = 15 * sizeof(u32);
  333. if (tcp_packet.header_size() < minimum_tcp_header_size || tcp_packet.header_size() > maximum_tcp_header_size) {
  334. dbgln("handle_tcp: TCP packet header has invalid size {}", tcp_packet.header_size());
  335. }
  336. if (ipv4_packet.payload_size() < tcp_packet.header_size()) {
  337. dbgln("handle_tcp: IPv4 payload is smaller than TCP header claims ({}, supposedly {})", ipv4_packet.payload_size(), tcp_packet.header_size());
  338. return;
  339. }
  340. size_t payload_size = ipv4_packet.payload_size() - tcp_packet.header_size();
  341. dbgln_if(TCP_DEBUG, "handle_tcp: source={}:{}, destination={}:{}, seq_no={}, ack_no={}, flags={:#04x} ({}{}{}{}), window_size={}, payload_size={}",
  342. ipv4_packet.source().to_string(),
  343. tcp_packet.source_port(),
  344. ipv4_packet.destination().to_string(),
  345. tcp_packet.destination_port(),
  346. tcp_packet.sequence_number(),
  347. tcp_packet.ack_number(),
  348. tcp_packet.flags(),
  349. tcp_packet.has_syn() ? "SYN " : "",
  350. tcp_packet.has_ack() ? "ACK " : "",
  351. tcp_packet.has_fin() ? "FIN " : "",
  352. tcp_packet.has_rst() ? "RST " : "",
  353. tcp_packet.window_size(),
  354. payload_size);
  355. auto adapter = NetworkingManagement::the().from_ipv4_address(ipv4_packet.destination());
  356. if (!adapter) {
  357. dbgln("handle_tcp: this packet is not for me, it's for {}", ipv4_packet.destination());
  358. return;
  359. }
  360. IPv4SocketTuple tuple(ipv4_packet.destination(), tcp_packet.destination_port(), ipv4_packet.source(), tcp_packet.source_port());
  361. dbgln_if(TCP_DEBUG, "handle_tcp: looking for socket; tuple={}", tuple.to_string());
  362. auto socket = TCPSocket::from_tuple(tuple);
  363. if (!socket) {
  364. if (!tcp_packet.has_rst()) {
  365. dbgln("handle_tcp: No TCP socket for tuple {}. Sending RST.", tuple.to_string());
  366. send_tcp_rst(ipv4_packet, tcp_packet, adapter);
  367. }
  368. return;
  369. }
  370. MutexLocker locker(socket->mutex());
  371. VERIFY(socket->type() == SOCK_STREAM);
  372. VERIFY(socket->local_port() == tcp_packet.destination_port());
  373. dbgln_if(TCP_DEBUG, "handle_tcp: got socket {}; state={}", socket->tuple().to_string(), TCPSocket::to_string(socket->state()));
  374. socket->receive_tcp_packet(tcp_packet, ipv4_packet.payload_size());
  375. switch (socket->state()) {
  376. case TCPSocket::State::Closed:
  377. dbgln("handle_tcp: unexpected flags in Closed state");
  378. // TODO: we may want to send an RST here, maybe as a configurable option
  379. return;
  380. case TCPSocket::State::TimeWait:
  381. dbgln("handle_tcp: unexpected flags in TimeWait state");
  382. (void)socket->send_tcp_packet(TCPFlags::RST);
  383. socket->set_state(TCPSocket::State::Closed);
  384. return;
  385. case TCPSocket::State::Listen:
  386. switch (tcp_packet.flags()) {
  387. case TCPFlags::SYN: {
  388. dbgln_if(TCP_DEBUG, "handle_tcp: incoming connection");
  389. auto& local_address = ipv4_packet.destination();
  390. auto& peer_address = ipv4_packet.source();
  391. auto client_or_error = socket->try_create_client(local_address, tcp_packet.destination_port(), peer_address, tcp_packet.source_port());
  392. if (client_or_error.is_error()) {
  393. dmesgln("handle_tcp: couldn't create client socket: {}", client_or_error.error());
  394. return;
  395. }
  396. auto client = client_or_error.release_value();
  397. MutexLocker locker(client->mutex());
  398. dbgln_if(TCP_DEBUG, "handle_tcp: created new client socket with tuple {}", client->tuple().to_string());
  399. client->set_sequence_number(1000);
  400. client->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  401. [[maybe_unused]] auto rc2 = client->send_tcp_packet(TCPFlags::SYN | TCPFlags::ACK);
  402. client->set_state(TCPSocket::State::SynReceived);
  403. return;
  404. }
  405. default:
  406. dbgln("handle_tcp: unexpected flags in Listen state ({:x})", tcp_packet.flags());
  407. // socket->send_tcp_packet(TCPFlags::RST);
  408. return;
  409. }
  410. case TCPSocket::State::SynSent:
  411. switch (tcp_packet.flags()) {
  412. case TCPFlags::SYN:
  413. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  414. (void)socket->send_ack(true);
  415. socket->set_state(TCPSocket::State::SynReceived);
  416. return;
  417. case TCPFlags::ACK | TCPFlags::SYN:
  418. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  419. (void)socket->send_ack(true);
  420. socket->set_state(TCPSocket::State::Established);
  421. socket->set_setup_state(Socket::SetupState::Completed);
  422. socket->set_connected(true);
  423. return;
  424. case TCPFlags::ACK | TCPFlags::FIN:
  425. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  426. send_delayed_tcp_ack(socket);
  427. socket->set_state(TCPSocket::State::Closed);
  428. socket->set_error(TCPSocket::Error::FINDuringConnect);
  429. socket->set_setup_state(Socket::SetupState::Completed);
  430. return;
  431. case TCPFlags::ACK | TCPFlags::RST:
  432. socket->set_state(TCPSocket::State::Closed);
  433. socket->set_error(TCPSocket::Error::RSTDuringConnect);
  434. socket->set_setup_state(Socket::SetupState::Completed);
  435. return;
  436. default:
  437. dbgln("handle_tcp: unexpected flags in SynSent state ({:x})", tcp_packet.flags());
  438. (void)socket->send_tcp_packet(TCPFlags::RST);
  439. socket->set_state(TCPSocket::State::Closed);
  440. socket->set_error(TCPSocket::Error::UnexpectedFlagsDuringConnect);
  441. socket->set_setup_state(Socket::SetupState::Completed);
  442. return;
  443. }
  444. case TCPSocket::State::SynReceived:
  445. switch (tcp_packet.flags()) {
  446. case TCPFlags::ACK:
  447. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  448. switch (socket->direction()) {
  449. case TCPSocket::Direction::Incoming:
  450. if (!socket->has_originator()) {
  451. dbgln("handle_tcp: connection doesn't have an originating socket; maybe it went away?");
  452. (void)socket->send_tcp_packet(TCPFlags::RST);
  453. socket->set_state(TCPSocket::State::Closed);
  454. return;
  455. }
  456. socket->set_state(TCPSocket::State::Established);
  457. socket->set_setup_state(Socket::SetupState::Completed);
  458. socket->release_to_originator();
  459. return;
  460. case TCPSocket::Direction::Outgoing:
  461. socket->set_state(TCPSocket::State::Established);
  462. socket->set_setup_state(Socket::SetupState::Completed);
  463. socket->set_connected(true);
  464. return;
  465. default:
  466. dbgln("handle_tcp: got ACK in SynReceived state but direction is invalid ({})", TCPSocket::to_string(socket->direction()));
  467. (void)socket->send_tcp_packet(TCPFlags::RST);
  468. socket->set_state(TCPSocket::State::Closed);
  469. return;
  470. }
  471. VERIFY_NOT_REACHED();
  472. case TCPFlags::SYN:
  473. dbgln("handle_tcp: ignoring SYN for partially established connection");
  474. return;
  475. default:
  476. dbgln("handle_tcp: unexpected flags in SynReceived state ({:x})", tcp_packet.flags());
  477. (void)socket->send_tcp_packet(TCPFlags::RST);
  478. socket->set_state(TCPSocket::State::Closed);
  479. return;
  480. }
  481. case TCPSocket::State::CloseWait:
  482. switch (tcp_packet.flags()) {
  483. default:
  484. dbgln("handle_tcp: unexpected flags in CloseWait state ({:x})", tcp_packet.flags());
  485. (void)socket->send_tcp_packet(TCPFlags::RST);
  486. socket->set_state(TCPSocket::State::Closed);
  487. return;
  488. }
  489. case TCPSocket::State::LastAck:
  490. switch (tcp_packet.flags()) {
  491. case TCPFlags::ACK:
  492. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  493. socket->set_state(TCPSocket::State::Closed);
  494. return;
  495. default:
  496. dbgln("handle_tcp: unexpected flags in LastAck state ({:x})", tcp_packet.flags());
  497. (void)socket->send_tcp_packet(TCPFlags::RST);
  498. socket->set_state(TCPSocket::State::Closed);
  499. return;
  500. }
  501. case TCPSocket::State::FinWait1:
  502. switch (tcp_packet.flags()) {
  503. case TCPFlags::ACK:
  504. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  505. socket->set_state(TCPSocket::State::FinWait2);
  506. return;
  507. case TCPFlags::FIN:
  508. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  509. socket->set_state(TCPSocket::State::Closing);
  510. return;
  511. default:
  512. dbgln("handle_tcp: unexpected flags in FinWait1 state ({:x})", tcp_packet.flags());
  513. (void)socket->send_tcp_packet(TCPFlags::RST);
  514. socket->set_state(TCPSocket::State::Closed);
  515. return;
  516. }
  517. case TCPSocket::State::FinWait2:
  518. switch (tcp_packet.flags()) {
  519. case TCPFlags::FIN:
  520. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  521. socket->set_state(TCPSocket::State::TimeWait);
  522. return;
  523. case TCPFlags::ACK | TCPFlags::RST:
  524. socket->set_state(TCPSocket::State::Closed);
  525. return;
  526. default:
  527. dbgln("handle_tcp: unexpected flags in FinWait2 state ({:x})", tcp_packet.flags());
  528. (void)socket->send_tcp_packet(TCPFlags::RST);
  529. socket->set_state(TCPSocket::State::Closed);
  530. return;
  531. }
  532. case TCPSocket::State::Closing:
  533. switch (tcp_packet.flags()) {
  534. case TCPFlags::ACK:
  535. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  536. socket->set_state(TCPSocket::State::TimeWait);
  537. return;
  538. default:
  539. dbgln("handle_tcp: unexpected flags in Closing state ({:x})", tcp_packet.flags());
  540. (void)socket->send_tcp_packet(TCPFlags::RST);
  541. socket->set_state(TCPSocket::State::Closed);
  542. return;
  543. }
  544. case TCPSocket::State::Established:
  545. if (tcp_packet.has_rst()) {
  546. socket->set_state(TCPSocket::State::Closed);
  547. return;
  548. }
  549. if (tcp_packet.sequence_number() != socket->ack_number()) {
  550. dbgln_if(TCP_DEBUG, "Discarding out of order packet: seq {} vs. ack {}", tcp_packet.sequence_number(), socket->ack_number());
  551. if (socket->duplicate_acks() < TCPSocket::maximum_duplicate_acks) {
  552. dbgln_if(TCP_DEBUG, "Sending ACK with same ack number to trigger fast retransmission");
  553. socket->set_duplicate_acks(socket->duplicate_acks() + 1);
  554. [[maybe_unused]] auto result = socket->send_ack(true);
  555. }
  556. return;
  557. }
  558. socket->set_duplicate_acks(0);
  559. if (tcp_packet.has_fin()) {
  560. if (payload_size != 0)
  561. socket->did_receive(ipv4_packet.source(), tcp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp);
  562. socket->set_ack_number(tcp_packet.sequence_number() + payload_size + 1);
  563. send_delayed_tcp_ack(socket);
  564. socket->set_state(TCPSocket::State::CloseWait);
  565. socket->set_connected(false);
  566. return;
  567. }
  568. if (payload_size) {
  569. if (socket->did_receive(ipv4_packet.source(), tcp_packet.source_port(), { &ipv4_packet, sizeof(IPv4Packet) + ipv4_packet.payload_size() }, packet_timestamp)) {
  570. socket->set_ack_number(tcp_packet.sequence_number() + payload_size);
  571. dbgln_if(TCP_DEBUG, "Got packet with ack_no={}, seq_no={}, payload_size={}, acking it with new ack_no={}, seq_no={}",
  572. tcp_packet.ack_number(), tcp_packet.sequence_number(), payload_size, socket->ack_number(), socket->sequence_number());
  573. send_delayed_tcp_ack(socket);
  574. }
  575. }
  576. }
  577. }
  578. void retransmit_tcp_packets()
  579. {
  580. // We must keep the sockets alive until after we've unlocked the hash table
  581. // in case retransmit_packets() realizes that it wants to close the socket.
  582. NonnullRefPtrVector<TCPSocket, 16> sockets;
  583. TCPSocket::sockets_for_retransmit().for_each_shared([&](const auto& socket) {
  584. sockets.append(socket);
  585. });
  586. for (auto& socket : sockets) {
  587. MutexLocker socket_locker(socket.mutex());
  588. socket.retransmit_packets();
  589. }
  590. }
  591. }