ResourceLoader.cpp 7.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220
  1. /*
  2. * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/Base64.h>
  7. #include <AK/Debug.h>
  8. #include <AK/JsonObject.h>
  9. #include <LibCore/EventLoop.h>
  10. #include <LibCore/File.h>
  11. #include <LibProtocol/Request.h>
  12. #include <LibProtocol/RequestClient.h>
  13. #include <LibWeb/Loader/ContentFilter.h>
  14. #include <LibWeb/Loader/LoadRequest.h>
  15. #include <LibWeb/Loader/Resource.h>
  16. #include <LibWeb/Loader/ResourceLoader.h>
  17. namespace Web {
  18. ResourceLoader& ResourceLoader::the()
  19. {
  20. static ResourceLoader* s_the;
  21. if (!s_the)
  22. s_the = &ResourceLoader::construct().leak_ref();
  23. return *s_the;
  24. }
  25. ResourceLoader::ResourceLoader()
  26. : m_protocol_client(Protocol::RequestClient::construct())
  27. , m_user_agent(default_user_agent)
  28. {
  29. }
  30. void ResourceLoader::load_sync(const LoadRequest& request, Function<void(ReadonlyBytes, const HashMap<String, String, CaseInsensitiveStringTraits>& response_headers, Optional<u32> status_code)> success_callback, Function<void(const String&, Optional<u32> status_code)> error_callback)
  31. {
  32. Core::EventLoop loop;
  33. load(
  34. request,
  35. [&](auto data, auto& response_headers, auto status_code) {
  36. success_callback(data, response_headers, status_code);
  37. loop.quit(0);
  38. },
  39. [&](auto& string, auto status_code) {
  40. if (error_callback)
  41. error_callback(string, status_code);
  42. loop.quit(0);
  43. });
  44. loop.exec();
  45. }
  46. static HashMap<LoadRequest, NonnullRefPtr<Resource>> s_resource_cache;
  47. RefPtr<Resource> ResourceLoader::load_resource(Resource::Type type, const LoadRequest& request)
  48. {
  49. if (!request.is_valid())
  50. return nullptr;
  51. bool use_cache = request.url().protocol() != "file";
  52. if (use_cache) {
  53. auto it = s_resource_cache.find(request);
  54. if (it != s_resource_cache.end()) {
  55. if (it->value->type() != type) {
  56. dbgln("FIXME: Not using cached resource for {} since there's a type mismatch.", request.url());
  57. } else {
  58. dbgln_if(CACHE_DEBUG, "Reusing cached resource for: {}", request.url());
  59. return it->value;
  60. }
  61. }
  62. }
  63. auto resource = Resource::create({}, type, request);
  64. if (use_cache)
  65. s_resource_cache.set(request, resource);
  66. load(
  67. request,
  68. [=](auto data, auto& headers, auto status_code) {
  69. const_cast<Resource&>(*resource).did_load({}, data, headers, status_code);
  70. },
  71. [=](auto& error, auto status_code) {
  72. const_cast<Resource&>(*resource).did_fail({}, error, status_code);
  73. });
  74. return resource;
  75. }
  76. void ResourceLoader::load(const LoadRequest& request, Function<void(ReadonlyBytes, const HashMap<String, String, CaseInsensitiveStringTraits>& response_headers, Optional<u32> status_code)> success_callback, Function<void(const String&, Optional<u32> status_code)> error_callback)
  77. {
  78. auto& url = request.url();
  79. if (is_port_blocked(url.port())) {
  80. dbgln("ResourceLoader::load: Error: blocked port {} from URL {}", url.port(), url);
  81. return;
  82. }
  83. if (ContentFilter::the().is_filtered(url)) {
  84. dbgln("\033[32;1mResourceLoader::load: URL was filtered! {}\033[0m", url);
  85. error_callback("URL was filtered", {});
  86. return;
  87. }
  88. if (url.protocol() == "about") {
  89. dbgln_if(SPAM_DEBUG, "Loading about: URL {}", url);
  90. deferred_invoke([success_callback = move(success_callback)] {
  91. success_callback(String::empty().to_byte_buffer(), {}, {});
  92. });
  93. return;
  94. }
  95. if (url.protocol() == "data") {
  96. dbgln_if(SPAM_DEBUG, "ResourceLoader loading a data URL with mime-type: '{}', base64={}, payload='{}'",
  97. url.data_mime_type(),
  98. url.data_payload_is_base64(),
  99. url.data_payload());
  100. ByteBuffer data;
  101. if (url.data_payload_is_base64())
  102. data = decode_base64(url.data_payload());
  103. else
  104. data = url.data_payload().to_byte_buffer();
  105. deferred_invoke([data = move(data), success_callback = move(success_callback)] {
  106. success_callback(data, {}, {});
  107. });
  108. return;
  109. }
  110. if (url.protocol() == "file") {
  111. auto f = Core::File::construct();
  112. f->set_filename(url.path());
  113. if (!f->open(Core::OpenMode::ReadOnly)) {
  114. dbgln("ResourceLoader::load: Error: {}", f->error_string());
  115. if (error_callback)
  116. error_callback(f->error_string(), {});
  117. return;
  118. }
  119. auto data = f->read_all();
  120. deferred_invoke([data = move(data), success_callback = move(success_callback)] {
  121. success_callback(data, {}, {});
  122. });
  123. return;
  124. }
  125. if (url.protocol() == "http" || url.protocol() == "https" || url.protocol() == "gemini") {
  126. HashMap<String, String> headers;
  127. headers.set("User-Agent", m_user_agent);
  128. headers.set("Accept-Encoding", "gzip, deflate");
  129. for (auto& it : request.headers()) {
  130. headers.set(it.key, it.value);
  131. }
  132. auto protocol_request = protocol_client().start_request(request.method(), url, headers, request.body());
  133. if (!protocol_request) {
  134. if (error_callback)
  135. error_callback("Failed to initiate load", {});
  136. return;
  137. }
  138. protocol_request->on_buffered_request_finish = [this, success_callback = move(success_callback), error_callback = move(error_callback), protocol_request](bool success, auto, auto& response_headers, auto status_code, ReadonlyBytes payload) {
  139. --m_pending_loads;
  140. if (on_load_counter_change)
  141. on_load_counter_change();
  142. if (!success) {
  143. if (error_callback)
  144. error_callback("HTTP load failed", {});
  145. return;
  146. }
  147. deferred_invoke([protocol_request] {
  148. // Clear circular reference of `protocol_request` captured by copy
  149. const_cast<Protocol::Request&>(*protocol_request).on_buffered_request_finish = nullptr;
  150. });
  151. success_callback(payload, response_headers, status_code);
  152. };
  153. protocol_request->set_should_buffer_all_input(true);
  154. protocol_request->on_certificate_requested = []() -> Protocol::Request::CertificateAndKey {
  155. return {};
  156. };
  157. ++m_pending_loads;
  158. if (on_load_counter_change)
  159. on_load_counter_change();
  160. return;
  161. }
  162. if (error_callback)
  163. error_callback(String::formatted("Protocol not implemented: {}", url.protocol()), {});
  164. }
  165. void ResourceLoader::load(const URL& url, Function<void(ReadonlyBytes, const HashMap<String, String, CaseInsensitiveStringTraits>& response_headers, Optional<u32> status_code)> success_callback, Function<void(const String&, Optional<u32> status_code)> error_callback)
  166. {
  167. LoadRequest request;
  168. request.set_url(url);
  169. load(request, move(success_callback), move(error_callback));
  170. }
  171. bool ResourceLoader::is_port_blocked(int port)
  172. {
  173. int ports[] { 1, 7, 9, 11, 13, 15, 17, 19, 20, 21, 22, 23, 25, 37, 42,
  174. 43, 53, 77, 79, 87, 95, 101, 102, 103, 104, 109, 110, 111, 113,
  175. 115, 117, 119, 123, 135, 139, 143, 179, 389, 465, 512, 513, 514,
  176. 515, 526, 530, 531, 532, 540, 556, 563, 587, 601, 636, 993, 995,
  177. 2049, 3659, 4045, 6000, 6379, 6665, 6666, 6667, 6668, 6669, 9000 };
  178. for (auto blocked_port : ports)
  179. if (port == blocked_port)
  180. return true;
  181. return false;
  182. }
  183. void ResourceLoader::clear_cache()
  184. {
  185. dbgln_if(CACHE_DEBUG, "Clearing {} items from ResourceLoader cache", s_resource_cache.size());
  186. s_resource_cache.clear();
  187. }
  188. }