HTMLHyperlinkElementUtils.cpp 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579
  1. /*
  2. * Copyright (c) 2021, Andreas Kling <kling@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/URLParser.h>
  7. #include <LibWeb/DOM/Document.h>
  8. #include <LibWeb/HTML/HTMLHyperlinkElementUtils.h>
  9. #include <LibWeb/Infra/CharacterTypes.h>
  10. #include <LibWeb/Loader/FrameLoader.h>
  11. namespace Web::HTML {
  12. HTMLHyperlinkElementUtils::~HTMLHyperlinkElementUtils() = default;
  13. // https://html.spec.whatwg.org/multipage/links.html#reinitialise-url
  14. void HTMLHyperlinkElementUtils::reinitialize_url() const
  15. {
  16. // 1. If element's url is non-null, its scheme is "blob", and its cannot-be-a-basFe-URL is true, terminate these steps.
  17. if (m_url.has_value() && m_url->scheme() == "blob"sv && m_url->cannot_be_a_base_url())
  18. return;
  19. // 2. Set the url.
  20. const_cast<HTMLHyperlinkElementUtils*>(this)->set_the_url();
  21. }
  22. // https://html.spec.whatwg.org/multipage/links.html#concept-hyperlink-url-set
  23. void HTMLHyperlinkElementUtils::set_the_url()
  24. {
  25. // 1. If this element's href content attribute is absent, set this element's url to null.
  26. auto href_content_attribute = hyperlink_element_utils_href();
  27. if (href_content_attribute.is_null()) {
  28. m_url = {};
  29. return;
  30. }
  31. // 2. Otherwise, parse this element's href content attribute value relative to this element's node document.
  32. // If parsing is successful, set this element's url to the result; otherwise, set this element's url to null.
  33. m_url = hyperlink_element_utils_document().parse_url(href_content_attribute);
  34. }
  35. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-origin
  36. DeprecatedString HTMLHyperlinkElementUtils::origin() const
  37. {
  38. // 1. Reinitialize url.
  39. reinitialize_url();
  40. // 2. If this element's url is null, return the empty string.
  41. if (!m_url.has_value())
  42. return DeprecatedString::empty();
  43. // 3. Return the serialization of this element's url's origin.
  44. return m_url->serialize_origin();
  45. }
  46. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-protocol
  47. DeprecatedString HTMLHyperlinkElementUtils::protocol() const
  48. {
  49. // 1. Reinitialize url.
  50. reinitialize_url();
  51. // 2. If this element's url is null, return ":".
  52. if (!m_url.has_value())
  53. return ":"sv;
  54. // 3. Return this element's url's scheme, followed by ":".
  55. return DeprecatedString::formatted("{}:", m_url->scheme());
  56. }
  57. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-protocol
  58. void HTMLHyperlinkElementUtils::set_protocol(DeprecatedString protocol)
  59. {
  60. // 1. Reinitialize url.
  61. reinitialize_url();
  62. // 2. If this element's url is null, terminate these steps.
  63. if (!m_url.has_value())
  64. return;
  65. // 3. Basic URL parse the given value, followed by ":", with this element's url as url and scheme start state as state override.
  66. auto result_url = URLParser::parse(DeprecatedString::formatted("{}:", protocol), nullptr, m_url, URLParser::State::SchemeStart);
  67. if (result_url.is_valid())
  68. m_url = move(result_url);
  69. // 4. Update href.
  70. update_href();
  71. }
  72. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-username
  73. DeprecatedString HTMLHyperlinkElementUtils::username() const
  74. {
  75. // 1. Reinitialize url.
  76. reinitialize_url();
  77. // 2. If this element's url is null, return the empty string.
  78. if (!m_url.has_value())
  79. return DeprecatedString::empty();
  80. // 3. Return this element's url's username.
  81. return m_url->username();
  82. }
  83. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-username
  84. void HTMLHyperlinkElementUtils::set_username(DeprecatedString username)
  85. {
  86. // 1. Reinitialize url.
  87. reinitialize_url();
  88. // 2. Let url be this element's url.
  89. auto& url = m_url;
  90. // 3. If url is null or url cannot have a username/password/port, then return.
  91. if (!url.has_value() || url->cannot_have_a_username_or_password_or_port())
  92. return;
  93. // 4. Set the username given this’s URL and the given value.
  94. url->set_username(AK::URL::percent_encode(username, AK::URL::PercentEncodeSet::Userinfo));
  95. // 5. Update href.
  96. update_href();
  97. }
  98. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-password
  99. DeprecatedString HTMLHyperlinkElementUtils::password() const
  100. {
  101. // 1. Reinitialize url.
  102. reinitialize_url();
  103. // 2. Let url be this element's url.
  104. auto& url = m_url;
  105. // 3. If url is null, then return the empty string.
  106. if (!url.has_value())
  107. return DeprecatedString::empty();
  108. // 4. Return url's password.
  109. return url->password();
  110. }
  111. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-password
  112. void HTMLHyperlinkElementUtils::set_password(DeprecatedString password)
  113. {
  114. // 1. Reinitialize url.
  115. reinitialize_url();
  116. // 2. Let url be this element's url.
  117. auto& url = m_url;
  118. // 3. If url is null or url cannot have a username/password/port, then return.
  119. if (!url.has_value() || url->cannot_have_a_username_or_password_or_port())
  120. return;
  121. // 4. Set the password, given url and the given value.
  122. url->set_password(move(password));
  123. // 5. Update href.
  124. update_href();
  125. }
  126. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-host
  127. DeprecatedString HTMLHyperlinkElementUtils::host() const
  128. {
  129. // 1. Reinitialize url.
  130. reinitialize_url();
  131. // 2. Let url be this element's url.
  132. auto& url = m_url;
  133. // 3. If url or url's host is null, return the empty string.
  134. if (!url.has_value() || url->host().is_null())
  135. return DeprecatedString::empty();
  136. // 4. If url's port is null, return url's host, serialized.
  137. if (!url->port().has_value())
  138. return url->host();
  139. // 5. Return url's host, serialized, followed by ":" and url's port, serialized.
  140. return DeprecatedString::formatted("{}:{}", url->host(), url->port().value());
  141. }
  142. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-host
  143. void HTMLHyperlinkElementUtils::set_host(DeprecatedString host)
  144. {
  145. // 1. Reinitialize url.
  146. reinitialize_url();
  147. // 2. Let url be this element's url.
  148. auto& url = m_url;
  149. // 3. If url is null or url's cannot-be-a-base-URL is true, then return.
  150. if (!url.has_value() || url->cannot_be_a_base_url())
  151. return;
  152. // 4. Basic URL parse the given value, with url as url and host state as state override.
  153. auto result_url = URLParser::parse(host, nullptr, url, URLParser::State::Host);
  154. if (result_url.is_valid())
  155. m_url = move(result_url);
  156. // 5. Update href.
  157. update_href();
  158. }
  159. DeprecatedString HTMLHyperlinkElementUtils::hostname() const
  160. {
  161. // 1. Reinitialize url.
  162. //
  163. // 2. Let url be this element's url.
  164. //
  165. // 3. If url or url's host is null, return the empty string.
  166. //
  167. // 4. Return url's host, serialized.
  168. return AK::URL(href()).host();
  169. }
  170. void HTMLHyperlinkElementUtils::set_hostname(DeprecatedString hostname)
  171. {
  172. // 1. Reinitialize url.
  173. reinitialize_url();
  174. // 2. Let url be this element's url.
  175. auto& url = m_url;
  176. // 3. If url is null or url's cannot-be-a-base-URL is true, then return.
  177. if (!url.has_value() || url->cannot_be_a_base_url())
  178. return;
  179. // 4. Basic URL parse the given value, with url as url and hostname state as state override.
  180. auto result_url = URLParser::parse(hostname, nullptr, m_url, URLParser::State::Hostname);
  181. if (result_url.is_valid())
  182. m_url = move(result_url);
  183. // 5. Update href.
  184. update_href();
  185. }
  186. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-port
  187. DeprecatedString HTMLHyperlinkElementUtils::port() const
  188. {
  189. // 1. Reinitialize url.
  190. reinitialize_url();
  191. // 2. Let url be this element's url.
  192. auto& url = m_url;
  193. // 3. If url or url's port is null, return the empty string.
  194. if (!url.has_value() || !url->port().has_value())
  195. return DeprecatedString::empty();
  196. // 4. Return url's port, serialized.
  197. return DeprecatedString::number(url->port().value());
  198. }
  199. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-port
  200. void HTMLHyperlinkElementUtils::set_port(DeprecatedString port)
  201. {
  202. // 1. Reinitialize url.
  203. reinitialize_url();
  204. // 2. Let url be this element's url.
  205. // 3. If url is null or url cannot have a username/password/port, then return.
  206. if (!m_url.has_value() || m_url->cannot_have_a_username_or_password_or_port())
  207. return;
  208. // 4. If the given value is the empty string, then set url's port to null.
  209. if (port.is_empty()) {
  210. m_url->set_port({});
  211. } else {
  212. // 5. Otherwise, basic URL parse the given value, with url as url and port state as state override.
  213. auto result_url = URLParser::parse(port, nullptr, m_url, URLParser::State::Port);
  214. if (result_url.is_valid())
  215. m_url = move(result_url);
  216. }
  217. // 6. Update href.
  218. update_href();
  219. }
  220. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-pathname
  221. DeprecatedString HTMLHyperlinkElementUtils::pathname() const
  222. {
  223. // 1. Reinitialize url.
  224. reinitialize_url();
  225. // 2. Let url be this element's url.
  226. // 3. If url is null, return the empty string.
  227. if (!m_url.has_value())
  228. return DeprecatedString::empty();
  229. // 4. If url's cannot-be-a-base-URL is true, then return url's path[0].
  230. // 5. If url's path is empty, then return the empty string.
  231. // 6. Return "/", followed by the strings in url's path (including empty strings), separated from each other by "/".
  232. return m_url->path();
  233. }
  234. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-pathname
  235. void HTMLHyperlinkElementUtils::set_pathname(DeprecatedString pathname)
  236. {
  237. // 1. Reinitialize url.
  238. reinitialize_url();
  239. // 2. Let url be this element's url.
  240. // 3. If url is null or url's cannot-be-a-base-URL is true, then return.
  241. if (!m_url.has_value() || m_url->cannot_be_a_base_url())
  242. return;
  243. // 4. Set url's path to the empty list.
  244. auto url = m_url; // We copy the URL here to follow other browser's behaviour of reverting the path change if the parse failed.
  245. url->set_paths({});
  246. // 5. Basic URL parse the given value, with url as url and path start state as state override.
  247. auto result_url = URLParser::parse(pathname, nullptr, move(url), URLParser::State::PathStart);
  248. if (result_url.is_valid())
  249. m_url = move(result_url);
  250. // 6. Update href.
  251. update_href();
  252. }
  253. DeprecatedString HTMLHyperlinkElementUtils::search() const
  254. {
  255. // 1. Reinitialize url.
  256. reinitialize_url();
  257. // 2. Let url be this element's url.
  258. // 3. If url is null, or url's query is either null or the empty string, return the empty string.
  259. if (!m_url.has_value() || m_url->query().is_null() || m_url->query().is_empty())
  260. return DeprecatedString::empty();
  261. // 4. Return "?", followed by url's query.
  262. return DeprecatedString::formatted("?{}", m_url->query());
  263. }
  264. void HTMLHyperlinkElementUtils::set_search(DeprecatedString search)
  265. {
  266. // 1. Reinitialize url.
  267. reinitialize_url();
  268. // 2. Let url be this element's url.
  269. // 3. If url is null, terminate these steps.
  270. if (!m_url.has_value())
  271. return;
  272. // 4. If the given value is the empty string, set url's query to null.
  273. if (search.is_empty()) {
  274. m_url->set_query({});
  275. } else {
  276. // 5. Otherwise:
  277. // 1. Let input be the given value with a single leading "?" removed, if any.
  278. auto input = search.substring_view(search.starts_with('?'));
  279. // 2. Set url's query to the empty string.
  280. auto url_copy = m_url; // We copy the URL here to follow other browser's behaviour of reverting the search change if the parse failed.
  281. url_copy->set_query(DeprecatedString::empty());
  282. // 3. Basic URL parse input, with null, this element's node document's document's character encoding, url as url, and query state as state override.
  283. auto result_url = URLParser::parse(input, nullptr, move(url_copy), URLParser::State::Query);
  284. if (result_url.is_valid())
  285. m_url = move(result_url);
  286. }
  287. // 6. Update href.
  288. update_href();
  289. }
  290. DeprecatedString HTMLHyperlinkElementUtils::hash() const
  291. {
  292. // 1. Reinitialize url.
  293. reinitialize_url();
  294. // 2. Let url be this element's url.
  295. // 3. If url is null, or url's fragment is either null or the empty string, return the empty string.
  296. if (!m_url.has_value() || m_url->fragment().is_null() || m_url->fragment().is_empty())
  297. return DeprecatedString::empty();
  298. // 4. Return "#", followed by url's fragment.
  299. return DeprecatedString::formatted("#{}", m_url->fragment());
  300. }
  301. void HTMLHyperlinkElementUtils::set_hash(DeprecatedString hash)
  302. {
  303. // 1. Reinitialize url.
  304. reinitialize_url();
  305. // 2. Let url be this element's url.
  306. // 3. If url is null, then return.
  307. if (!m_url.has_value())
  308. return;
  309. // 4. If the given value is the empty string, set url's fragment to null.
  310. if (hash.is_empty()) {
  311. m_url->set_fragment({});
  312. } else {
  313. // 5. Otherwise:
  314. // 1. Let input be the given value with a single leading "#" removed, if any.
  315. auto input = hash.substring_view(hash.starts_with('#'));
  316. // 2. Set url's fragment to the empty string.
  317. auto url_copy = m_url; // We copy the URL here to follow other browser's behaviour of reverting the hash change if the parse failed.
  318. url_copy->set_fragment(DeprecatedString::empty());
  319. // 3. Basic URL parse input, with url as url and fragment state as state override.
  320. auto result_url = URLParser::parse(input, nullptr, move(url_copy), URLParser::State::Fragment);
  321. if (result_url.is_valid())
  322. m_url = move(result_url);
  323. }
  324. // 6. Update href.
  325. update_href();
  326. }
  327. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-href
  328. DeprecatedString HTMLHyperlinkElementUtils::href() const
  329. {
  330. // 1. Reinitialize url.
  331. reinitialize_url();
  332. // 2. Let url be this element's url.
  333. auto& url = m_url;
  334. // 3. If url is null and this element has no href content attribute, return the empty string.
  335. auto href_content_attribute = hyperlink_element_utils_href();
  336. if (!url.has_value() && href_content_attribute.is_null())
  337. return DeprecatedString::empty();
  338. // 4. Otherwise, if url is null, return this element's href content attribute's value.
  339. if (!url->is_valid())
  340. return href_content_attribute;
  341. // 5. Return url, serialized.
  342. return url->serialize();
  343. }
  344. // https://html.spec.whatwg.org/multipage/links.html#dom-hyperlink-href
  345. void HTMLHyperlinkElementUtils::set_href(DeprecatedString href)
  346. {
  347. // The href attribute's setter must set this element's href content attribute's value to the given value.
  348. set_hyperlink_element_utils_href(move(href));
  349. }
  350. // https://html.spec.whatwg.org/multipage/links.html#update-href
  351. void HTMLHyperlinkElementUtils::update_href()
  352. {
  353. // To update href, set the element's href content attribute's value to the element's url, serialized.
  354. }
  355. bool HTMLHyperlinkElementUtils::cannot_navigate() const
  356. {
  357. // An element element cannot navigate if one of the following is true:
  358. // 1. element's node document is not fully active
  359. auto const& document = const_cast<HTMLHyperlinkElementUtils*>(this)->hyperlink_element_utils_document();
  360. if (!document.is_fully_active())
  361. return true;
  362. // 2. element is not an a element and is not connected.
  363. if (!hyperlink_element_utils_is_html_anchor_element() && !hyperlink_element_utils_is_connected())
  364. return true;
  365. return false;
  366. }
  367. // https://html.spec.whatwg.org/multipage/links.html#following-hyperlinks-2
  368. void HTMLHyperlinkElementUtils::follow_the_hyperlink(Optional<DeprecatedString> hyperlink_suffix)
  369. {
  370. // To follow the hyperlink created by an element subject, given an optional hyperlinkSuffix (default null):
  371. // 1. If subject cannot navigate, then return.
  372. if (cannot_navigate())
  373. return;
  374. // FIXME: 2. Let replace be false.
  375. // 3. Let source be subject's node document's browsing context.
  376. auto* source = hyperlink_element_utils_document().browsing_context();
  377. if (!source)
  378. return;
  379. // 4. Let targetAttributeValue be the empty string.
  380. // 5. If subject is an a or area element, then set targetAttributeValue to
  381. // the result of getting an element's target given subject.
  382. DeprecatedString target_attribute_value = get_an_elements_target();
  383. // 6. Let noopener be the result of getting an element's noopener with subject and targetAttributeValue.
  384. bool noopener = get_an_elements_noopener(target_attribute_value);
  385. // 7. Let target be the first return value of applying the rules for
  386. // choosing a browsing context given targetAttributeValue, source, and
  387. // noopener.
  388. auto target = source->choose_a_browsing_context(target_attribute_value, noopener).browsing_context;
  389. // 8. If target is null, then return.
  390. if (!target)
  391. return;
  392. // 9. Parse a URL given subject's href attribute, relative to subject's node
  393. // document.
  394. auto url = source->active_document()->parse_url(href());
  395. // 10. If that is successful, let URL be the resulting URL string.
  396. auto url_string = url.to_deprecated_string();
  397. // 11. Otherwise, if parsing the URL failed, the user agent may report the
  398. // error to the user in a user-agent-specific manner, may queue an element
  399. // task on the DOM manipulation task source given subject to navigate the
  400. // target browsing context to an error page to report the error, or may
  401. // ignore the error and do nothing. In any case, the user agent must then
  402. // return.
  403. // 12. If hyperlinkSuffix is non-null, then append it to URL.
  404. if (hyperlink_suffix.has_value()) {
  405. StringBuilder url_builder;
  406. url_builder.append(url_string);
  407. url_builder.append(*hyperlink_suffix);
  408. url_string = url_builder.to_deprecated_string();
  409. }
  410. // FIXME: 13. Let request be a new request whose URL is URL and whose
  411. // referrer policy is the current state of subject's referrerpolicy content
  412. // attribute.
  413. // FIXME: 14. If subject's link types includes the noreferrer keyword, then
  414. // set request's referrer to "no-referrer".
  415. // 15. Queue an element task on the DOM manipulation task source given
  416. // subject to navigate target to request with the source browsing context
  417. // set to source.
  418. // FIXME: "navigate" means implementing the navigation algorithm here:
  419. // https://html.spec.whatwg.org/multipage/browsing-the-web.html#navigate
  420. hyperlink_element_utils_queue_an_element_task(Task::Source::DOMManipulation, [url_string, target] {
  421. target->loader().load(url_string, FrameLoader::Type::Navigation);
  422. });
  423. }
  424. DeprecatedString HTMLHyperlinkElementUtils::get_an_elements_target() const
  425. {
  426. // To get an element's target, given an a, area, or form element element, run these steps:
  427. // 1. If element has a target attribute, then return that attribute's value.
  428. if (auto target = hyperlink_element_utils_target(); !target.is_empty())
  429. return target;
  430. // FIXME: 2. If element's node document contains a base element with a
  431. // target attribute, then return the value of the target attribute of the
  432. // first such base element.
  433. // 3. Return the empty string.
  434. return "";
  435. }
  436. // https://html.spec.whatwg.org/multipage/links.html#get-an-element's-noopener
  437. bool HTMLHyperlinkElementUtils::get_an_elements_noopener(StringView target) const
  438. {
  439. // To get an element's noopener, given an a, area, or form element element and a string target:
  440. auto rel = hyperlink_element_utils_rel().to_lowercase();
  441. auto link_types = rel.view().split_view_if(Infra::is_ascii_whitespace);
  442. // 1. If element's link types include the noopener or noreferrer keyword, then return true.
  443. if (link_types.contains_slow("noopener"sv) || link_types.contains_slow("noreferrer"sv))
  444. return true;
  445. // 2. If element's link types do not include the opener keyword and
  446. // target is an ASCII case-insensitive match for "_blank", then return true.
  447. if (!link_types.contains_slow("opener"sv) && target.equals_ignoring_case("_blank"sv))
  448. return true;
  449. // 3. Return false.
  450. return false;
  451. }
  452. }