123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472 |
- /*
- * Copyright (c) 2018-2021, Andreas Kling <kling@serenityos.org>
- * Copyright (c) 2022, Tobias Christiansen <tobyase@serenityos.org>
- *
- * SPDX-License-Identifier: BSD-2-Clause
- */
- #include <AK/CharacterTypes.h>
- #include <AK/StringBuilder.h>
- #include <LibUnicode/CharacterTypes.h>
- #include <LibWeb/DOM/Document.h>
- #include <LibWeb/Layout/BlockContainer.h>
- #include <LibWeb/Layout/InlineFormattingContext.h>
- #include <LibWeb/Layout/TextNode.h>
- #include <LibWeb/Painting/TextPaintable.h>
- namespace Web::Layout {
- TextNode::TextNode(DOM::Document& document, DOM::Text& text)
- : Node(document, &text)
- {
- }
- TextNode::~TextNode() = default;
- static bool is_all_whitespace(StringView string)
- {
- for (size_t i = 0; i < string.length(); ++i) {
- if (!is_ascii_space(string[i]))
- return false;
- }
- return true;
- }
- // https://w3c.github.io/mathml-core/#new-text-transform-values
- static String apply_math_auto_text_transform(String const& string)
- {
- // https://w3c.github.io/mathml-core/#italic-mappings
- auto map_code_point_to_italic = [](u32 code_point) -> u32 {
- switch (code_point) {
- case 0x0041:
- return 0x1D434;
- case 0x0042:
- return 0x1D435;
- case 0x0043:
- return 0x1D436;
- case 0x0044:
- return 0x1D437;
- case 0x0045:
- return 0x1D438;
- case 0x0046:
- return 0x1D439;
- case 0x0047:
- return 0x1D43A;
- case 0x0048:
- return 0x1D43B;
- case 0x0049:
- return 0x1D43C;
- case 0x004A:
- return 0x1D43D;
- case 0x004B:
- return 0x1D43E;
- case 0x004C:
- return 0x1D43F;
- case 0x004D:
- return 0x1D440;
- case 0x004E:
- return 0x1D441;
- case 0x004F:
- return 0x1D442;
- case 0x0050:
- return 0x1D443;
- case 0x0051:
- return 0x1D444;
- case 0x0052:
- return 0x1D445;
- case 0x0053:
- return 0x1D446;
- case 0x0054:
- return 0x1D447;
- case 0x0055:
- return 0x1D448;
- case 0x0056:
- return 0x1D449;
- case 0x0057:
- return 0x1D44A;
- case 0x0058:
- return 0x1D44B;
- case 0x0059:
- return 0x1D44C;
- case 0x005A:
- return 0x1D44D;
- case 0x0061:
- return 0x1D44E;
- case 0x0062:
- return 0x1D44F;
- case 0x0063:
- return 0x1D450;
- case 0x0064:
- return 0x1D451;
- case 0x0065:
- return 0x1D452;
- case 0x0066:
- return 0x1D453;
- case 0x0067:
- return 0x1D454;
- case 0x0068:
- return 0x0210E;
- case 0x0069:
- return 0x1D456;
- case 0x006A:
- return 0x1D457;
- case 0x006B:
- return 0x1D458;
- case 0x006C:
- return 0x1D459;
- case 0x006D:
- return 0x1D45A;
- case 0x006E:
- return 0x1D45B;
- case 0x006F:
- return 0x1D45C;
- case 0x0070:
- return 0x1D45D;
- case 0x0071:
- return 0x1D45E;
- case 0x0072:
- return 0x1D45F;
- case 0x0073:
- return 0x1D460;
- case 0x0074:
- return 0x1D461;
- case 0x0075:
- return 0x1D462;
- case 0x0076:
- return 0x1D463;
- case 0x0077:
- return 0x1D464;
- case 0x0078:
- return 0x1D465;
- case 0x0079:
- return 0x1D466;
- case 0x007A:
- return 0x1D467;
- case 0x0131:
- return 0x1D6A4;
- case 0x0237:
- return 0x1D6A5;
- case 0x0391:
- return 0x1D6E2;
- case 0x0392:
- return 0x1D6E3;
- case 0x0393:
- return 0x1D6E4;
- case 0x0394:
- return 0x1D6E5;
- case 0x0395:
- return 0x1D6E6;
- case 0x0396:
- return 0x1D6E7;
- case 0x0397:
- return 0x1D6E8;
- case 0x0398:
- return 0x1D6E9;
- case 0x0399:
- return 0x1D6EA;
- case 0x039A:
- return 0x1D6EB;
- case 0x039B:
- return 0x1D6EC;
- case 0x039C:
- return 0x1D6ED;
- case 0x039D:
- return 0x1D6EE;
- case 0x039E:
- return 0x1D6EF;
- case 0x039F:
- return 0x1D6F0;
- case 0x03A0:
- return 0x1D6F1;
- case 0x03A1:
- return 0x1D6F2;
- case 0x03F4:
- return 0x1D6F3;
- case 0x03A3:
- return 0x1D6F4;
- case 0x03A4:
- return 0x1D6F5;
- case 0x03A5:
- return 0x1D6F6;
- case 0x03A6:
- return 0x1D6F7;
- case 0x03A7:
- return 0x1D6F8;
- case 0x03A8:
- return 0x1D6F9;
- case 0x03A9:
- return 0x1D6FA;
- case 0x2207:
- return 0x1D6FB;
- case 0x03B1:
- return 0x1D6FC;
- case 0x03B2:
- return 0x1D6FD;
- case 0x03B3:
- return 0x1D6FE;
- case 0x03B4:
- return 0x1D6FF;
- case 0x03B5:
- return 0x1D700;
- case 0x03B6:
- return 0x1D701;
- case 0x03B7:
- return 0x1D702;
- case 0x03B8:
- return 0x1D703;
- case 0x03B9:
- return 0x1D704;
- case 0x03BA:
- return 0x1D705;
- case 0x03BB:
- return 0x1D706;
- case 0x03BC:
- return 0x1D707;
- case 0x03BD:
- return 0x1D708;
- case 0x03BE:
- return 0x1D709;
- case 0x03BF:
- return 0x1D70A;
- case 0x03C0:
- return 0x1D70B;
- case 0x03C1:
- return 0x1D70C;
- case 0x03C2:
- return 0x1D70D;
- case 0x03C3:
- return 0x1D70E;
- case 0x03C4:
- return 0x1D70F;
- case 0x03C5:
- return 0x1D710;
- case 0x03C6:
- return 0x1D711;
- case 0x03C7:
- return 0x1D712;
- case 0x03C8:
- return 0x1D713;
- case 0x03C9:
- return 0x1D714;
- case 0x2202:
- return 0x1D715;
- case 0x03F5:
- return 0x1D716;
- case 0x03D1:
- return 0x1D717;
- case 0x03F0:
- return 0x1D718;
- case 0x03D5:
- return 0x1D719;
- case 0x03F1:
- return 0x1D71A;
- case 0x03D6:
- return 0x1D71B;
- default:
- return code_point;
- }
- };
- StringBuilder builder(string.bytes().size());
- for (auto code_point : string.code_points())
- builder.append_code_point(map_code_point_to_italic(code_point));
- return MUST(builder.to_string());
- }
- static ErrorOr<String> apply_text_transform(String const& string, CSS::TextTransform text_transform)
- {
- switch (text_transform) {
- case CSS::TextTransform::Uppercase:
- return string.to_uppercase();
- case CSS::TextTransform::Lowercase:
- return string.to_lowercase();
- case CSS::TextTransform::None:
- return string;
- case CSS::TextTransform::MathAuto:
- return apply_math_auto_text_transform(string);
- case CSS::TextTransform::Capitalize: {
- return string.to_titlecase({}, TrailingCodePointTransformation::PreserveExisting);
- }
- case CSS::TextTransform::FullSizeKana:
- case CSS::TextTransform::FullWidth:
- // FIXME: Implement these!
- return string;
- }
- VERIFY_NOT_REACHED();
- }
- void TextNode::invalidate_text_for_rendering()
- {
- m_text_for_rendering = {};
- }
- String const& TextNode::text_for_rendering() const
- {
- if (!m_text_for_rendering.has_value())
- const_cast<TextNode*>(this)->compute_text_for_rendering();
- return *m_text_for_rendering;
- }
- // NOTE: This collapses whitespace into a single ASCII space if the CSS white-space property tells us to.
- void TextNode::compute_text_for_rendering()
- {
- bool collapse = [](CSS::WhiteSpace white_space) {
- switch (white_space) {
- case CSS::WhiteSpace::Normal:
- case CSS::WhiteSpace::Nowrap:
- case CSS::WhiteSpace::PreLine:
- return true;
- case CSS::WhiteSpace::Pre:
- case CSS::WhiteSpace::PreWrap:
- return false;
- }
- VERIFY_NOT_REACHED();
- }(computed_values().white_space());
- if (dom_node().is_editable() && !dom_node().is_uninteresting_whitespace_node())
- collapse = false;
- auto data = apply_text_transform(dom_node().data(), computed_values().text_transform()).release_value_but_fixme_should_propagate_errors();
- auto data_view = data.bytes_as_string_view();
- if (dom_node().is_password_input()) {
- m_text_for_rendering = MUST(String::repeated('*', data_view.length()));
- return;
- }
- if (!collapse || data.is_empty()) {
- m_text_for_rendering = data;
- return;
- }
- // NOTE: A couple fast returns to avoid unnecessarily allocating a StringBuilder.
- if (data_view.length() == 1) {
- if (is_ascii_space(data_view[0])) {
- static String s_single_space_string = " "_string;
- m_text_for_rendering = s_single_space_string;
- } else {
- m_text_for_rendering = data;
- }
- return;
- }
- bool contains_space = false;
- for (auto c : data_view) {
- if (is_ascii_space(c)) {
- contains_space = true;
- break;
- }
- }
- if (!contains_space) {
- m_text_for_rendering = data;
- return;
- }
- StringBuilder builder(data_view.length());
- size_t index = 0;
- auto skip_over_whitespace = [&index, &data_view] {
- while (index < data_view.length() && is_ascii_space(data_view[index]))
- ++index;
- };
- while (index < data_view.length()) {
- if (is_ascii_space(data_view[index])) {
- builder.append(' ');
- ++index;
- skip_over_whitespace();
- } else {
- builder.append(data_view[index]);
- ++index;
- }
- }
- m_text_for_rendering = MUST(builder.to_string());
- }
- TextNode::ChunkIterator::ChunkIterator(StringView text, bool wrap_lines, bool respect_linebreaks)
- : m_wrap_lines(wrap_lines)
- , m_respect_linebreaks(respect_linebreaks)
- , m_utf8_view(text)
- , m_iterator(m_utf8_view.begin())
- {
- }
- Optional<TextNode::Chunk> TextNode::ChunkIterator::next()
- {
- if (m_iterator == m_utf8_view.end())
- return {};
- auto start_of_chunk = m_iterator;
- while (m_iterator != m_utf8_view.end()) {
- if (m_respect_linebreaks && *m_iterator == '\n') {
- // Newline encountered, and we're supposed to preserve them.
- // If we have accumulated some code points in the current chunk, commit them now and continue with the newline next time.
- if (auto result = try_commit_chunk(start_of_chunk, m_iterator, false); result.has_value())
- return result.release_value();
- // Otherwise, commit the newline!
- ++m_iterator;
- auto result = try_commit_chunk(start_of_chunk, m_iterator, true);
- VERIFY(result.has_value());
- return result.release_value();
- }
- if (m_wrap_lines) {
- if (is_ascii_space(*m_iterator)) {
- // Whitespace encountered, and we're allowed to break on whitespace.
- // If we have accumulated some code points in the current chunk, commit them now and continue with the whitespace next time.
- if (auto result = try_commit_chunk(start_of_chunk, m_iterator, false); result.has_value())
- return result.release_value();
- // Otherwise, commit the whitespace!
- ++m_iterator;
- if (auto result = try_commit_chunk(start_of_chunk, m_iterator, false); result.has_value())
- return result.release_value();
- continue;
- }
- }
- ++m_iterator;
- }
- if (start_of_chunk != m_utf8_view.end()) {
- // Try to output whatever's left at the end of the text node.
- if (auto result = try_commit_chunk(start_of_chunk, m_utf8_view.end(), false); result.has_value())
- return result.release_value();
- }
- return {};
- }
- Optional<TextNode::Chunk> TextNode::ChunkIterator::try_commit_chunk(Utf8View::Iterator const& start, Utf8View::Iterator const& end, bool has_breaking_newline) const
- {
- auto byte_offset = m_utf8_view.byte_offset_of(start);
- auto byte_length = m_utf8_view.byte_offset_of(end) - byte_offset;
- if (byte_length > 0) {
- auto chunk_view = m_utf8_view.substring_view(byte_offset, byte_length);
- return Chunk {
- .view = chunk_view,
- .start = byte_offset,
- .length = byte_length,
- .has_breaking_newline = has_breaking_newline,
- .is_all_whitespace = is_all_whitespace(chunk_view.as_string()),
- };
- }
- return {};
- }
- JS::GCPtr<Painting::Paintable> TextNode::create_paintable() const
- {
- return Painting::TextPaintable::create(*this);
- }
- }
|