/* * Copyright (c) 2023, Tim Flynn * * SPDX-License-Identifier: BSD-2-Clause */ #include #include #include #include #include #include #include #include namespace AK { struct FlyStringTableHashTraits : public Traits { static u32 hash(Detail::StringData const* string) { return string->hash(); } static bool equals(Detail::StringData const* a, Detail::StringData const* b) { return *a == *b; } }; static auto& all_fly_strings() { static Singleton> table; return *table; } ErrorOr FlyString::from_utf8(StringView string) { if (string.is_empty()) return FlyString {}; if (string.length() <= Detail::MAX_SHORT_STRING_BYTE_COUNT) return FlyString { TRY(String::from_utf8(string)) }; if (auto it = all_fly_strings().find(string.hash(), [&](auto& entry) { return entry->bytes_as_string_view() == string; }); it != all_fly_strings().end()) return FlyString { Detail::StringBase(**it) }; return FlyString { TRY(String::from_utf8(string)) }; } FlyString FlyString::from_utf8_without_validation(ReadonlyBytes string) { if (string.is_empty()) return FlyString {}; if (string.size() <= Detail::MAX_SHORT_STRING_BYTE_COUNT) return FlyString { String::from_utf8_without_validation(string) }; if (auto it = all_fly_strings().find(StringView(string).hash(), [&](auto& entry) { return entry->bytes_as_string_view() == string; }); it != all_fly_strings().end()) return FlyString { Detail::StringBase(**it) }; return FlyString { String::from_utf8_without_validation(string) }; } FlyString::FlyString(String const& string) { if (string.is_short_string()) { m_data = string; return; } if (string.m_data->is_fly_string()) { m_data = string; return; } auto it = all_fly_strings().find(string.m_data); if (it == all_fly_strings().end()) { m_data = string; all_fly_strings().set(string.m_data); string.m_data->set_fly_string(true); } else { m_data.m_data = *it; m_data.m_data->ref(); } } FlyString& FlyString::operator=(String const& string) { *this = FlyString { string }; return *this; } bool FlyString::is_empty() const { return bytes_as_string_view().is_empty(); } unsigned FlyString::hash() const { return m_data.hash(); } u32 FlyString::ascii_case_insensitive_hash() const { return case_insensitive_string_hash(reinterpret_cast(bytes().data()), bytes().size()); } FlyString::operator String() const { return to_string(); } String FlyString::to_string() const { Detail::StringBase copy = m_data; return String(move(copy)); } Utf8View FlyString::code_points() const { return Utf8View { bytes_as_string_view() }; } ReadonlyBytes FlyString::bytes() const { return bytes_as_string_view().bytes(); } StringView FlyString::bytes_as_string_view() const { return m_data.bytes(); } bool FlyString::operator==(String const& other) const { return m_data == other; } bool FlyString::operator==(StringView string) const { return bytes_as_string_view() == string; } bool FlyString::operator==(char const* string) const { return bytes_as_string_view() == string; } void FlyString::did_destroy_fly_string_data(Badge, Detail::StringData const& string_data) { all_fly_strings().remove(&string_data); } Detail::StringBase FlyString::data(Badge) const { return m_data; } size_t FlyString::number_of_fly_strings() { return all_fly_strings().size(); } DeprecatedFlyString FlyString::to_deprecated_fly_string() const { return DeprecatedFlyString(bytes_as_string_view()); } ErrorOr FlyString::from_deprecated_fly_string(DeprecatedFlyString const& deprecated_fly_string) { return FlyString::from_utf8(deprecated_fly_string.view()); } unsigned Traits::hash(FlyString const& fly_string) { return fly_string.hash(); } int FlyString::operator<=>(FlyString const& other) const { return bytes_as_string_view().compare(other.bytes_as_string_view()); } ErrorOr Formatter::format(FormatBuilder& builder, FlyString const& fly_string) { return Formatter::format(builder, fly_string.bytes_as_string_view()); } FlyString FlyString::to_ascii_lowercase() const { bool const has_ascii_uppercase = [&] { for (u8 const byte : bytes()) { if (AK::is_ascii_upper_alpha(byte)) return true; } return false; }(); if (!has_ascii_uppercase) return *this; Vector lowercase_bytes; lowercase_bytes.ensure_capacity(bytes().size()); for (u8 const byte : bytes()) { if (AK::is_ascii_upper_alpha(byte)) lowercase_bytes.unchecked_append(AK::to_ascii_lowercase(byte)); else lowercase_bytes.unchecked_append(byte); } return String::from_utf8_without_validation(lowercase_bytes); } FlyString FlyString::to_ascii_uppercase() const { bool const has_ascii_lowercase = [&] { for (u8 const byte : bytes()) { if (AK::is_ascii_lower_alpha(byte)) return true; } return false; }(); if (!has_ascii_lowercase) return *this; Vector uppercase_bytes; uppercase_bytes.ensure_capacity(bytes().size()); for (u8 const byte : bytes()) { if (AK::is_ascii_lower_alpha(byte)) uppercase_bytes.unchecked_append(AK::to_ascii_uppercase(byte)); else uppercase_bytes.unchecked_append(byte); } return String::from_utf8_without_validation(uppercase_bytes); } bool FlyString::equals_ignoring_ascii_case(FlyString const& other) const { if (*this == other) return true; return StringUtils::equals_ignoring_ascii_case(bytes_as_string_view(), other.bytes_as_string_view()); } bool FlyString::equals_ignoring_ascii_case(StringView other) const { return StringUtils::equals_ignoring_ascii_case(bytes_as_string_view(), other); } bool FlyString::starts_with_bytes(StringView bytes, CaseSensitivity case_sensitivity) const { return bytes_as_string_view().starts_with(bytes, case_sensitivity); } bool FlyString::ends_with_bytes(StringView bytes, CaseSensitivity case_sensitivity) const { return bytes_as_string_view().ends_with(bytes, case_sensitivity); } }