DateTimeFormat.cpp 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337
  1. /*
  2. * Copyright (c) 2021-2022, Tim Flynn <trflynn89@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include <AK/Array.h>
  7. #include <AK/StringBuilder.h>
  8. #include <LibUnicode/DateTimeFormat.h>
  9. #include <LibUnicode/Locale.h>
  10. #include <LibUnicode/NumberFormat.h>
  11. #include <stdlib.h>
  12. namespace Unicode {
  13. HourCycle hour_cycle_from_string(StringView hour_cycle)
  14. {
  15. if (hour_cycle == "h11"sv)
  16. return Unicode::HourCycle::H11;
  17. else if (hour_cycle == "h12"sv)
  18. return Unicode::HourCycle::H12;
  19. else if (hour_cycle == "h23"sv)
  20. return Unicode::HourCycle::H23;
  21. else if (hour_cycle == "h24"sv)
  22. return Unicode::HourCycle::H24;
  23. VERIFY_NOT_REACHED();
  24. }
  25. StringView hour_cycle_to_string(HourCycle hour_cycle)
  26. {
  27. switch (hour_cycle) {
  28. case HourCycle::H11:
  29. return "h11"sv;
  30. case HourCycle::H12:
  31. return "h12"sv;
  32. case HourCycle::H23:
  33. return "h23"sv;
  34. case HourCycle::H24:
  35. return "h24"sv;
  36. default:
  37. VERIFY_NOT_REACHED();
  38. }
  39. }
  40. CalendarPatternStyle calendar_pattern_style_from_string(StringView style)
  41. {
  42. if (style == "narrow"sv)
  43. return CalendarPatternStyle::Narrow;
  44. if (style == "short"sv)
  45. return CalendarPatternStyle::Short;
  46. if (style == "long"sv)
  47. return CalendarPatternStyle::Long;
  48. if (style == "numeric"sv)
  49. return CalendarPatternStyle::Numeric;
  50. if (style == "2-digit"sv)
  51. return CalendarPatternStyle::TwoDigit;
  52. if (style == "shortOffset"sv)
  53. return CalendarPatternStyle::ShortOffset;
  54. if (style == "longOffset"sv)
  55. return CalendarPatternStyle::LongOffset;
  56. if (style == "shortGeneric"sv)
  57. return CalendarPatternStyle::ShortGeneric;
  58. if (style == "longGeneric"sv)
  59. return CalendarPatternStyle::LongGeneric;
  60. VERIFY_NOT_REACHED();
  61. }
  62. StringView calendar_pattern_style_to_string(CalendarPatternStyle style)
  63. {
  64. switch (style) {
  65. case CalendarPatternStyle::Narrow:
  66. return "narrow"sv;
  67. case CalendarPatternStyle::Short:
  68. return "short"sv;
  69. case CalendarPatternStyle::Long:
  70. return "long"sv;
  71. case CalendarPatternStyle::Numeric:
  72. return "numeric"sv;
  73. case CalendarPatternStyle::TwoDigit:
  74. return "2-digit"sv;
  75. case CalendarPatternStyle::ShortOffset:
  76. return "shortOffset"sv;
  77. case CalendarPatternStyle::LongOffset:
  78. return "longOffset"sv;
  79. case CalendarPatternStyle::ShortGeneric:
  80. return "shortGeneric"sv;
  81. case CalendarPatternStyle::LongGeneric:
  82. return "longGeneric"sv;
  83. default:
  84. VERIFY_NOT_REACHED();
  85. }
  86. }
// Weak fallback definitions for the hour cycle lookups; both return an empty value.
// Because they are declared weak, a non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<HourCycleRegion> __attribute__((weak)) hour_cycle_region_from_string(StringView) { return {}; }
Vector<HourCycle> __attribute__((weak)) get_regional_hour_cycles(StringView) { return {}; }
  89. template<typename GetRegionalValues>
  90. static auto find_regional_values_for_locale(StringView locale, GetRegionalValues&& get_regional_values)
  91. {
  92. auto has_value = [](auto const& container) {
  93. if constexpr (requires { container.has_value(); })
  94. return container.has_value();
  95. else
  96. return !container.is_empty();
  97. };
  98. if (auto regional_values = get_regional_values(locale); has_value(regional_values))
  99. return regional_values;
  100. auto return_default_values = [&]() { return get_regional_values("001"sv); };
  101. auto language = parse_unicode_language_id(locale);
  102. if (!language.has_value())
  103. return return_default_values();
  104. if (!language->region.has_value())
  105. language = add_likely_subtags(*language);
  106. if (!language.has_value() || !language->region.has_value())
  107. return return_default_values();
  108. if (auto regional_values = get_regional_values(*language->region); has_value(regional_values))
  109. return regional_values;
  110. return return_default_values();
  111. }
  112. // https://unicode.org/reports/tr35/tr35-dates.html#Date_Field_Symbol_Table
  113. Vector<Unicode::HourCycle> get_locale_hour_cycles(StringView locale)
  114. {
  115. return find_regional_values_for_locale(locale, get_regional_hour_cycles);
  116. }
  117. Optional<Unicode::HourCycle> get_default_regional_hour_cycle(StringView locale)
  118. {
  119. if (auto hour_cycles = get_locale_hour_cycles(locale); !hour_cycles.is_empty())
  120. return hour_cycles.first();
  121. return {};
  122. }
// Weak fallback definitions for the minimum-days lookups; both return an empty Optional.
// A non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<MinimumDaysRegion> __attribute__((weak)) minimum_days_region_from_string(StringView) { return {}; }
Optional<u8> __attribute__((weak)) get_regional_minimum_days(StringView) { return {}; }
  125. Optional<u8> get_locale_minimum_days(StringView locale)
  126. {
  127. return find_regional_values_for_locale(locale, get_regional_minimum_days);
  128. }
// Weak fallback definitions for the first-day lookups; both return an empty Optional.
// A non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<FirstDayRegion> __attribute__((weak)) first_day_region_from_string(StringView) { return {}; }
Optional<Weekday> __attribute__((weak)) get_regional_first_day(StringView) { return {}; }
  131. Optional<Weekday> get_locale_first_day(StringView locale)
  132. {
  133. return find_regional_values_for_locale(locale, get_regional_first_day);
  134. }
// Weak fallback definitions for the weekend-start lookups; both return an empty Optional.
// A non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<WeekendStartRegion> __attribute__((weak)) weekend_start_region_from_string(StringView) { return {}; }
Optional<Weekday> __attribute__((weak)) get_regional_weekend_start(StringView) { return {}; }
  137. Optional<Weekday> get_locale_weekend_start(StringView locale)
  138. {
  139. return find_regional_values_for_locale(locale, get_regional_weekend_start);
  140. }
// Weak fallback definitions for the weekend-end lookups; both return an empty Optional.
// A non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<WeekendEndRegion> __attribute__((weak)) weekend_end_region_from_string(StringView) { return {}; }
Optional<Weekday> __attribute__((weak)) get_regional_weekend_end(StringView) { return {}; }
  143. Optional<Weekday> get_locale_weekend_end(StringView locale)
  144. {
  145. return find_regional_values_for_locale(locale, get_regional_weekend_end);
  146. }
  147. String combine_skeletons(StringView first, StringView second)
  148. {
  149. // https://unicode.org/reports/tr35/tr35-dates.html#availableFormats_appendItems
  150. constexpr auto field_order = Array {
  151. "G"sv, // Era
  152. "yYuUr"sv, // Year
  153. "ML"sv, // Month
  154. "dDFg"sv, // Day
  155. "Eec"sv, // Weekday
  156. "abB"sv, // Period
  157. "hHKk"sv, // Hour
  158. "m"sv, // Minute
  159. "sSA"sv, // Second
  160. "zZOvVXx"sv, // Zone
  161. };
  162. StringBuilder builder;
  163. auto append_from_skeleton = [&](auto skeleton, auto ch) {
  164. auto first_index = skeleton.find(ch);
  165. if (!first_index.has_value())
  166. return false;
  167. auto last_index = skeleton.find_last(ch);
  168. builder.append(skeleton.substring_view(*first_index, *last_index - *first_index + 1));
  169. return true;
  170. };
  171. for (auto fields : field_order) {
  172. for (auto ch : fields) {
  173. if (append_from_skeleton(first, ch))
  174. break;
  175. if (append_from_skeleton(second, ch))
  176. break;
  177. }
  178. }
  179. return builder.build();
  180. }
// Weak fallback definitions for the calendar format lookups; each returns an empty Optional.
// A non-weak definition of the same symbol takes precedence when one is linked
// (presumably generated locale data - confirm against the build).
Optional<CalendarFormat> __attribute__((weak)) get_calendar_date_format(StringView, StringView) { return {}; }
Optional<CalendarFormat> __attribute__((weak)) get_calendar_time_format(StringView, StringView) { return {}; }
Optional<CalendarFormat> __attribute__((weak)) get_calendar_date_time_format(StringView, StringView) { return {}; }
  184. Optional<CalendarFormat> get_calendar_format(StringView locale, StringView calendar, CalendarFormatType type)
  185. {
  186. switch (type) {
  187. case CalendarFormatType::Date:
  188. return get_calendar_date_format(locale, calendar);
  189. case CalendarFormatType::Time:
  190. return get_calendar_time_format(locale, calendar);
  191. case CalendarFormatType::DateTime:
  192. return get_calendar_date_time_format(locale, calendar);
  193. default:
  194. VERIFY_NOT_REACHED();
  195. }
  196. }
// Weak fallback definitions for the calendar pattern, range format, symbol and time zone lookups.
// Each returns an empty Vector or an empty Optional. A non-weak definition of the same symbol takes
// precedence when one is linked (presumably generated locale data - confirm against the build).
Vector<CalendarPattern> __attribute__((weak)) get_calendar_available_formats(StringView, StringView) { return {}; }
Optional<CalendarRangePattern> __attribute__((weak)) get_calendar_default_range_format(StringView, StringView) { return {}; }
Vector<CalendarRangePattern> __attribute__((weak)) get_calendar_range_formats(StringView, StringView, StringView) { return {}; }
Vector<CalendarRangePattern> __attribute__((weak)) get_calendar_range12_formats(StringView, StringView, StringView) { return {}; }
Optional<StringView> __attribute__((weak)) get_calendar_era_symbol(StringView, StringView, CalendarPatternStyle, Era) { return {}; }
Optional<StringView> __attribute__((weak)) get_calendar_month_symbol(StringView, StringView, CalendarPatternStyle, Month) { return {}; }
Optional<StringView> __attribute__((weak)) get_calendar_weekday_symbol(StringView, StringView, CalendarPatternStyle, Weekday) { return {}; }
Optional<StringView> __attribute__((weak)) get_calendar_day_period_symbol(StringView, StringView, CalendarPatternStyle, DayPeriod) { return {}; }
Optional<StringView> __attribute__((weak)) get_calendar_day_period_symbol_for_hour(StringView, StringView, CalendarPatternStyle, u8) { return {}; }
Optional<StringView> __attribute__((weak)) get_time_zone_name(StringView, StringView, CalendarPatternStyle, TimeZone::InDST) { return {}; }
Optional<TimeZoneFormat> __attribute__((weak)) get_time_zone_format(StringView) { return {}; }
  208. static Optional<String> format_time_zone_offset(StringView locale, CalendarPatternStyle style, i64 offset_seconds)
  209. {
  210. auto formats = get_time_zone_format(locale);
  211. if (!formats.has_value())
  212. return {};
  213. auto number_system = get_default_number_system(locale);
  214. if (!number_system.has_value())
  215. return {};
  216. if (offset_seconds == 0)
  217. return formats->gmt_zero_format;
  218. auto sign = offset_seconds > 0 ? formats->symbol_ahead_sign : formats->symbol_behind_sign;
  219. auto separator = offset_seconds > 0 ? formats->symbol_ahead_separator : formats->symbol_behind_separator;
  220. offset_seconds = llabs(offset_seconds);
  221. auto offset_hours = offset_seconds / 3'600;
  222. offset_seconds %= 3'600;
  223. auto offset_minutes = offset_seconds / 60;
  224. offset_seconds %= 60;
  225. StringBuilder builder;
  226. builder.append(sign);
  227. switch (style) {
  228. // The long format always uses 2-digit hours field and minutes field, with optional 2-digit seconds field.
  229. case CalendarPatternStyle::LongOffset:
  230. builder.appendff("{:02}{}{:02}", offset_hours, separator, offset_minutes);
  231. if (offset_seconds > 0)
  232. builder.appendff("{}{:02}", separator, offset_seconds);
  233. break;
  234. // The short format is intended for the shortest representation and uses hour fields without leading zero, with optional 2-digit minutes and seconds fields.
  235. case CalendarPatternStyle::ShortOffset:
  236. builder.appendff("{}", offset_hours);
  237. if (offset_minutes > 0) {
  238. builder.appendff("{}{:02}", separator, offset_minutes);
  239. if (offset_seconds > 0)
  240. builder.appendff("{}{:02}", separator, offset_seconds);
  241. }
  242. break;
  243. default:
  244. VERIFY_NOT_REACHED();
  245. }
  246. // The digits used for hours, minutes and seconds fields in this format are the locale's default decimal digits.
  247. auto result = replace_digits_for_number_system(*number_system, builder.build());
  248. return formats->gmt_format.replace("{0}"sv, result, ReplaceMode::FirstOnly);
  249. }
  250. // https://unicode.org/reports/tr35/tr35-dates.html#Time_Zone_Format_Terminology
  251. String format_time_zone(StringView locale, StringView time_zone, CalendarPatternStyle style, AK::Time time)
  252. {
  253. auto offset = TimeZone::get_time_zone_offset(time_zone, time);
  254. if (!offset.has_value())
  255. return time_zone;
  256. switch (style) {
  257. case CalendarPatternStyle::Short:
  258. case CalendarPatternStyle::Long:
  259. case CalendarPatternStyle::ShortGeneric:
  260. case CalendarPatternStyle::LongGeneric:
  261. if (auto name = get_time_zone_name(locale, time_zone, style, offset->in_dst); name.has_value())
  262. return *name;
  263. break;
  264. case CalendarPatternStyle::ShortOffset:
  265. case CalendarPatternStyle::LongOffset:
  266. return format_time_zone_offset(locale, style, offset->seconds).value_or(time_zone);
  267. default:
  268. VERIFY_NOT_REACHED();
  269. }
  270. // If more styles are added, consult the following table to ensure always falling back to GMT offset is still correct:
  271. // https://unicode.org/reports/tr35/tr35-dates.html#dfst-zone
  272. switch (style) {
  273. case CalendarPatternStyle::Short:
  274. case CalendarPatternStyle::ShortGeneric:
  275. return format_time_zone(locale, time_zone, CalendarPatternStyle::ShortOffset, time);
  276. case CalendarPatternStyle::Long:
  277. case CalendarPatternStyle::LongGeneric:
  278. return format_time_zone(locale, time_zone, CalendarPatternStyle::LongOffset, time);
  279. default:
  280. VERIFY_NOT_REACHED();
  281. }
  282. }
  283. }