GenerateTimeZoneData.cpp 30 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836
  1. /*
  2. * Copyright (c) 2022, Tim Flynn <trflynn89@serenityos.org>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #include "../LibUnicode/GeneratorUtil.h" // FIXME: Move this somewhere common.
  7. #include <AK/DateConstants.h>
  8. #include <AK/Format.h>
  9. #include <AK/HashMap.h>
  10. #include <AK/SourceGenerator.h>
  11. #include <AK/String.h>
  12. #include <AK/StringBuilder.h>
  13. #include <AK/Vector.h>
  14. #include <LibCore/ArgsParser.h>
  15. #include <LibCore/Stream.h>
  16. #include <LibTimeZone/TimeZone.h>
  17. namespace {
  18. using StringIndexType = u16;
  19. constexpr auto s_string_index_type = "u16"sv;
  20. struct DateTime {
  21. u16 year { 0 };
  22. Optional<u8> month;
  23. Optional<u8> day;
  24. Optional<u8> last_weekday;
  25. Optional<u8> after_weekday;
  26. Optional<u8> before_weekday;
  27. Optional<u8> hour;
  28. Optional<u8> minute;
  29. Optional<u8> second;
  30. };
  31. struct TimeZoneOffset {
  32. i64 offset { 0 };
  33. Optional<DateTime> until;
  34. Optional<String> dst_rule;
  35. Optional<i32> dst_rule_index;
  36. i64 dst_offset { 0 };
  37. StringIndexType standard_format { 0 };
  38. StringIndexType daylight_format { 0 };
  39. };
  40. struct DaylightSavingsOffset {
  41. i64 offset { 0 };
  42. u16 year_from { 0 };
  43. Optional<u16> year_to;
  44. DateTime in_effect;
  45. StringIndexType format { 0 };
  46. };
  47. struct TimeZoneData {
  48. UniqueStringStorage<StringIndexType> unique_strings;
  49. HashMap<String, Vector<TimeZoneOffset>> time_zones;
  50. Vector<String> time_zone_names;
  51. Vector<Alias> time_zone_aliases;
  52. HashMap<String, Vector<DaylightSavingsOffset>> dst_offsets;
  53. Vector<String> dst_offset_names;
  54. HashMap<String, TimeZone::Location> time_zone_coordinates;
  55. HashMap<String, Vector<StringIndexType>> time_zone_regions;
  56. Vector<String> time_zone_region_names;
  57. };
  58. }
  59. template<>
  60. struct AK::Formatter<DateTime> : Formatter<FormatString> {
  61. ErrorOr<void> format(FormatBuilder& builder, DateTime const& date_time)
  62. {
  63. return Formatter<FormatString>::format(builder,
  64. "{{ {}, {}, {}, {}, {}, {}, {}, {}, {} }}"sv,
  65. date_time.year,
  66. date_time.month.value_or(1),
  67. date_time.day.value_or(1),
  68. date_time.last_weekday.value_or(0),
  69. date_time.after_weekday.value_or(0),
  70. date_time.before_weekday.value_or(0),
  71. date_time.hour.value_or(0),
  72. date_time.minute.value_or(0),
  73. date_time.second.value_or(0));
  74. }
  75. };
  76. template<>
  77. struct AK::Formatter<TimeZoneOffset> : Formatter<FormatString> {
  78. ErrorOr<void> format(FormatBuilder& builder, TimeZoneOffset const& time_zone_offset)
  79. {
  80. return Formatter<FormatString>::format(builder,
  81. "{{ {}, {}, {}, {}, {}, {}, {} }}"sv,
  82. time_zone_offset.offset,
  83. time_zone_offset.until.value_or({}),
  84. time_zone_offset.until.has_value(),
  85. time_zone_offset.dst_rule_index.value_or(-1),
  86. time_zone_offset.dst_offset,
  87. time_zone_offset.standard_format,
  88. time_zone_offset.daylight_format);
  89. }
  90. };
  91. template<>
  92. struct AK::Formatter<DaylightSavingsOffset> : Formatter<FormatString> {
  93. ErrorOr<void> format(FormatBuilder& builder, DaylightSavingsOffset const& dst_offset)
  94. {
  95. auto format_time = [&](auto year) {
  96. return String::formatted("AK::Time::from_timestamp({}, 1, 1, 0, 0, 0, 0)", year);
  97. };
  98. static String max_year_as_time("max_year_as_time"sv);
  99. return Formatter<FormatString>::format(builder,
  100. "{{ {}, {}, {}, {}, {} }}"sv,
  101. dst_offset.offset,
  102. format_time(dst_offset.year_from),
  103. dst_offset.year_to.has_value()
  104. ? format_time(*dst_offset.year_to + 1)
  105. : max_year_as_time,
  106. dst_offset.in_effect,
  107. dst_offset.format);
  108. }
  109. };
  110. template<>
  111. struct AK::Formatter<TimeZone::Coordinate> : Formatter<FormatString> {
  112. ErrorOr<void> format(FormatBuilder& builder, TimeZone::Coordinate const& coordinate)
  113. {
  114. return Formatter<FormatString>::format(builder,
  115. "{{ {}, {}, {} }}"sv,
  116. coordinate.degrees,
  117. coordinate.minutes,
  118. coordinate.seconds);
  119. }
  120. };
  121. template<>
  122. struct AK::Formatter<TimeZone::Location> : Formatter<FormatString> {
  123. ErrorOr<void> format(FormatBuilder& builder, TimeZone::Location const& location)
  124. {
  125. return Formatter<FormatString>::format(builder,
  126. "{{ {}, {} }}"sv,
  127. location.latitude,
  128. location.longitude);
  129. }
  130. };
  131. static Optional<DateTime> parse_date_time(Span<StringView const> segments)
  132. {
  133. auto comment_index = find_index(segments.begin(), segments.end(), "#"sv);
  134. if (comment_index != segments.size())
  135. segments = segments.slice(0, comment_index);
  136. if (segments.is_empty())
  137. return {};
  138. DateTime date_time {};
  139. date_time.year = segments[0].to_uint().value();
  140. if (segments.size() > 1)
  141. date_time.month = find_index(short_month_names.begin(), short_month_names.end(), segments[1]) + 1;
  142. if (segments.size() > 2) {
  143. if (segments[2].starts_with("last"sv)) {
  144. auto weekday = segments[2].substring_view("last"sv.length());
  145. date_time.last_weekday = find_index(short_day_names.begin(), short_day_names.end(), weekday);
  146. } else if (auto index = segments[2].find(">="sv); index.has_value()) {
  147. auto weekday = segments[2].substring_view(0, *index);
  148. date_time.after_weekday = find_index(short_day_names.begin(), short_day_names.end(), weekday);
  149. auto day = segments[2].substring_view(*index + ">="sv.length());
  150. date_time.day = day.to_uint().value();
  151. } else if (auto index = segments[2].find("<="sv); index.has_value()) {
  152. auto weekday = segments[2].substring_view(0, *index);
  153. date_time.before_weekday = find_index(short_day_names.begin(), short_day_names.end(), weekday);
  154. auto day = segments[2].substring_view(*index + "<="sv.length());
  155. date_time.day = day.to_uint().value();
  156. } else {
  157. date_time.day = segments[2].to_uint().value();
  158. }
  159. }
  160. if (segments.size() > 3) {
  161. // FIXME: Some times end with a letter, e.g. "2:00u" and "2:00s". Figure out what this means and handle it.
  162. auto time_segments = segments[3].split_view(':');
  163. date_time.hour = time_segments[0].to_int().value();
  164. date_time.minute = time_segments.size() > 1 ? time_segments[1].substring_view(0, 2).to_uint().value() : 0;
  165. date_time.second = time_segments.size() > 2 ? time_segments[2].substring_view(0, 2).to_uint().value() : 0;
  166. }
  167. return date_time;
  168. }
  169. static i64 parse_time_offset(StringView segment)
  170. {
  171. auto segments = segment.split_view(':');
  172. i64 hours = segments[0].to_int().value();
  173. i64 minutes = segments.size() > 1 ? segments[1].to_uint().value() : 0;
  174. i64 seconds = segments.size() > 2 ? segments[2].to_uint().value() : 0;
  175. i64 sign = ((hours < 0) || (segments[0] == "-0"sv)) ? -1 : 1;
  176. return (hours * 3600) + sign * ((minutes * 60) + seconds);
  177. }
  178. static void parse_dst_rule(StringView segment, TimeZoneOffset& time_zone)
  179. {
  180. if (segment.contains(':'))
  181. time_zone.dst_offset = parse_time_offset(segment);
  182. else if (segment != "-"sv)
  183. time_zone.dst_rule = segment;
  184. }
  185. static void parse_format(StringView format, TimeZoneData& time_zone_data, TimeZoneOffset& time_zone)
  186. {
  187. auto formats = format.replace("%s"sv, "{}"sv, ReplaceMode::FirstOnly).split('/');
  188. VERIFY(formats.size() <= 2);
  189. time_zone.standard_format = time_zone_data.unique_strings.ensure(formats[0]);
  190. if (formats.size() == 2)
  191. time_zone.daylight_format = time_zone_data.unique_strings.ensure(formats[1]);
  192. else
  193. time_zone.daylight_format = time_zone.standard_format;
  194. }
  195. static Vector<TimeZoneOffset>& parse_zone(StringView zone_line, TimeZoneData& time_zone_data)
  196. {
  197. auto segments = zone_line.split_view_if([](char ch) { return (ch == '\t') || (ch == ' '); });
  198. // "Zone" NAME STDOFF RULES FORMAT [UNTIL]
  199. VERIFY(segments[0] == "Zone"sv);
  200. auto name = segments[1];
  201. TimeZoneOffset time_zone {};
  202. time_zone.offset = parse_time_offset(segments[2]);
  203. parse_dst_rule(segments[3], time_zone);
  204. parse_format(segments[4], time_zone_data, time_zone);
  205. if (segments.size() > 5)
  206. time_zone.until = parse_date_time(segments.span().slice(5));
  207. auto& time_zones = time_zone_data.time_zones.ensure(name);
  208. time_zones.append(move(time_zone));
  209. if (!time_zone_data.time_zone_names.contains_slow(name))
  210. time_zone_data.time_zone_names.append(name);
  211. return time_zones;
  212. }
  213. static void parse_zone_continuation(StringView zone_line, TimeZoneData& time_zone_data, Vector<TimeZoneOffset>& time_zones)
  214. {
  215. auto segments = zone_line.split_view_if([](char ch) { return (ch == '\t') || (ch == ' '); });
  216. // STDOFF RULES FORMAT [UNTIL]
  217. TimeZoneOffset time_zone {};
  218. time_zone.offset = parse_time_offset(segments[0]);
  219. parse_dst_rule(segments[1], time_zone);
  220. parse_format(segments[2], time_zone_data, time_zone);
  221. if (segments.size() > 3)
  222. time_zone.until = parse_date_time(segments.span().slice(3));
  223. time_zones.append(move(time_zone));
  224. }
  225. static void parse_link(StringView link_line, TimeZoneData& time_zone_data)
  226. {
  227. auto segments = link_line.split_view_if([](char ch) { return (ch == '\t') || (ch == ' '); });
  228. // Link TARGET LINK-NAME
  229. VERIFY(segments[0] == "Link"sv);
  230. auto target = segments[1];
  231. auto alias = segments[2];
  232. time_zone_data.time_zone_aliases.append({ target, alias });
  233. }
  234. static void parse_rule(StringView rule_line, TimeZoneData& time_zone_data)
  235. {
  236. auto segments = rule_line.split_view_if([](char ch) { return (ch == '\t') || (ch == ' '); });
  237. // Rule NAME FROM TO TYPE IN ON AT SAVE LETTER/S
  238. VERIFY(segments[0] == "Rule"sv);
  239. auto name = segments[1];
  240. DaylightSavingsOffset dst_offset {};
  241. dst_offset.offset = parse_time_offset(segments[8]);
  242. dst_offset.year_from = segments[2].to_uint().value();
  243. if (segments[3] == "only")
  244. dst_offset.year_to = dst_offset.year_from;
  245. else if (segments[3] != "max"sv)
  246. dst_offset.year_to = segments[3].to_uint().value();
  247. auto in_effect = Array { "0"sv, segments[5], segments[6], segments[7] };
  248. dst_offset.in_effect = parse_date_time(in_effect).release_value();
  249. if (segments[9] != "-"sv)
  250. dst_offset.format = time_zone_data.unique_strings.ensure(segments[9]);
  251. auto& dst_offsets = time_zone_data.dst_offsets.ensure(name);
  252. dst_offsets.append(move(dst_offset));
  253. if (!time_zone_data.dst_offset_names.contains_slow(name))
  254. time_zone_data.dst_offset_names.append(name);
  255. }
  256. static ErrorOr<void> parse_time_zones(StringView time_zone_path, TimeZoneData& time_zone_data)
  257. {
  258. // For reference, the man page for `zic` has the best documentation of the TZDB file format.
  259. auto file = TRY(open_file(time_zone_path, Core::Stream::OpenMode::Read));
  260. Array<u8, 1024> buffer {};
  261. Vector<TimeZoneOffset>* last_parsed_zone = nullptr;
  262. while (TRY(file->can_read_line())) {
  263. auto line = TRY(file->read_line(buffer));
  264. if (line.is_empty() || line.trim_whitespace(TrimMode::Left).starts_with('#'))
  265. continue;
  266. if (line.starts_with("Zone"sv)) {
  267. last_parsed_zone = &parse_zone(line, time_zone_data);
  268. } else if (line.starts_with('\t')) {
  269. VERIFY(last_parsed_zone != nullptr);
  270. parse_zone_continuation(line, time_zone_data, *last_parsed_zone);
  271. } else {
  272. last_parsed_zone = nullptr;
  273. if (line.starts_with("Link"sv))
  274. parse_link(line, time_zone_data);
  275. else if (line.starts_with("Rule"sv))
  276. parse_rule(line, time_zone_data);
  277. }
  278. }
  279. return {};
  280. }
  281. static ErrorOr<void> parse_time_zone_coordinates(Core::Stream::BufferedFile& file, TimeZoneData& time_zone_data)
  282. {
  283. auto parse_coordinate = [](auto coordinate) {
  284. VERIFY(coordinate.substring_view(0, 1).is_one_of("+"sv, "-"sv));
  285. TimeZone::Coordinate parsed {};
  286. if (coordinate.length() == 5) {
  287. // ±DDMM
  288. parsed.degrees = coordinate.substring_view(0, 3).to_int().value();
  289. parsed.minutes = coordinate.substring_view(3).to_int().value();
  290. } else if (coordinate.length() == 6) {
  291. // ±DDDMM
  292. parsed.degrees = coordinate.substring_view(0, 4).to_int().value();
  293. parsed.minutes = coordinate.substring_view(4).to_int().value();
  294. } else if (coordinate.length() == 7) {
  295. // ±DDMMSS
  296. parsed.degrees = coordinate.substring_view(0, 3).to_int().value();
  297. parsed.minutes = coordinate.substring_view(3, 2).to_int().value();
  298. parsed.seconds = coordinate.substring_view(5).to_int().value();
  299. } else if (coordinate.length() == 8) {
  300. // ±DDDDMMSS
  301. parsed.degrees = coordinate.substring_view(0, 4).to_int().value();
  302. parsed.minutes = coordinate.substring_view(4, 2).to_int().value();
  303. parsed.seconds = coordinate.substring_view(6).to_int().value();
  304. } else {
  305. VERIFY_NOT_REACHED();
  306. }
  307. return parsed;
  308. };
  309. Array<u8, 1024> buffer {};
  310. while (TRY(file.can_read_line())) {
  311. auto line = TRY(file.read_line(buffer));
  312. if (line.is_empty() || line.trim_whitespace(TrimMode::Left).starts_with('#'))
  313. continue;
  314. auto segments = line.split_view('\t');
  315. auto regions = segments[0];
  316. auto coordinates = segments[1];
  317. auto zone = segments[2];
  318. VERIFY(time_zone_data.time_zones.contains(zone));
  319. auto index = coordinates.find_any_of("+-"sv, StringView::SearchDirection::Backward).value();
  320. auto latitude = parse_coordinate(coordinates.substring_view(0, index));
  321. auto longitude = parse_coordinate(coordinates.substring_view(index));
  322. time_zone_data.time_zone_coordinates.set(zone, { latitude, longitude });
  323. regions.for_each_split_view(',', SplitBehavior::Nothing, [&](auto region) {
  324. auto index = time_zone_data.unique_strings.ensure(zone);
  325. time_zone_data.time_zone_regions.ensure(region).append(index);
  326. if (!time_zone_data.time_zone_region_names.contains_slow(region))
  327. time_zone_data.time_zone_region_names.append(region);
  328. });
  329. }
  330. return {};
  331. }
  332. static void set_dst_rule_indices(TimeZoneData& time_zone_data)
  333. {
  334. for (auto& time_zone : time_zone_data.time_zones) {
  335. for (auto& time_zone_offset : time_zone.value) {
  336. if (!time_zone_offset.dst_rule.has_value())
  337. continue;
  338. auto dst_rule_index = time_zone_data.dst_offset_names.find_first_index(*time_zone_offset.dst_rule);
  339. time_zone_offset.dst_rule_index = static_cast<i32>(dst_rule_index.value());
  340. }
  341. }
  342. }
  343. static String format_identifier(StringView owner, String identifier)
  344. {
  345. constexpr auto gmt_time_zones = Array { "Etc/GMT"sv, "GMT"sv };
  346. for (auto gmt_time_zone : gmt_time_zones) {
  347. if (identifier.starts_with(gmt_time_zone)) {
  348. auto offset = identifier.substring_view(gmt_time_zone.length());
  349. if (offset.starts_with('+'))
  350. identifier = String::formatted("{}_Ahead_{}", gmt_time_zone, offset.substring_view(1));
  351. else if (offset.starts_with('-'))
  352. identifier = String::formatted("{}_Behind_{}", gmt_time_zone, offset.substring_view(1));
  353. }
  354. }
  355. identifier = identifier.replace("-"sv, "_"sv, ReplaceMode::All);
  356. identifier = identifier.replace("/"sv, "_"sv, ReplaceMode::All);
  357. if (all_of(identifier, is_ascii_digit))
  358. return String::formatted("{}_{}", owner[0], identifier);
  359. if (is_ascii_lower_alpha(identifier[0]))
  360. return String::formatted("{:c}{}", to_ascii_uppercase(identifier[0]), identifier.substring_view(1));
  361. return identifier;
  362. }
  363. static ErrorOr<void> generate_time_zone_data_header(Core::Stream::BufferedFile& file, TimeZoneData& time_zone_data)
  364. {
  365. StringBuilder builder;
  366. SourceGenerator generator { builder };
  367. generator.append(R"~~~(
  368. #pragma once
  369. #include <AK/Types.h>
  370. namespace TimeZone {
  371. )~~~");
  372. generate_enum(generator, format_identifier, "TimeZone"sv, {}, time_zone_data.time_zone_names, time_zone_data.time_zone_aliases);
  373. generate_enum(generator, format_identifier, "DaylightSavingsRule"sv, {}, time_zone_data.dst_offset_names);
  374. generate_enum(generator, format_identifier, "Region"sv, {}, time_zone_data.time_zone_region_names);
  375. generator.append(R"~~~(
  376. }
  377. )~~~");
  378. TRY(file.write(generator.as_string_view().bytes()));
  379. return {};
  380. }
  // Writes the generated implementation file: the runtime struct definitions, the string table, the
  // per-zone / per-rule / per-region data arrays, the string <-> enum conversions and the lookup
  // functions, all inside namespace TimeZone.
  381. static ErrorOr<void> generate_time_zone_data_implementation(Core::Stream::BufferedFile& file, TimeZoneData& time_zone_data)
  382. {
  383. StringBuilder builder;
  384. SourceGenerator generator { builder };
  385. generator.set("string_index_type"sv, s_string_index_type);
  // Rule names must be resolved to indices before any TimeZoneOffset is formatted below, because the
  // formatter emits dst_rule_index (or -1 when it is unset).
  386. set_dst_rule_indices(time_zone_data);
  387. generator.append(R"~~~(
  388. #include <AK/Array.h>
  389. #include <AK/BinarySearch.h>
  390. #include <AK/Optional.h>
  391. #include <AK/Span.h>
  392. #include <AK/NumericLimits.h>
  393. #include <AK/StringView.h>
  394. #include <AK/Time.h>
  395. #include <LibTimeZone/TimeZone.h>
  396. #include <LibTimeZone/TimeZoneData.h>
  397. namespace TimeZone {
  398. static constexpr auto max_year_as_time = AK::Time::from_timestamp(NumericLimits<u16>::max(), 1, 1, 0, 0, 0, 0);
  399. struct DateTime {
  400. AK::Time time_since_epoch() const
  401. {
  402. // FIXME: This implementation does not take last_weekday, after_weekday, or before_weekday into account.
  403. return AK::Time::from_timestamp(year, month, day, hour, minute, second, 0);
  404. }
  405. u16 year { 0 };
  406. u8 month { 1 };
  407. u8 day { 1 };
  408. u8 last_weekday { 0 };
  409. u8 after_weekday { 0 };
  410. u8 before_weekday { 0 };
  411. u8 hour { 0 };
  412. u8 minute { 0 };
  413. u8 second { 0 };
  414. };
  415. struct TimeZoneOffset {
  416. i64 offset { 0 };
  417. DateTime until {};
  418. bool has_until { false };
  419. i32 dst_rule { -1 };
  420. i64 dst_offset { 0 };
  421. @string_index_type@ standard_format { 0 };
  422. @string_index_type@ daylight_format { 0 };
  423. };
  424. struct DaylightSavingsOffset {
  425. AK::Time time_in_effect(AK::Time time) const
  426. {
  427. auto in_effect = this->in_effect;
  428. in_effect.year = seconds_since_epoch_to_year(time.to_seconds());
  429. return in_effect.time_since_epoch();
  430. }
  431. i64 offset { 0 };
  432. AK::Time year_from {};
  433. AK::Time year_to {};
  434. DateTime in_effect {};
  435. @string_index_type@ format { 0 };
  436. };
  437. )~~~");
  // Emit the de-duplicated string table that the format indices refer to.
  438. time_zone_data.unique_strings.generate(generator);
  // Emits one constexpr Array named `name` holding every element of `offsets`, each written through
  // its AK::Formatter specialization.
  439. auto append_offsets = [&](auto const& name, auto type, auto const& offsets) {
  440. generator.set("name", name);
  441. generator.set("type", type);
  442. generator.set("size", String::number(offsets.size()));
  443. generator.append(R"~~~(
  444. static constexpr Array<@type@, @size@> @name@ { {
  445. )~~~");
  446. for (auto const& offset : offsets)
  447. generator.append(String::formatted(" {},\n", offset));
  448. generator.append("} };\n");
  449. };
  // Per-zone offset arrays, followed by the s_time_zone_offsets mapping over them.
  450. generate_mapping(generator, time_zone_data.time_zone_names, "TimeZoneOffset"sv, "s_time_zone_offsets"sv, "s_time_zone_offsets_{}"sv, format_identifier,
  451. [&](auto const& name, auto const& value) {
  452. auto const& time_zone_offsets = time_zone_data.time_zones.find(value)->value;
  453. append_offsets(name, "TimeZoneOffset"sv, time_zone_offsets);
  454. });
  // Per-rule daylight savings arrays, followed by the s_dst_offsets mapping over them.
  455. generate_mapping(generator, time_zone_data.dst_offset_names, "DaylightSavingsOffset"sv, "s_dst_offsets"sv, "s_dst_offsets_{}"sv, format_identifier,
  456. [&](auto const& name, auto const& value) {
  457. auto const& dst_offsets = time_zone_data.dst_offsets.find(value)->value;
  458. append_offsets(name, "DaylightSavingsOffset"sv, dst_offsets);
  459. });
  // Per-region arrays of string-table indices (the zone names belonging to each region).
  460. generate_mapping(generator, time_zone_data.time_zone_region_names, s_string_index_type, "s_regional_time_zones"sv, "s_regional_time_zones_{}"sv, format_identifier,
  461. [&](auto const& name, auto const& value) {
  462. auto const& time_zones = time_zone_data.time_zone_regions.find(value)->value;
  463. generator.set("name", name);
  464. generator.set("size", String::number(time_zones.size()));
  465. generator.append(R"~~~(
  466. static constexpr Array<@string_index_type@, @size@> @name@ { {)~~~");
  467. bool first = true;
  468. for (auto const& time_zone : time_zones) {
  469. generator.append(first ? " "sv : ", "sv);
  470. generator.append(String::number(time_zone));
  471. first = false;
  472. }
  473. generator.append(" } };");
  474. });
  // One Location per zone name, in time_zone_names order. Zones without parsed coordinates get a
  // default-constructed Location.
  475. generator.set("size", String::number(time_zone_data.time_zone_names.size()));
  476. generator.append(R"~~~(
  477. static constexpr Array<Location, @size@> s_time_zone_locations { {
  478. )~~~");
  479. for (auto const& time_zone : time_zone_data.time_zone_names) {
  480. auto location = time_zone_data.time_zone_coordinates.get(time_zone).value_or({});
  481. generator.append(String::formatted(" {},\n", location));
  482. }
  483. generator.append("} };\n");
  // Emits the <enum>_from_string / <enum>_to_string pair for one enum. The from-string lookup is
  // keyed by a case-insensitive hash of each value and of each alias.
  484. auto append_string_conversions = [&](StringView enum_title, StringView enum_snake, auto const& values, Vector<Alias> const& aliases = {}) {
  485. HashValueMap<String> hashes;
  486. hashes.ensure_capacity(values.size());
  487. auto hash = [](auto const& value) {
  488. return CaseInsensitiveStringViewTraits::hash(value);
  489. };
  490. for (auto const& value : values)
  491. hashes.set(hash(value), format_identifier(enum_title, value));
  492. for (auto const& alias : aliases)
  493. hashes.set(hash(alias.alias), format_identifier(enum_title, alias.alias));
  494. ValueFromStringOptions options {};
  495. options.sensitivity = CaseSensitivity::CaseInsensitive;
  496. generate_value_from_string(generator, "{}_from_string"sv, enum_title, enum_snake, move(hashes), options);
  497. generate_value_to_string(generator, "{}_to_string"sv, enum_title, enum_snake, format_identifier, values);
  498. };
  499. append_string_conversions("TimeZone"sv, "time_zone"sv, time_zone_data.time_zone_names, time_zone_data.time_zone_aliases);
  500. append_string_conversions("DaylightSavingsRule"sv, "daylight_savings_rule"sv, time_zone_data.dst_offset_names);
  501. append_string_conversions("Region"sv, "region"sv, time_zone_data.time_zone_region_names);
  // The remainder of the generated file is fixed text: the lookup functions that operate on the
  // arrays emitted above.
  502. generator.append(R"~~~(
  503. static Array<DaylightSavingsOffset const*, 2> find_dst_offsets(TimeZoneOffset const& time_zone_offset, AK::Time time)
  504. {
  505. auto const& dst_rules = s_dst_offsets[time_zone_offset.dst_rule];
  506. DaylightSavingsOffset const* standard_offset = nullptr;
  507. DaylightSavingsOffset const* daylight_offset = nullptr;
  508. DaylightSavingsOffset const* last_offset = nullptr;
  509. auto preferred_rule = [&](auto* current_offset, auto& new_offset) {
  510. if (!current_offset)
  511. return &new_offset;
  512. auto new_time_in_effect = new_offset.time_in_effect(time);
  513. return (time >= new_time_in_effect) ? &new_offset : current_offset;
  514. };
  515. for (size_t index = 0; (index < dst_rules.size()) && (!standard_offset || !daylight_offset); ++index) {
  516. auto const& dst_rule = dst_rules[index];
  517. if (last_offset == nullptr)
  518. last_offset = &dst_rule;
  519. else if (dst_rule.time_in_effect(dst_rule.year_to) > last_offset->time_in_effect(last_offset->year_to))
  520. last_offset = &dst_rule;
  521. if ((time < dst_rule.year_from) || (time >= dst_rule.year_to))
  522. continue;
  523. if (dst_rule.offset == 0)
  524. standard_offset = preferred_rule(standard_offset, dst_rule);
  525. else
  526. daylight_offset = preferred_rule(daylight_offset, dst_rule);
  527. }
  528. // If there isn't a standard or daylight rule in effect, fall back to the last rule given in the TZDB.
  529. if (!standard_offset) {
  530. VERIFY(last_offset != nullptr);
  531. standard_offset = last_offset;
  532. }
  533. return { standard_offset, daylight_offset ? daylight_offset : standard_offset };
  534. }
  535. static Offset get_active_dst_offset(TimeZoneOffset const& time_zone_offset, AK::Time time)
  536. {
  537. auto offsets = find_dst_offsets(time_zone_offset, time);
  538. if (offsets[0] == offsets[1])
  539. return { offsets[0]->offset, InDST::No };
  540. auto standard_time_in_effect = offsets[0]->time_in_effect(time);
  541. auto daylight_time_in_effect = offsets[1]->time_in_effect(time);
  542. if (daylight_time_in_effect < standard_time_in_effect) {
  543. if ((time < daylight_time_in_effect) || (time >= standard_time_in_effect))
  544. return { offsets[0]->offset, InDST::No };
  545. } else {
  546. if ((time >= standard_time_in_effect) && (time < daylight_time_in_effect))
  547. return { offsets[0]->offset, InDST::No };
  548. }
  549. return { offsets[1]->offset, InDST::Yes };
  550. }
  551. static TimeZoneOffset const& find_time_zone_offset(TimeZone time_zone, AK::Time time)
  552. {
  553. auto const& time_zone_offsets = s_time_zone_offsets[to_underlying(time_zone)];
  554. size_t index = 0;
  555. for (; index < time_zone_offsets.size(); ++index) {
  556. auto const& time_zone_offset = time_zone_offsets[index];
  557. if (!time_zone_offset.has_until || (time_zone_offset.until.time_since_epoch() > time))
  558. break;
  559. }
  560. VERIFY(index < time_zone_offsets.size());
  561. return time_zone_offsets[index];
  562. }
  563. Optional<Offset> get_time_zone_offset(TimeZone time_zone, AK::Time time)
  564. {
  565. auto const& time_zone_offset = find_time_zone_offset(time_zone, time);
  566. Offset dst_offset {};
  567. if (time_zone_offset.dst_rule != -1) {
  568. dst_offset = get_active_dst_offset(time_zone_offset, time);
  569. } else {
  570. auto in_dst = time_zone_offset.dst_offset == 0 ? InDST::No : InDST::Yes;
  571. dst_offset = { time_zone_offset.dst_offset, in_dst };
  572. }
  573. dst_offset.seconds += time_zone_offset.offset;
  574. return dst_offset;
  575. }
  576. Optional<Array<NamedOffset, 2>> get_named_time_zone_offsets(TimeZone time_zone, AK::Time time)
  577. {
  578. auto const& time_zone_offset = find_time_zone_offset(time_zone, time);
  579. Array<NamedOffset, 2> named_offsets;
  580. auto format_name = [](auto format, auto offset) -> String {
  581. if (offset == 0)
  582. return decode_string(format).replace("{}"sv, ""sv, ReplaceMode::FirstOnly);
  583. return String::formatted(decode_string(format), decode_string(offset));
  584. };
  585. auto set_named_offset = [&](auto& named_offset, auto dst_offset, auto in_dst, auto format, auto offset) {
  586. named_offset.seconds = time_zone_offset.offset + dst_offset;
  587. named_offset.in_dst = in_dst;
  588. named_offset.name = format_name(format, offset);
  589. };
  590. if (time_zone_offset.dst_rule != -1) {
  591. auto offsets = find_dst_offsets(time_zone_offset, time);
  592. auto in_dst = offsets[1]->offset == 0 ? InDST::No : InDST::Yes;
  593. set_named_offset(named_offsets[0], offsets[0]->offset, InDST::No, time_zone_offset.standard_format, offsets[0]->format);
  594. set_named_offset(named_offsets[1], offsets[1]->offset, in_dst, time_zone_offset.daylight_format, offsets[1]->format);
  595. } else {
  596. auto in_dst = time_zone_offset.dst_offset == 0 ? InDST::No : InDST::Yes;
  597. set_named_offset(named_offsets[0], time_zone_offset.dst_offset, in_dst, time_zone_offset.standard_format, 0);
  598. set_named_offset(named_offsets[1], time_zone_offset.dst_offset, in_dst, time_zone_offset.daylight_format, 0);
  599. }
  600. return named_offsets;
  601. }
  602. Optional<Location> get_time_zone_location(TimeZone time_zone)
  603. {
  604. auto is_valid_coordinate = [](auto const& coordinate) {
  605. return (coordinate.degrees != 0) || (coordinate.minutes != 0) || (coordinate.seconds != 0);
  606. };
  607. auto const& location = s_time_zone_locations[to_underlying(time_zone)];
  608. if (is_valid_coordinate(location.latitude) && is_valid_coordinate(location.longitude))
  609. return location;
  610. return {};
  611. }
  612. Vector<StringView> time_zones_in_region(StringView region)
  613. {
  614. auto region_value = region_from_string(region);
  615. if (!region_value.has_value())
  616. return {};
  617. auto region_index = to_underlying(*region_value);
  618. auto const& regional_time_zones = s_regional_time_zones[region_index];
  619. Vector<StringView> time_zones;
  620. time_zones.ensure_capacity(regional_time_zones.size());
  621. for (auto time_zone : regional_time_zones)
  622. time_zones.unchecked_append(decode_string(time_zone));
  623. return time_zones;
  624. }
  625. )~~~");
  // Emit all_time_zones from the zone names, then close namespace TimeZone.
  626. generate_available_values(generator, "all_time_zones"sv, time_zone_data.time_zone_names);
  627. generator.append(R"~~~(
  628. }
  629. )~~~");
  630. TRY(file.write(generator.as_string_view().bytes()));
  631. return {};
  632. }
  633. ErrorOr<int> serenity_main(Main::Arguments arguments)
  634. {
  635. StringView generated_header_path;
  636. StringView generated_implementation_path;
  637. StringView time_zone_coordinates_path;
  638. Vector<StringView> time_zone_paths;
  639. Core::ArgsParser args_parser;
  640. args_parser.add_option(generated_header_path, "Path to the time zone data header file to generate", "generated-header-path", 'h', "generated-header-path");
  641. args_parser.add_option(generated_implementation_path, "Path to the time zone data implementation file to generate", "generated-implementation-path", 'c', "generated-implementation-path");
  642. args_parser.add_option(time_zone_coordinates_path, "Path to the time zone data coordinates file", "time-zone-coordinates-path", 'z', "time-zone-coordinates-path");
  643. args_parser.add_positional_argument(time_zone_paths, "Paths to the time zone database files", "time-zone-paths");
  644. args_parser.parse(arguments);
  645. auto generated_header_file = TRY(open_file(generated_header_path, Core::Stream::OpenMode::Write));
  646. auto generated_implementation_file = TRY(open_file(generated_implementation_path, Core::Stream::OpenMode::Write));
  647. auto time_zone_coordinates_file = TRY(open_file(time_zone_coordinates_path, Core::Stream::OpenMode::Read));
  648. TimeZoneData time_zone_data {};
  649. for (auto time_zone_path : time_zone_paths)
  650. TRY(parse_time_zones(time_zone_path, time_zone_data));
  651. TRY(parse_time_zone_coordinates(*time_zone_coordinates_file, time_zone_data));
  652. TRY(generate_time_zone_data_header(*generated_header_file, time_zone_data));
  653. TRY(generate_time_zone_data_implementation(*generated_implementation_file, time_zone_data));
  654. return 0;
  655. }