GeneratorUtil.h 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460
  1. /*
  2. * Copyright (c) 2021, Tim Flynn <trflynn89@pm.me>
  3. *
  4. * SPDX-License-Identifier: BSD-2-Clause
  5. */
  6. #pragma once
  7. #include <AK/Format.h>
  8. #include <AK/HashFunctions.h>
  9. #include <AK/HashMap.h>
  10. #include <AK/LexicalPath.h>
  11. #include <AK/Optional.h>
  12. #include <AK/QuickSort.h>
  13. #include <AK/SourceGenerator.h>
  14. #include <AK/String.h>
  15. #include <AK/StringView.h>
  16. #include <AK/Traits.h>
  17. #include <AK/Vector.h>
  18. #include <LibCore/DirIterator.h>
  19. #include <LibCore/File.h>
  20. #include <LibUnicode/Locale.h>
  21. template<class T>
  22. inline constexpr bool StorageTypeIsList = false;
  23. template<class T>
  24. inline constexpr bool StorageTypeIsList<Vector<T>> = true;
  25. template<typename T>
  26. concept IntegralOrEnum = Integral<T> || Enum<T>;
  27. template<IntegralOrEnum T>
  28. struct AK::Traits<Vector<T>> : public GenericTraits<Vector<T>> {
  29. static unsigned hash(Vector<T> const& list)
  30. {
  31. auto hash = int_hash(static_cast<u32>(list.size()));
  32. for (auto value : list) {
  33. if constexpr (Enum<T>)
  34. hash = pair_int_hash(hash, to_underlying(value));
  35. else
  36. hash = pair_int_hash(hash, value);
  37. }
  38. return hash;
  39. }
  40. };
  41. template<typename StorageType, typename IndexType>
  42. class UniqueStorage {
  43. public:
  44. IndexType ensure(StorageType value)
  45. {
  46. // We maintain a set of unique values in two structures: a vector which stores the values in
  47. // the order they are added, and a hash map which maps that value to its index in the vector.
  48. // The vector is to ensure the values are generated in an easily known order, and the map is
  49. // to allow quickly deciding if a value is actually unique (otherwise, we'd have to linearly
  50. // search the vector for each value).
  51. //
  52. // Also note that index 0 will be reserved for the default-initialized value, so the index
  53. // returned from this method is actually the real index in the vector + 1.
  54. if (auto index = m_storage_indices.get(value); index.has_value())
  55. return *index;
  56. m_storage.append(move(value));
  57. size_t index = m_storage.size();
  58. VERIFY(index < NumericLimits<IndexType>::max());
  59. auto storage_index = static_cast<IndexType>(index);
  60. m_storage_indices.set(m_storage.last(), storage_index);
  61. return storage_index;
  62. }
  63. StorageType const& get(IndexType index) const
  64. {
  65. if (index == 0) {
  66. static StorageType empty {};
  67. return empty;
  68. }
  69. VERIFY(index <= m_storage.size());
  70. return m_storage.at(index - 1);
  71. }
  72. void generate(SourceGenerator& generator, StringView type, StringView name, size_t max_values_per_row) requires(!StorageTypeIsList<StorageType>)
  73. {
  74. generator.set("type"sv, type);
  75. generator.set("name"sv, name);
  76. generator.set("size"sv, String::number(m_storage.size()));
  77. generator.append(R"~~~(
  78. static constexpr Array<@type@, @size@ + 1> @name@ { {
  79. {})~~~");
  80. size_t values_in_current_row = 1;
  81. for (auto const& value : m_storage) {
  82. if (values_in_current_row++ > 0)
  83. generator.append(", ");
  84. if constexpr (IsSame<StorageType, String>)
  85. generator.append(String::formatted("\"{}\"sv", value));
  86. else
  87. generator.append(String::formatted("{}", value));
  88. if (values_in_current_row == max_values_per_row) {
  89. values_in_current_row = 0;
  90. generator.append(",\n ");
  91. }
  92. }
  93. generator.append(R"~~~(
  94. } };
  95. )~~~");
  96. }
  97. void generate(SourceGenerator& generator, StringView type, StringView name) requires(StorageTypeIsList<StorageType>)
  98. {
  99. generator.set("type"sv, type);
  100. generator.set("name"sv, name);
  101. for (size_t i = 0; i < m_storage.size(); ++i) {
  102. auto const& list = m_storage[i];
  103. generator.set("index"sv, String::number(i));
  104. generator.set("size"sv, String::number(list.size()));
  105. generator.append(R"~~~(
  106. static constexpr Array<@type@, @size@> @name@@index@ { {)~~~");
  107. bool first = true;
  108. for (auto const& value : list) {
  109. generator.append(first ? " " : ", ");
  110. generator.append(String::formatted("{}", value));
  111. first = false;
  112. }
  113. generator.append(" } };");
  114. }
  115. generator.set("size"sv, String::number(m_storage.size()));
  116. generator.append(R"~~~(
  117. static constexpr Array<Span<@type@ const>, @size@ + 1> @name@ { {
  118. {})~~~");
  119. constexpr size_t max_values_per_row = 10;
  120. size_t values_in_current_row = 1;
  121. for (size_t i = 0; i < m_storage.size(); ++i) {
  122. if (values_in_current_row++ > 0)
  123. generator.append(", ");
  124. generator.set("index"sv, String::number(i));
  125. generator.append("@name@@index@.span()");
  126. if (values_in_current_row == max_values_per_row) {
  127. values_in_current_row = 0;
  128. generator.append(",\n ");
  129. }
  130. }
  131. generator.append(R"~~~(
  132. } };
  133. )~~~");
  134. }
  135. // clang-format off
  136. // clang-format gets confused by the requires() clauses above, and formats this section very weirdly.
  137. private:
  138. Vector<StorageType> m_storage;
  139. HashMap<StorageType, IndexType> m_storage_indices;
  140. // clang-format on
  141. };
  142. template<typename StringIndexType>
  143. class UniqueStringStorage : public UniqueStorage<String, StringIndexType> {
  144. using Base = UniqueStorage<String, StringIndexType>;
  145. public:
  146. void generate(SourceGenerator& generator)
  147. {
  148. Base::generate(generator, "StringView"sv, "s_string_list"sv, 40);
  149. }
  150. };
  151. struct Alias {
  152. String name;
  153. String alias;
  154. };
  155. template<typename StringIndexType>
  156. struct CanonicalLanguageID {
  157. static ErrorOr<CanonicalLanguageID> parse(UniqueStringStorage<StringIndexType>& unique_strings, StringView language)
  158. {
  159. CanonicalLanguageID language_id {};
  160. auto segments = language.split_view('-');
  161. VERIFY(!segments.is_empty());
  162. size_t index = 0;
  163. if (Unicode::is_unicode_language_subtag(segments[index])) {
  164. language_id.language = unique_strings.ensure(segments[index]);
  165. if (segments.size() == ++index)
  166. return language_id;
  167. } else {
  168. return Error::from_string_literal("Expected language subtag"sv);
  169. }
  170. if (Unicode::is_unicode_script_subtag(segments[index])) {
  171. language_id.script = unique_strings.ensure(segments[index]);
  172. if (segments.size() == ++index)
  173. return language_id;
  174. }
  175. if (Unicode::is_unicode_region_subtag(segments[index])) {
  176. language_id.region = unique_strings.ensure(segments[index]);
  177. if (segments.size() == ++index)
  178. return language_id;
  179. }
  180. while (index < segments.size()) {
  181. if (!Unicode::is_unicode_variant_subtag(segments[index]))
  182. return Error::from_string_literal("Expected variant subtag"sv);
  183. language_id.variants.append(unique_strings.ensure(segments[index++]));
  184. }
  185. return language_id;
  186. }
  187. StringIndexType language { 0 };
  188. StringIndexType script { 0 };
  189. StringIndexType region { 0 };
  190. Vector<StringIndexType> variants {};
  191. };
  192. inline ErrorOr<Core::DirIterator> path_to_dir_iterator(String path, StringView subpath = "main"sv)
  193. {
  194. LexicalPath lexical_path(move(path));
  195. if (!subpath.is_empty())
  196. lexical_path = lexical_path.append(subpath);
  197. Core::DirIterator iterator(lexical_path.string(), Core::DirIterator::SkipParentAndBaseDir);
  198. if (iterator.has_error())
  199. return Error::from_string_literal(iterator.error_string());
  200. return iterator;
  201. }
  202. inline ErrorOr<String> next_path_from_dir_iterator(Core::DirIterator& iterator)
  203. {
  204. auto next_path = iterator.next_full_path();
  205. if (iterator.has_error())
  206. return Error::from_string_literal(iterator.error_string());
  207. return next_path;
  208. }
  209. inline void ensure_from_string_types_are_generated(SourceGenerator& generator)
  210. {
  211. static bool generated_from_string_types = false;
  212. if (generated_from_string_types)
  213. return;
  214. generator.append(R"~~~(
  215. template <typename ValueType>
  216. struct HashValuePair {
  217. unsigned hash { 0 };
  218. ValueType value {};
  219. };
  220. template <typename ValueType>
  221. struct HashValueComparator
  222. {
  223. constexpr int operator()(unsigned hash, HashValuePair<ValueType> const& pair)
  224. {
  225. if (hash > pair.hash)
  226. return 1;
  227. if (hash < pair.hash)
  228. return -1;
  229. return 0;
  230. }
  231. };
  232. )~~~");
  233. generated_from_string_types = true;
  234. }
  235. template<typename ValueType>
  236. using HashValueMap = HashMap<unsigned, ValueType>;
  237. struct ValueFromStringOptions {
  238. Optional<StringView> return_type {};
  239. StringView return_format { "{}"sv };
  240. CaseSensitivity sensitivity { CaseSensitivity::CaseSensitive };
  241. };
  242. template<typename ValueType>
  243. void generate_value_from_string(SourceGenerator& generator, StringView method_name_format, StringView value_type, StringView value_name, HashValueMap<ValueType> hashes, ValueFromStringOptions options = {})
  244. {
  245. ensure_from_string_types_are_generated(generator);
  246. generator.set("method_name", String::formatted(method_name_format, value_name));
  247. generator.set("value_type", value_type);
  248. generator.set("value_name", value_name);
  249. generator.set("return_type", options.return_type.has_value() ? *options.return_type : value_type);
  250. generator.set("size", String::number(hashes.size()));
  251. generator.append(R"~~~(
  252. Optional<@return_type@> @method_name@(StringView key)
  253. {
  254. constexpr Array<HashValuePair<@value_type@>, @size@> hash_pairs { {
  255. )~~~");
  256. auto hash_keys = hashes.keys();
  257. quick_sort(hash_keys);
  258. constexpr size_t max_values_per_row = 10;
  259. size_t values_in_current_row = 0;
  260. for (auto hash_key : hash_keys) {
  261. if (values_in_current_row++ > 0)
  262. generator.append(" ");
  263. if constexpr (IsIntegral<ValueType>)
  264. generator.set("value"sv, String::number(hashes.get(hash_key).value()));
  265. else
  266. generator.set("value"sv, String::formatted("{}::{}", value_type, hashes.get(hash_key).value()));
  267. generator.set("hash"sv, String::number(hash_key));
  268. generator.append("{ @hash@U, @value@ },"sv);
  269. if (values_in_current_row == max_values_per_row) {
  270. generator.append("\n ");
  271. values_in_current_row = 0;
  272. }
  273. }
  274. generator.set("return_statement", String::formatted(options.return_format, "value->value"sv));
  275. generator.append(R"~~~(
  276. } };
  277. )~~~");
  278. if (options.sensitivity == CaseSensitivity::CaseSensitive) {
  279. generator.append(R"~~~(
  280. auto hash = key.hash();
  281. )~~~");
  282. } else {
  283. generator.append(R"~~~(
  284. auto hash = CaseInsensitiveStringViewTraits::hash(key);
  285. )~~~");
  286. }
  287. generator.append(R"~~~(
  288. if (auto const* value = binary_search(hash_pairs, hash, nullptr, HashValueComparator<@value_type@> {}))
  289. return @return_statement@;
  290. return {};
  291. }
  292. )~~~");
  293. }
  294. template<typename IdentifierFormatter>
  295. void generate_enum(SourceGenerator& generator, IdentifierFormatter&& format_identifier, StringView name, StringView default_, Vector<String>& values, Vector<Alias> aliases = {})
  296. {
  297. quick_sort(values, [](auto const& value1, auto const& value2) { return value1.to_lowercase() < value2.to_lowercase(); });
  298. quick_sort(aliases, [](auto const& alias1, auto const& alias2) { return alias1.alias.to_lowercase() < alias2.alias.to_lowercase(); });
  299. generator.set("name", name);
  300. generator.set("underlying", ((values.size() + !default_.is_empty()) < 256) ? "u8"sv : "u16"sv);
  301. generator.append(R"~~~(
  302. enum class @name@ : @underlying@ {)~~~");
  303. if (!default_.is_empty()) {
  304. generator.set("default", default_);
  305. generator.append(R"~~~(
  306. @default@,)~~~");
  307. }
  308. for (auto const& value : values) {
  309. generator.set("value", format_identifier(name, value));
  310. generator.append(R"~~~(
  311. @value@,)~~~");
  312. }
  313. for (auto const& alias : aliases) {
  314. generator.set("alias", format_identifier(name, alias.alias));
  315. generator.set("value", format_identifier(name, alias.name));
  316. generator.append(R"~~~(
  317. @alias@ = @value@,)~~~");
  318. }
  319. generator.append(R"~~~(
  320. };
  321. )~~~");
  322. }
  323. template<typename LocalesType, typename IdentifierFormatter, typename ListFormatter>
  324. void generate_mapping(SourceGenerator& generator, LocalesType const& locales, StringView type, StringView name, StringView format, IdentifierFormatter&& format_identifier, ListFormatter&& format_list)
  325. {
  326. auto format_mapping_name = [&](StringView format, StringView name) {
  327. String mapping_name;
  328. if constexpr (IsNullPointer<IdentifierFormatter>)
  329. mapping_name = name.replace("-"sv, "_"sv, true);
  330. else
  331. mapping_name = format_identifier(type, name);
  332. return String::formatted(format, mapping_name.to_lowercase());
  333. };
  334. Vector<String> mapping_names;
  335. for (auto const& locale : locales) {
  336. String mapping_name;
  337. if constexpr (requires { locale.key; }) {
  338. mapping_name = format_mapping_name(format, locale.key);
  339. format_list(mapping_name, locale.value);
  340. } else {
  341. mapping_name = format_mapping_name(format, locale);
  342. format_list(mapping_name, locale);
  343. }
  344. mapping_names.append(move(mapping_name));
  345. }
  346. quick_sort(mapping_names);
  347. generator.set("type", type);
  348. generator.set("name", name);
  349. generator.set("size", String::number(locales.size()));
  350. generator.append(R"~~~(
  351. static constexpr Array<Span<@type@ const>, @size@> @name@ { {
  352. )~~~");
  353. constexpr size_t max_values_per_row = 10;
  354. size_t values_in_current_row = 0;
  355. for (auto& mapping_name : mapping_names) {
  356. if (values_in_current_row++ > 0)
  357. generator.append(" ");
  358. generator.set("name", move(mapping_name));
  359. generator.append("@name@.span(),");
  360. if (values_in_current_row == max_values_per_row) {
  361. values_in_current_row = 0;
  362. generator.append("\n ");
  363. }
  364. }
  365. generator.append(R"~~~(
  366. } };
  367. )~~~");
  368. }