unicode_data.cmake 7.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140
  1. option(ENABLE_UNICODE_DATABASE_DOWNLOAD "Enable download of Unicode UCD files at build time" ON)
  2. set(UNICODE_DATA_URL https://www.unicode.org/Public/13.0.0/ucd/UnicodeData.txt)
  3. set(UNICODE_DATA_PATH ${CMAKE_BINARY_DIR}/UCD/UnicodeData.txt)
  4. set(SPECIAL_CASING_URL https://www.unicode.org/Public/13.0.0/ucd/SpecialCasing.txt)
  5. set(SPECIAL_CASING_PATH ${CMAKE_BINARY_DIR}/UCD/SpecialCasing.txt)
  6. set(DERIVED_GENERAL_CATEGORY_URL https://www.unicode.org/Public/13.0.0/ucd/extracted/DerivedGeneralCategory.txt)
  7. set(DERIVED_GENERAL_CATEGORY_PATH ${CMAKE_BINARY_DIR}/UCD/DerivedGeneralCategory.txt)
  8. set(PROP_LIST_URL https://www.unicode.org/Public/13.0.0/ucd/PropList.txt)
  9. set(PROP_LIST_PATH ${CMAKE_BINARY_DIR}/UCD/PropList.txt)
  10. set(DERIVED_CORE_PROP_URL https://www.unicode.org/Public/13.0.0/ucd/DerivedCoreProperties.txt)
  11. set(DERIVED_CORE_PROP_PATH ${CMAKE_BINARY_DIR}/UCD/DerivedCoreProperties.txt)
  12. set(DERIVED_BINARY_PROP_URL https://www.unicode.org/Public/13.0.0/ucd/extracted/DerivedBinaryProperties.txt)
  13. set(DERIVED_BINARY_PROP_PATH ${CMAKE_BINARY_DIR}/UCD/DerivedBinaryProperties.txt)
  14. set(PROP_ALIAS_URL https://www.unicode.org/Public/13.0.0/ucd/PropertyAliases.txt)
  15. set(PROP_ALIAS_PATH ${CMAKE_BINARY_DIR}/UCD/PropertyAliases.txt)
  16. set(PROP_VALUE_ALIAS_URL https://www.unicode.org/Public/13.0.0/ucd/PropertyValueAliases.txt)
  17. set(PROP_VALUE_ALIAS_PATH ${CMAKE_BINARY_DIR}/UCD/PropertyValueAliases.txt)
  18. set(SCRIPTS_URL https://www.unicode.org/Public/13.0.0/ucd/Scripts.txt)
  19. set(SCRIPTS_PATH ${CMAKE_BINARY_DIR}/UCD/Scripts.txt)
  20. set(SCRIPT_EXTENSIONS_URL https://www.unicode.org/Public/13.0.0/ucd/ScriptExtensions.txt)
  21. set(SCRIPT_EXTENSIONS_PATH ${CMAKE_BINARY_DIR}/UCD/ScriptExtensions.txt)
  22. set(EMOJI_DATA_URL https://www.unicode.org/Public/13.0.0/ucd/emoji/emoji-data.txt)
  23. set(EMOJI_DATA_PATH ${CMAKE_BINARY_DIR}/UCD/emoji-data.txt)
  24. set(NORM_PROPS_URL https://www.unicode.org/Public/13.0.0/ucd/DerivedNormalizationProps.txt)
  25. set(NORM_PROPS_PATH ${CMAKE_BINARY_DIR}/UCD/DerivedNormalizationProps.txt)
  26. set(CLDR_PATH ${CMAKE_BINARY_DIR}/CLDR)
  27. set(CLDR_ZIP_URL https://github.com/unicode-org/cldr-json/releases/download/39.0.0/cldr-39.0.0-json-modern.zip)
  28. set(CLDR_ZIP_PATH ${CLDR_PATH}/cldr.zip)
  29. set(CLDR_LOCALES_SOURCE cldr-localenames-modern)
  30. set(CLDR_LOCALES_PATH ${CLDR_PATH}/${CLDR_LOCALES_SOURCE})
  31. if (ENABLE_UNICODE_DATABASE_DOWNLOAD)
  32. if (NOT EXISTS ${UNICODE_DATA_PATH})
  33. message(STATUS "Downloading UCD UnicodeData.txt from ${UNICODE_DATA_URL}...")
  34. file(DOWNLOAD ${UNICODE_DATA_URL} ${UNICODE_DATA_PATH} INACTIVITY_TIMEOUT 10)
  35. endif()
  36. if (NOT EXISTS ${SPECIAL_CASING_PATH})
  37. message(STATUS "Downloading UCD SpecialCasing.txt from ${SPECIAL_CASING_URL}...")
  38. file(DOWNLOAD ${SPECIAL_CASING_URL} ${SPECIAL_CASING_PATH} INACTIVITY_TIMEOUT 10)
  39. endif()
  40. if (NOT EXISTS ${DERIVED_GENERAL_CATEGORY_PATH})
  41. message(STATUS "Downloading UCD DerivedGeneralCategory.txt from ${DERIVED_GENERAL_CATEGORY_URL}...")
  42. file(DOWNLOAD ${DERIVED_GENERAL_CATEGORY_URL} ${DERIVED_GENERAL_CATEGORY_PATH} INACTIVITY_TIMEOUT 10)
  43. endif()
  44. if (NOT EXISTS ${PROP_LIST_PATH})
  45. message(STATUS "Downloading UCD PropList.txt from ${PROP_LIST_URL}...")
  46. file(DOWNLOAD ${PROP_LIST_URL} ${PROP_LIST_PATH} INACTIVITY_TIMEOUT 10)
  47. endif()
  48. if (NOT EXISTS ${DERIVED_CORE_PROP_PATH})
  49. message(STATUS "Downloading UCD DerivedCoreProperties.txt from ${DERIVED_CORE_PROP_URL}...")
  50. file(DOWNLOAD ${DERIVED_CORE_PROP_URL} ${DERIVED_CORE_PROP_PATH} INACTIVITY_TIMEOUT 10)
  51. endif()
  52. if (NOT EXISTS ${DERIVED_BINARY_PROP_PATH})
  53. message(STATUS "Downloading UCD DerivedBinaryProperties.txt from ${DERIVED_BINARY_PROP_URL}...")
  54. file(DOWNLOAD ${DERIVED_BINARY_PROP_URL} ${DERIVED_BINARY_PROP_PATH} INACTIVITY_TIMEOUT 10)
  55. endif()
  56. if (NOT EXISTS ${PROP_ALIAS_PATH})
  57. message(STATUS "Downloading UCD PropertyAliases.txt from ${PROP_ALIAS_URL}...")
  58. file(DOWNLOAD ${PROP_ALIAS_URL} ${PROP_ALIAS_PATH} INACTIVITY_TIMEOUT 10)
  59. endif()
  60. if (NOT EXISTS ${PROP_VALUE_ALIAS_PATH})
  61. message(STATUS "Downloading UCD PropertyValueAliases.txt from ${PROP_VALUE_ALIAS_URL}...")
  62. file(DOWNLOAD ${PROP_VALUE_ALIAS_URL} ${PROP_VALUE_ALIAS_PATH} INACTIVITY_TIMEOUT 10)
  63. endif()
  64. if (NOT EXISTS ${SCRIPTS_PATH})
  65. message(STATUS "Downloading UCD Scripts.txt from ${SCRIPTS_URL}...")
  66. file(DOWNLOAD ${SCRIPTS_URL} ${SCRIPTS_PATH} INACTIVITY_TIMEOUT 10)
  67. endif()
  68. if (NOT EXISTS ${SCRIPT_EXTENSIONS_PATH})
  69. message(STATUS "Downloading UCD ScriptExtensions.txt from ${SCRIPT_EXTENSIONS_URL}...")
  70. file(DOWNLOAD ${SCRIPT_EXTENSIONS_URL} ${SCRIPT_EXTENSIONS_PATH} INACTIVITY_TIMEOUT 10)
  71. endif()
  72. if (NOT EXISTS ${EMOJI_DATA_PATH})
  73. message(STATUS "Downloading UCD emoji-data.txt from ${EMOJI_DATA_URL}...")
  74. file(DOWNLOAD ${EMOJI_DATA_URL} ${EMOJI_DATA_PATH} INACTIVITY_TIMEOUT 10)
  75. endif()
  76. if (NOT EXISTS ${NORM_PROPS_PATH})
  77. message(STATUS "Downloading UCD DerivedNormalizationProps.txt from ${NORM_PROPS_URL}...")
  78. file(DOWNLOAD ${NORM_PROPS_URL} ${NORM_PROPS_PATH} INACTIVITY_TIMEOUT 10)
  79. endif()
  80. if (NOT EXISTS ${CLDR_ZIP_PATH})
  81. message(STATUS "Downloading CLDR database from ${CLDR_ZIP_URL}...")
  82. file(DOWNLOAD ${CLDR_ZIP_URL} ${CLDR_ZIP_PATH} INACTIVITY_TIMEOUT 10)
  83. endif()
  84. if(EXISTS ${CLDR_ZIP_PATH} AND NOT EXISTS ${CLDR_LOCALES_PATH})
  85. message(STATUS "Extracting CLDR ${CLDR_LOCALES_SOURCE} from ${CLDR_ZIP_PATH}...")
  86. execute_process(COMMAND unzip -q ${CLDR_ZIP_PATH} "${CLDR_LOCALES_SOURCE}/*" -d ${CLDR_PATH} RESULT_VARIABLE unzip_result)
  87. if (NOT unzip_result EQUAL 0)
  88. message(FATAL_ERROR "Failed to unzip ${CLDR_ZIP_PATH} with status ${unzip_result}")
  89. endif()
  90. endif()
  91. set(UNICODE_DATA_HEADER LibUnicode/UnicodeData.h)
  92. set(UNICODE_DATA_IMPLEMENTATION LibUnicode/UnicodeData.cpp)
  93. set(UNICODE_LOCALE_HEADER LibUnicode/UnicodeLocale.h)
  94. set(UNICODE_LOCALE_IMPLEMENTATION LibUnicode/UnicodeLocale.cpp)
  95. if (CMAKE_CURRENT_BINARY_DIR MATCHES ".*/LibUnicode") # Serenity build.
  96. set(UNICODE_DATA_HEADER UnicodeData.h)
  97. set(UNICODE_DATA_IMPLEMENTATION UnicodeData.cpp)
  98. set(UNICODE_LOCALE_HEADER UnicodeLocale.h)
  99. set(UNICODE_LOCALE_IMPLEMENTATION UnicodeLocale.cpp)
  100. endif()
  101. add_custom_command(
  102. OUTPUT ${UNICODE_DATA_HEADER} ${UNICODE_DATA_IMPLEMENTATION}
  103. COMMAND $<TARGET_FILE:GenerateUnicodeData> -h ${UNICODE_DATA_HEADER} -c ${UNICODE_DATA_IMPLEMENTATION} -u ${UNICODE_DATA_PATH} -s ${SPECIAL_CASING_PATH} -g ${DERIVED_GENERAL_CATEGORY_PATH} -p ${PROP_LIST_PATH} -d ${DERIVED_CORE_PROP_PATH} -b ${DERIVED_BINARY_PROP_PATH} -a ${PROP_ALIAS_PATH} -v ${PROP_VALUE_ALIAS_PATH} -r ${SCRIPTS_PATH} -x ${SCRIPT_EXTENSIONS_PATH} -e ${EMOJI_DATA_PATH} -n ${NORM_PROPS_PATH}
  104. VERBATIM
  105. DEPENDS GenerateUnicodeData ${UNICODE_DATA_PATH} ${SPECIAL_CASING_PATH} ${DERIVED_GENERAL_CATEGORY_PATH} ${PROP_LIST_PATH} ${DERIVED_CORE_PROP_PATH} ${DERIVED_BINARY_PROP_PATH} ${PROP_ALIAS_PATH} ${PROP_VALUE_ALIAS_PATH} ${SCRIPTS_PATH} ${SCRIPT_EXTENSIONS_PATH} ${EMOJI_DATA_PATH} ${NORM_PROPS_PATH}
  106. )
  107. add_custom_command(
  108. OUTPUT ${UNICODE_LOCALE_HEADER} ${UNICODE_LOCALE_IMPLEMENTATION}
  109. COMMAND $<TARGET_FILE:GenerateUnicodeLocale> -h ${UNICODE_LOCALE_HEADER} -c ${UNICODE_LOCALE_IMPLEMENTATION} -l ${CLDR_LOCALES_PATH}
  110. VERBATIM
  111. DEPENDS GenerateUnicodeLocale ${CLDR_LOCALES_PATH}
  112. )
  113. set(UNICODE_DATA_SOURCES ${UNICODE_DATA_HEADER} ${UNICODE_DATA_IMPLEMENTATION} ${UNICODE_LOCALE_HEADER} ${UNICODE_LOCALE_IMPLEMENTATION})
  114. add_compile_definitions(ENABLE_UNICODE_DATA=1)
  115. else()
  116. add_compile_definitions(ENABLE_UNICODE_DATA=0)
  117. endif()