fontAnalyzer.js 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388
  1. var debug = require('debug')('ylt:fontAnalyzer');
  2. var Q = require('q');
  3. var fontkit = require('fontkit');
  4. var FontAnalyzer = function() {
  // Looks inside a downloaded resource and, when it is flagged as a web font,
  // attaches the font metrics to it as `entry.fontMetrics`.
  //
  // entry: request entry. Reads `weightCheck.bodyBuffer`, `isWebFont` and `url`.
  // charsListOnPage: passed through untouched to getMetricsFromFont.
  //
  // Returns a Q promise that always fulfills with the same `entry` object:
  // entries without a body, entries that are not web fonts and fonts that
  // could not be opened are handed back unchanged (best effort, never rejects
  // because of an unreadable font).
  function analyzeFont(entry, charsListOnPage) {
    if (!entry.weightCheck || !entry.weightCheck.bodyBuffer) {
      // No valid file available
      return Q(entry);
    }

    if (!entry.isWebFont) {
      return Q(entry);
    }

    debug('File %s is a font. Let\'s have a look inside!', entry.url);

    return getMetricsFromFont(entry, charsListOnPage)
      .then(function(fontMetrics) {
        entry.fontMetrics = fontMetrics;
        return entry;
      })
      .fail(function(error) {
        // A font that cannot be parsed is not an error for the caller:
        // log it and carry on without metrics.
        debug('Could not open the font: %s', error);
        return entry;
      });
  }
  // Opens the font stored in `entry.weightCheck.bodyBuffer` with fontkit and
  // collects its metrics: name, glyph count, average glyph complexity,
  // compressed weight, per-range charset information and how many of its
  // characters also appear in `charsListOnPage`.
  //
  // Returns a Q promise fulfilled with the metrics object, or rejected with
  // whatever error was thrown while reading the font.
  function getMetricsFromFont(entry, charsListOnPage) {
    var deferred = Q.defer();

    try {
      var analysisStart = Date.now();
      var font = fontkit.create(entry.weightCheck.bodyBuffer);

      var metrics = {};
      metrics.name = font.fullName || font.postscriptName || font.familyName;
      metrics.numGlyphs = font.numGlyphs;
      metrics.averageGlyphComplexity = getAverageGlyphComplexity(font);
      metrics.compressedWeight = entry.weightCheck.afterCompression || entry.weightCheck.bodySize;
      metrics.unicodeRanges = readUnicodeRanges(font.characterSet, charsListOnPage);

      var wholeCharset = getCharacterSetAsString(font.characterSet);
      metrics.numGlyphsInCommonWithPageContent = countPossiblyUsedGlyphs(wholeCharset, charsListOnPage);

      debug('Font analysis took %dms', Date.now() - analysisStart);

      // Mark fonts that are not used on the page (#224): a font counts as
      // used as soon as one of its ranges shares a character with the page.
      metrics.isUsed = Object.keys(metrics.unicodeRanges).some(function(rangeName) {
        return metrics.unicodeRanges[rangeName].numGlyphsInCommonWithPageContent > 0;
      });

      deferred.resolve(metrics);
    } catch(error) {
      deferred.reject(error);
    }

    return deferred.promise;
  }
  // Reads the number of vector commands (complexity) needed to render glyphs
  // and returns the average, rounded to one decimal. Only the first 100 glyphs
  // are tested, otherwise it would take too long.
  //
  // font: object exposing `numGlyphs` and `getGlyph(index)`; each glyph is
  // read through `path.commands.length`.
  //
  // Returns 0 when there is no glyph to sample.
  function getAverageGlyphComplexity(font) {
    var sampleSize = Math.min(font.numGlyphs, 100);

    // Without this guard an empty font (or a missing numGlyphs) would end in
    // a division by zero / NaN and the metric would come out as NaN.
    if (!(sampleSize > 0)) {
      return 0;
    }

    var totalPathsCommands = 0;
    for (var i = 0; i < sampleSize; i++) {
      totalPathsCommands += font.getGlyph(i).path.commands.length;
    }

    return Math.round(totalPathsCommands / sampleSize * 10) / 10;
  }
  // Groups the code points of a font by unicode range and, for each range,
  // estimates how much of it the font covers and how many of its characters
  // appear on the page.
  //
  // charsetInFont: collection of numeric code points (anything with forEach).
  // charsListOnPage: string of characters found on the page.
  //
  // Returns an object keyed by range name. Each value is a copy of the range
  // returned by getUnicodeRangeFromChar, extended with:
  //   - charset: string made of the font's characters in that range
  //   - numGlyphsInCommonWithPageContent: result of countPossiblyUsedGlyphs
  //   - coverage: share of the range present in the font, capped at 1
  //     (not set for the catch-all 'Others' range, which has no bounds)
  //
  // String.fromCodePoint throws a RangeError on a value that is not a valid
  // code point.
  function readUnicodeRanges(charsetInFont, charsListOnPage) {
    var ranges = {};

    // Assign a range to each char found in the font
    charsetInFont.forEach(function(char) {
      var currentRange = getUnicodeRangeFromChar(char);
      var currentRangeName = currentRange.name;

      if (!ranges[currentRangeName]) {
        // Cloning the object, so that the shared range definition is never mutated
        ranges[currentRangeName] = Object.assign({}, currentRange);
      }

      if (!ranges[currentRangeName].charset) {
        ranges[currentRangeName].charset = '';
      }

      // fromCodePoint, not fromCharCode: the latter keeps only the low 16 bits,
      // which turns characters above U+FFFF into unrelated ones (U+10041 -> "A").
      ranges[currentRangeName].charset += String.fromCodePoint(char);
    });

    Object.keys(ranges).forEach(function(rangeName) {
      var range = ranges[rangeName];

      // Estimate if range is used, based on the characters found in the page
      range.numGlyphsInCommonWithPageContent = countPossiblyUsedGlyphs(range.charset, charsListOnPage);

      // Calculate coverage
      if (rangeName !== 'Others') {
        var expectedLength = range.rangeEnd - range.rangeStart + 1;
        var actualLength = range.charset.length;
        range.coverage = Math.min(actualLength / expectedLength, 1);
      }
    });

    return ranges;
  }
  // Counts how many characters of the page are available in the font.
  //
  // charsetInFont: string made of the characters the font provides.
  // charsListOnPage: string of characters found on the page; every occurrence
  // is counted, so a character listed twice counts twice.
  //
  // Both strings are walked by code point (Array.from on a string), so a
  // character above U+FFFF counts once and never matches on half a surrogate
  // pair.
  function countPossiblyUsedGlyphs(charsetInFont, charsListOnPage) {
    // One Set lookup per page character instead of scanning the charset each time
    var fontChars = new Set(Array.from(charsetInFont));

    return Array.from(charsListOnPage).reduce(function(count, char) {
      return fontChars.has(char) ? count + 1 : count;
    }, 0);
  }
  // Builds a string containing every character of the given character set.
  //
  // characterSet: collection of numeric code points (anything with forEach).
  //
  // Uses String.fromCodePoint so that code points above U+FFFF are kept as
  // they are; String.fromCharCode would keep only their low 16 bits and emit
  // an unrelated character. fromCodePoint throws a RangeError on a value that
  // is not a valid code point.
  function getCharacterSetAsString(characterSet) {
    var chars = [];

    characterSet.forEach(function(codePoint) {
      chars.push(String.fromCodePoint(codePoint));
    });

    return chars.join('');
  }
  // Finds the entry of UNICODE_RANGES whose [rangeStart, rangeEnd] interval
  // contains the given code point. The entry itself is returned (not a copy).
  // Code points outside of every listed range get a fresh {name: 'Others'}.
  function getUnicodeRangeFromChar(char) {
    for (var i = 0; i < UNICODE_RANGES.length; i++) {
      var candidate = UNICODE_RANGES[i];

      if (candidate.rangeStart <= char && char <= candidate.rangeEnd) {
        return candidate;
      }
    }

    return {name: 'Others'};
  }
  // Named code point ranges used to classify the characters of a font.
  // Each row is [name, first code point, last code point] (bounds inclusive)
  // and is expanded into a {name, rangeStart, rangeEnd} object.
  // Code points that fall in none of these ranges are reported as 'Others'
  // by getUnicodeRangeFromChar.
  var UNICODE_RANGES = [
    ['Basic Latin', 0x0020, 0x007F],
    ['Latin-1 Supplement', 0x00A0, 0x00FF],
    ['Latin Extended', 0x0100, 0x024F],
    ['IPA Extensions', 0x0250, 0x02AF],
    ['Greek and Coptic', 0x0370, 0x03FF],
    ['Cyrillic', 0x0400, 0x052F],
    ['Armenian', 0x0530, 0x058F],
    ['Hebrew', 0x0590, 0x05FF],
    ['Arabic', 0x0600, 0x06FF],
    ['Syriac', 0x0700, 0x074F],
    ['Thaana', 0x0780, 0x07BF],
    ['Devanagari', 0x0900, 0x097F],
    ['Bengali', 0x0980, 0x09FF],
    ['Gurmukhi', 0x0A00, 0x0A7F],
    ['Gujarati', 0x0A80, 0x0AFF],
    ['Oriya', 0x0B00, 0x0B7F],
    ['Tamil', 0x0B80, 0x0BFF],
    ['Telugu', 0x0C00, 0x0C7F],
    ['Kannada', 0x0C80, 0x0CFF],
    ['Malayalam', 0x0D00, 0x0D7F],
    ['Sinhala', 0x0D80, 0x0DFF],
    ['Thai', 0x0E00, 0x0E7F],
    ['Lao', 0x0E80, 0x0EFF],
    ['Tibetan', 0x0F00, 0x0FFF],
    ['Myanmar', 0x1000, 0x109F],
    ['Georgian', 0x10A0, 0x10FF],
    ['Hangul Jamo', 0x1100, 0x11FF],
    ['Ethiopic', 0x1200, 0x137F],
    ['Cherokee', 0x13A0, 0x13FF],
    ['Unified Canadian Aboriginal Syllabics', 0x1400, 0x167F],
    ['Ogham', 0x1680, 0x169F],
    ['Runic', 0x16A0, 0x16FF],
    ['Tagalog', 0x1700, 0x171F],
    ['Hanunoo', 0x1720, 0x173F],
    ['Buhid', 0x1740, 0x175F],
    ['Tagbanwa', 0x1760, 0x177F],
    ['Khmer', 0x1780, 0x17FF],
    ['Mongolian', 0x1800, 0x18AF],
    ['Limbu', 0x1900, 0x194F],
    ['Tai Le', 0x1950, 0x197F],
    ['Hiragana', 0x3040, 0x309F],
    ['Katakana', 0x30A0, 0x30FF],
    ['Bopomofo', 0x3100, 0x312F]
  ].map(function(row) {
    return {name: row[0], rangeStart: row[1], rangeEnd: row[2]};
  });
  339. return {
  340. analyzeFont: analyzeFont,
  341. getMetricsFromFont: getMetricsFromFont,
  342. readUnicodeRanges: readUnicodeRanges,
  343. getAverageGlyphComplexity: getAverageGlyphComplexity,
  344. countPossiblyUsedGlyphs: countPossiblyUsedGlyphs,
  345. getCharacterSetAsString: getCharacterSetAsString,
  346. getUnicodeRangeFromChar: getUnicodeRangeFromChar
  347. };
  348. };
  349. module.exports = new FontAnalyzer();