i18n.php 63 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538
  1. <?php
  2. /**
  3. * i18n.php
  4. *
  5. * Copyright (c) 1999-2003 The SquirrelMail Project Team
  6. * Licensed under the GNU GPL. For full terms see the file COPYING.
  7. *
  8. * This file contains variuos functions that are needed to do
  9. * internationalization of SquirrelMail.
  10. *
  11. * Internally the output character set is used. Other characters are
  12. * encoded using Unicode entities according to HTML 4.0.
  13. *
  14. * $Id$
  15. */
  16. /* Decodes a string to the internal encoding from the given charset */
  17. function charset_decode ($charset, $string) {
  18. global $languages, $squirrelmail_language;
  19. if (isset($languages[$squirrelmail_language]['XTRA_CODE']) &&
  20. function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) {
  21. $string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string);
  22. }
  23. /* All HTML special characters are 7 bit and can be replaced first */
  24. $string = htmlspecialchars ($string);
  25. $charset = strtolower($charset);
  26. set_my_charset() ;
  27. if (ereg('iso-8859-([[:digit:]]+)', $charset, $res)) {
  28. if ($res[1] == '1') {
  29. $ret = charset_decode_iso_8859_1 ($string);
  30. } else if ($res[1] == '2') {
  31. $ret = charset_decode_iso_8859_2 ($string);
  32. } else if ($res[1] == '4') {
  33. $ret = charset_decode_iso_8859_4 ($string);
  34. } else if ($res[1] == '5') {
  35. $ret = charset_decode_iso_8859_5 ($string);
  36. } else if ($res[1] == '7') {
  37. $ret = charset_decode_iso_8859_7 ($string);
  38. } else if ($res[1] == '9') {
  39. $ret = charset_decode_iso_8859_9 ($string);
  40. } else if ($res[1] == '13') {
  41. $ret = charset_decode_iso_8859_13 ($string);
  42. } else if ($res[1] == '15') {
  43. $ret = charset_decode_iso_8859_15 ($string);
  44. } else {
  45. $ret = charset_decode_iso_8859_default ($string);
  46. }
  47. } else if ($charset == 'ns_4551-1') {
  48. $ret = charset_decode_ns_4551_1 ($string);
  49. } else if ($charset == 'koi8-r') {
  50. $ret = charset_decode_koi8r ($string);
  51. } else if ($charset == 'windows-1251') {
  52. $ret = charset_decode_windows_1251 ($string);
  53. } else if ($charset == 'windows-1253') {
  54. $ret = charset_decode_windows_1253 ($string);
  55. } else if ($charset == 'windows-1254') {
  56. $ret = charset_decode_windows_1254 ($string);
  57. } else if ($charset == 'windows-1257') {
  58. $ret = charset_decode_windows_1257 ($string);
  59. } else if ($charset == 'utf-8') {
  60. $ret = charset_decode_utf8 ($string);
  61. } else {
  62. $ret = $string;
  63. }
  64. return( $ret );
  65. }
  66. /*
  67. iso-8859-1 is the same as Latin 1 and is normally used
  68. in western europe.
  69. */
  70. function charset_decode_iso_8859_1 ($string) {
  71. global $default_charset;
  72. if (strtolower($default_charset) <> 'iso-8859-1') {
  73. /* Only do the slow convert if there are 8-bit characters */
  74. if (ereg("[\200-\377]", $string)) {
  75. $string = str_replace("\201", '&#129;', $string);
  76. $string = str_replace("\202", '&#130;', $string);
  77. $string = str_replace("\203", '&#131;', $string);
  78. $string = str_replace("\204", '&#132;', $string);
  79. $string = str_replace("\205", '&#133;', $string);
  80. $string = str_replace("\206", '&#134;', $string);
  81. $string = str_replace("\207", '&#135;', $string);
  82. $string = str_replace("\210", '&#136;', $string);
  83. $string = str_replace("\211", '&#137;', $string);
  84. $string = str_replace("\212", '&#138;', $string);
  85. $string = str_replace("\213", '&#139;', $string);
  86. $string = str_replace("\214", '&#140;', $string);
  87. $string = str_replace("\215", '&#141;', $string);
  88. $string = str_replace("\216", '&#142;', $string);
  89. $string = str_replace("\217", '&#143;', $string);
  90. $string = str_replace("\220", '&#144;', $string);
  91. $string = str_replace("\221", '&#145;', $string);
  92. $string = str_replace("\222", '&#146;', $string);
  93. $string = str_replace("\223", '&#147;', $string);
  94. $string = str_replace("\224", '&#148;', $string);
  95. $string = str_replace("\225", '&#149;', $string);
  96. $string = str_replace("\226", '&#150;', $string);
  97. $string = str_replace("\227", '&#151;', $string);
  98. $string = str_replace("\230", '&#152;', $string);
  99. $string = str_replace("\231", '&#153;', $string);
  100. $string = str_replace("\232", '&#154;', $string);
  101. $string = str_replace("\233", '&#155;', $string);
  102. $string = str_replace("\234", '&#156;', $string);
  103. $string = str_replace("\235", '&#157;', $string);
  104. $string = str_replace("\236", '&#158;', $string);
  105. $string = str_replace("\237", '&#159;', $string);
  106. $string = str_replace("\240", '&#160;', $string);
  107. $string = str_replace("\241", '&#161;', $string);
  108. $string = str_replace("\242", '&#162;', $string);
  109. $string = str_replace("\243", '&#163;', $string);
  110. $string = str_replace("\244", '&#164;', $string);
  111. $string = str_replace("\245", '&#165;', $string);
  112. $string = str_replace("\246", '&#166;', $string);
  113. $string = str_replace("\247", '&#167;', $string);
  114. $string = str_replace("\250", '&#168;', $string);
  115. $string = str_replace("\251", '&#169;', $string);
  116. $string = str_replace("\252", '&#170;', $string);
  117. $string = str_replace("\253", '&#171;', $string);
  118. $string = str_replace("\254", '&#172;', $string);
  119. $string = str_replace("\255", '&#173;', $string);
  120. $string = str_replace("\256", '&#174;', $string);
  121. $string = str_replace("\257", '&#175;', $string);
  122. $string = str_replace("\260", '&#176;', $string);
  123. $string = str_replace("\261", '&#177;', $string);
  124. $string = str_replace("\262", '&#178;', $string);
  125. $string = str_replace("\263", '&#179;', $string);
  126. $string = str_replace("\264", '&#180;', $string);
  127. $string = str_replace("\265", '&#181;', $string);
  128. $string = str_replace("\266", '&#182;', $string);
  129. $string = str_replace("\267", '&#183;', $string);
  130. $string = str_replace("\270", '&#184;', $string);
  131. $string = str_replace("\271", '&#185;', $string);
  132. $string = str_replace("\272", '&#186;', $string);
  133. $string = str_replace("\273", '&#187;', $string);
  134. $string = str_replace("\274", '&#188;', $string);
  135. $string = str_replace("\275", '&#189;', $string);
  136. $string = str_replace("\276", '&#190;', $string);
  137. $string = str_replace("\277", '&#191;', $string);
  138. $string = str_replace("\300", '&#192;', $string);
  139. $string = str_replace("\301", '&#193;', $string);
  140. $string = str_replace("\302", '&#194;', $string);
  141. $string = str_replace("\303", '&#195;', $string);
  142. $string = str_replace("\304", '&#196;', $string);
  143. $string = str_replace("\305", '&#197;', $string);
  144. $string = str_replace("\306", '&#198;', $string);
  145. $string = str_replace("\307", '&#199;', $string);
  146. $string = str_replace("\310", '&#200;', $string);
  147. $string = str_replace("\311", '&#201;', $string);
  148. $string = str_replace("\312", '&#202;', $string);
  149. $string = str_replace("\313", '&#203;', $string);
  150. $string = str_replace("\314", '&#204;', $string);
  151. $string = str_replace("\315", '&#205;', $string);
  152. $string = str_replace("\316", '&#206;', $string);
  153. $string = str_replace("\317", '&#207;', $string);
  154. $string = str_replace("\320", '&#208;', $string);
  155. $string = str_replace("\321", '&#209;', $string);
  156. $string = str_replace("\322", '&#210;', $string);
  157. $string = str_replace("\323", '&#211;', $string);
  158. $string = str_replace("\324", '&#212;', $string);
  159. $string = str_replace("\325", '&#213;', $string);
  160. $string = str_replace("\326", '&#214;', $string);
  161. $string = str_replace("\327", '&#215;', $string);
  162. $string = str_replace("\330", '&#216;', $string);
  163. $string = str_replace("\331", '&#217;', $string);
  164. $string = str_replace("\332", '&#218;', $string);
  165. $string = str_replace("\333", '&#219;', $string);
  166. $string = str_replace("\334", '&#220;', $string);
  167. $string = str_replace("\335", '&#221;', $string);
  168. $string = str_replace("\336", '&#222;', $string);
  169. $string = str_replace("\337", '&#223;', $string);
  170. $string = str_replace("\340", '&#224;', $string);
  171. $string = str_replace("\341", '&#225;', $string);
  172. $string = str_replace("\342", '&#226;', $string);
  173. $string = str_replace("\343", '&#227;', $string);
  174. $string = str_replace("\344", '&#228;', $string);
  175. $string = str_replace("\345", '&#229;', $string);
  176. $string = str_replace("\346", '&#230;', $string);
  177. $string = str_replace("\347", '&#231;', $string);
  178. $string = str_replace("\350", '&#232;', $string);
  179. $string = str_replace("\351", '&#233;', $string);
  180. $string = str_replace("\352", '&#234;', $string);
  181. $string = str_replace("\353", '&#235;', $string);
  182. $string = str_replace("\354", '&#236;', $string);
  183. $string = str_replace("\355", '&#237;', $string);
  184. $string = str_replace("\356", '&#238;', $string);
  185. $string = str_replace("\357", '&#239;', $string);
  186. $string = str_replace("\360", '&#240;', $string);
  187. $string = str_replace("\361", '&#241;', $string);
  188. $string = str_replace("\362", '&#242;', $string);
  189. $string = str_replace("\363", '&#243;', $string);
  190. $string = str_replace("\364", '&#244;', $string);
  191. $string = str_replace("\365", '&#245;', $string);
  192. $string = str_replace("\366", '&#246;', $string);
  193. $string = str_replace("\367", '&#247;', $string);
  194. $string = str_replace("\370", '&#248;', $string);
  195. $string = str_replace("\371", '&#249;', $string);
  196. $string = str_replace("\372", '&#250;', $string);
  197. $string = str_replace("\373", '&#251;', $string);
  198. $string = str_replace("\374", '&#252;', $string);
  199. $string = str_replace("\375", '&#253;', $string);
  200. $string = str_replace("\376", '&#254;', $string);
  201. $string = str_replace("\377", '&#255;', $string);
  202. }
  203. }
  204. return ($string);
  205. }
  206. /* iso-8859-2 is used for some eastern European languages */
  207. function charset_decode_iso_8859_2 ($string) {
  208. global $default_charset;
  209. if (strtolower($default_charset) == 'iso-8859-2')
  210. return $string;
  211. /* Only do the slow convert if there are 8-bit characters */
  212. if (! ereg("[\200-\377]", $string))
  213. return $string;
  214. /* NO-BREAK SPACE */
  215. $string = str_replace("\240", '&#160;', $string);
  216. /* LATIN CAPITAL LETTER A WITH OGONEK */
  217. $string = str_replace("\241", '&#260;', $string);
  218. /* BREVE */
  219. $string = str_replace("\242", '&#728;', $string);
  220. // LATIN CAPITAL LETTER L WITH STROKE
  221. $string = str_replace("\243", '&#321;', $string);
  222. // CURRENCY SIGN
  223. $string = str_replace("\244", '&#164;', $string);
  224. // LATIN CAPITAL LETTER L WITH CARON
  225. $string = str_replace("\245", '&#317;', $string);
  226. // LATIN CAPITAL LETTER S WITH ACUTE
  227. $string = str_replace("\246", '&#346;', $string);
  228. // SECTION SIGN
  229. $string = str_replace("\247", '&#167;', $string);
  230. // DIAERESIS
  231. $string = str_replace("\250", '&#168;', $string);
  232. // LATIN CAPITAL LETTER S WITH CARON
  233. $string = str_replace("\251", '&#352;', $string);
  234. // LATIN CAPITAL LETTER S WITH CEDILLA
  235. $string = str_replace("\252", '&#350;', $string);
  236. // LATIN CAPITAL LETTER T WITH CARON
  237. $string = str_replace("\253", '&#356;', $string);
  238. // LATIN CAPITAL LETTER Z WITH ACUTE
  239. $string = str_replace("\254", '&#377;', $string);
  240. // SOFT HYPHEN
  241. $string = str_replace("\255", '&#173;', $string);
  242. // LATIN CAPITAL LETTER Z WITH CARON
  243. $string = str_replace("\256", '&#381;', $string);
  244. // LATIN CAPITAL LETTER Z WITH DOT ABOVE
  245. $string = str_replace("\257", '&#379;', $string);
  246. // DEGREE SIGN
  247. $string = str_replace("\260", '&#176;', $string);
  248. // LATIN SMALL LETTER A WITH OGONEK
  249. $string = str_replace("\261", '&#261;', $string);
  250. // OGONEK
  251. $string = str_replace("\262", '&#731;', $string);
  252. // LATIN SMALL LETTER L WITH STROKE
  253. $string = str_replace("\263", '&#322;', $string);
  254. // ACUTE ACCENT
  255. $string = str_replace("\264", '&#180;', $string);
  256. // LATIN SMALL LETTER L WITH CARON
  257. $string = str_replace("\265", '&#318;', $string);
  258. // LATIN SMALL LETTER S WITH ACUTE
  259. $string = str_replace("\266", '&#347;', $string);
  260. // CARON
  261. $string = str_replace("\267", '&#711;', $string);
  262. // CEDILLA
  263. $string = str_replace("\270", '&#184;', $string);
  264. // LATIN SMALL LETTER S WITH CARON
  265. $string = str_replace("\271", '&#353;', $string);
  266. // LATIN SMALL LETTER S WITH CEDILLA
  267. $string = str_replace("\272", '&#351;', $string);
  268. // LATIN SMALL LETTER T WITH CARON
  269. $string = str_replace("\273", '&#357;', $string);
  270. // LATIN SMALL LETTER Z WITH ACUTE
  271. $string = str_replace("\274", '&#378;', $string);
  272. // DOUBLE ACUTE ACCENT
  273. $string = str_replace("\275", '&#733;', $string);
  274. // LATIN SMALL LETTER Z WITH CARON
  275. $string = str_replace("\276", '&#382;', $string);
  276. // LATIN SMALL LETTER Z WITH DOT ABOVE
  277. $string = str_replace("\277", '&#380;', $string);
  278. // LATIN CAPITAL LETTER R WITH ACUTE
  279. $string = str_replace("\300", '&#340;', $string);
  280. // LATIN CAPITAL LETTER A WITH ACUTE
  281. $string = str_replace("\301", '&#193;', $string);
  282. // LATIN CAPITAL LETTER A WITH CIRCUMFLEX
  283. $string = str_replace("\302", '&#194;', $string);
  284. // LATIN CAPITAL LETTER A WITH BREVE
  285. $string = str_replace("\303", '&#258;', $string);
  286. // LATIN CAPITAL LETTER A WITH DIAERESIS
  287. $string = str_replace("\304", '&#196;', $string);
  288. // LATIN CAPITAL LETTER L WITH ACUTE
  289. $string = str_replace("\305", '&#313;', $string);
  290. // LATIN CAPITAL LETTER C WITH ACUTE
  291. $string = str_replace("\306", '&#262;', $string);
  292. // LATIN CAPITAL LETTER C WITH CEDILLA
  293. $string = str_replace("\307", '&#199;', $string);
  294. // LATIN CAPITAL LETTER C WITH CARON
  295. $string = str_replace("\310", '&#268;', $string);
  296. // LATIN CAPITAL LETTER E WITH ACUTE
  297. $string = str_replace("\311", '&#201;', $string);
  298. // LATIN CAPITAL LETTER E WITH OGONEK
  299. $string = str_replace("\312", '&#280;', $string);
  300. // LATIN CAPITAL LETTER E WITH DIAERESIS
  301. $string = str_replace("\313", '&#203;', $string);
  302. // LATIN CAPITAL LETTER E WITH CARON
  303. $string = str_replace("\314", '&#282;', $string);
  304. // LATIN CAPITAL LETTER I WITH ACUTE
  305. $string = str_replace("\315", '&#205;', $string);
  306. // LATIN CAPITAL LETTER I WITH CIRCUMFLEX
  307. $string = str_replace("\316", '&#206;', $string);
  308. // LATIN CAPITAL LETTER D WITH CARON
  309. $string = str_replace("\317", '&#270;', $string);
  310. // LATIN CAPITAL LETTER D WITH STROKE
  311. $string = str_replace("\320", '&#272;', $string);
  312. // LATIN CAPITAL LETTER N WITH ACUTE
  313. $string = str_replace("\321", '&#323;', $string);
  314. // LATIN CAPITAL LETTER N WITH CARON
  315. $string = str_replace("\322", '&#327;', $string);
  316. // LATIN CAPITAL LETTER O WITH ACUTE
  317. $string = str_replace("\323", '&#211;', $string);
  318. // LATIN CAPITAL LETTER O WITH CIRCUMFLEX
  319. $string = str_replace("\324", '&#212;', $string);
  320. // LATIN CAPITAL LETTER O WITH DOUBLE ACUTE
  321. $string = str_replace("\325", '&#336;', $string);
  322. // LATIN CAPITAL LETTER O WITH DIAERESIS
  323. $string = str_replace("\326", '&#214;', $string);
  324. // MULTIPLICATION SIGN
  325. $string = str_replace("\327", '&#215;', $string);
  326. // LATIN CAPITAL LETTER R WITH CARON
  327. $string = str_replace("\330", '&#344;', $string);
  328. // LATIN CAPITAL LETTER U WITH RING ABOVE
  329. $string = str_replace("\331", '&#366;', $string);
  330. // LATIN CAPITAL LETTER U WITH ACUTE
  331. $string = str_replace("\332", '&#218;', $string);
  332. // LATIN CAPITAL LETTER U WITH DOUBLE ACUTE
  333. $string = str_replace("\333", '&#368;', $string);
  334. // LATIN CAPITAL LETTER U WITH DIAERESIS
  335. $string = str_replace("\334", '&#220;', $string);
  336. // LATIN CAPITAL LETTER Y WITH ACUTE
  337. $string = str_replace("\335", '&#221;', $string);
  338. // LATIN CAPITAL LETTER T WITH CEDILLA
  339. $string = str_replace("\336", '&#354;', $string);
  340. // LATIN SMALL LETTER SHARP S
  341. $string = str_replace("\337", '&#223;', $string);
  342. // LATIN SMALL LETTER R WITH ACUTE
  343. $string = str_replace("\340", '&#341;', $string);
  344. // LATIN SMALL LETTER A WITH ACUTE
  345. $string = str_replace("\341", '&#225;', $string);
  346. // LATIN SMALL LETTER A WITH CIRCUMFLEX
  347. $string = str_replace("\342", '&#226;', $string);
  348. // LATIN SMALL LETTER A WITH BREVE
  349. $string = str_replace("\343", '&#259;', $string);
  350. // LATIN SMALL LETTER A WITH DIAERESIS
  351. $string = str_replace("\344", '&#228;', $string);
  352. // LATIN SMALL LETTER L WITH ACUTE
  353. $string = str_replace("\345", '&#314;', $string);
  354. // LATIN SMALL LETTER C WITH ACUTE
  355. $string = str_replace("\346", '&#263;', $string);
  356. // LATIN SMALL LETTER C WITH CEDILLA
  357. $string = str_replace("\347", '&#231;', $string);
  358. // LATIN SMALL LETTER C WITH CARON
  359. $string = str_replace("\350", '&#269;', $string);
  360. // LATIN SMALL LETTER E WITH ACUTE
  361. $string = str_replace("\351", '&#233;', $string);
  362. // LATIN SMALL LETTER E WITH OGONEK
  363. $string = str_replace("\352", '&#281;', $string);
  364. // LATIN SMALL LETTER E WITH DIAERESIS
  365. $string = str_replace("\353", '&#235;', $string);
  366. // LATIN SMALL LETTER E WITH CARON
  367. $string = str_replace("\354", '&#283;', $string);
  368. // LATIN SMALL LETTER I WITH ACUTE
  369. $string = str_replace("\355", '&#237;', $string);
  370. // LATIN SMALL LETTER I WITH CIRCUMFLEX
  371. $string = str_replace("\356", '&#238;', $string);
  372. // LATIN SMALL LETTER D WITH CARON
  373. $string = str_replace("\357", '&#271;', $string);
  374. // LATIN SMALL LETTER D WITH STROKE
  375. $string = str_replace("\360", '&#273;', $string);
  376. // LATIN SMALL LETTER N WITH ACUTE
  377. $string = str_replace("\361", '&#324;', $string);
  378. // LATIN SMALL LETTER N WITH CARON
  379. $string = str_replace("\362", '&#328;', $string);
  380. // LATIN SMALL LETTER O WITH ACUTE
  381. $string = str_replace("\363", '&#243;', $string);
  382. // LATIN SMALL LETTER O WITH CIRCUMFLEX
  383. $string = str_replace("\364", '&#244;', $string);
  384. // LATIN SMALL LETTER O WITH DOUBLE ACUTE
  385. $string = str_replace("\365", '&#337;', $string);
  386. // LATIN SMALL LETTER O WITH DIAERESIS
  387. $string = str_replace("\366", '&#246;', $string);
  388. // DIVISION SIGN
  389. $string = str_replace("\367", '&#247;', $string);
  390. // LATIN SMALL LETTER R WITH CARON
  391. $string = str_replace("\370", '&#345;', $string);
  392. // LATIN SMALL LETTER U WITH RING ABOVE
  393. $string = str_replace("\371", '&#367;', $string);
  394. // LATIN SMALL LETTER U WITH ACUTE
  395. $string = str_replace("\372", '&#250;', $string);
  396. // LATIN SMALL LETTER U WITH DOUBLE ACUTE
  397. $string = str_replace("\373", '&#369;', $string);
  398. // LATIN SMALL LETTER U WITH DIAERESIS
  399. $string = str_replace("\374", '&#252;', $string);
  400. // LATIN SMALL LETTER Y WITH ACUTE
  401. $string = str_replace("\375", '&#253;', $string);
  402. // LATIN SMALL LETTER T WITH CEDILLA
  403. $string = str_replace("\376", '&#355;', $string);
  404. // DOT ABOVE
  405. $string = str_replace("\377", '&#729;', $string);
  406. return $string;
  407. }
  408. /*
  409. ISO/IEC 8859-4:1998 Latin Alphabet No. 4
  410. */
  411. function charset_decode_iso_8859_4 ($string) {
  412. global $default_charset;
  413. if (strtolower($default_charset) == 'iso-8859-4')
  414. return $string;
  415. /* Only do the slow convert if there are 8-bit characters */
  416. if (! ereg("[\200-\377]", $string))
  417. return $string;
  418. $string = str_replace ("\241", '&#260;', $string);
  419. $string = str_replace ("\242", '&#312;', $string);
  420. $string = str_replace ("\243", '&#342;', $string);
  421. $string = str_replace ("\245", '&#296;', $string);
  422. $string = str_replace ("\246", '&#315;', $string);
  423. $string = str_replace ("\251", '&#352;', $string);
  424. $string = str_replace ("\252", '&#274;', $string);
  425. $string = str_replace ("\253", '&#290;', $string);
  426. $string = str_replace ("\254", '&#358;', $string);
  427. $string = str_replace ("\256", '&#381;', $string);
  428. $string = str_replace ("\261", '&#261;', $string);
  429. $string = str_replace ("\262", '&#731;', $string);
  430. $string = str_replace ("\263", '&#343;', $string);
  431. $string = str_replace ("\265", '&#297;', $string);
  432. $string = str_replace ("\266", '&#316;', $string);
  433. $string = str_replace ("\267", '&#711;', $string);
  434. $string = str_replace ("\271", '&#353;', $string);
  435. $string = str_replace ("\272", '&#275;', $string);
  436. $string = str_replace ("\273", '&#291;', $string);
  437. $string = str_replace ("\274", '&#359;', $string);
  438. $string = str_replace ("\275", '&#330;', $string);
  439. $string = str_replace ("\276", '&#382;', $string);
  440. $string = str_replace ("\277", '&#331;', $string);
  441. $string = str_replace ("\300", '&#256;', $string);
  442. $string = str_replace ("\307", '&#302;', $string);
  443. $string = str_replace ("\310", '&#268;', $string);
  444. $string = str_replace ("\312", '&#280;', $string);
  445. $string = str_replace ("\314", '&#278;', $string);
  446. $string = str_replace ("\317", '&#298;', $string);
  447. $string = str_replace ("\320", '&#272;', $string);
  448. $string = str_replace ("\321", '&#325;', $string);
  449. $string = str_replace ("\322", '&#332;', $string);
  450. $string = str_replace ("\323", '&#310;', $string);
  451. $string = str_replace ("\331", '&#370;', $string);
  452. $string = str_replace ("\335", '&#360;', $string);
  453. $string = str_replace ("\336", '&#362;', $string);
  454. $string = str_replace ("\340", '&#257;', $string);
  455. $string = str_replace ("\347", '&#303;', $string);
  456. $string = str_replace ("\350", '&#269;', $string);
  457. $string = str_replace ("\352", '&#281;', $string);
  458. $string = str_replace ("\354", '&#279;', $string);
  459. $string = str_replace ("\357", '&#299;', $string);
  460. $string = str_replace ("\360", '&#273;', $string);
  461. $string = str_replace ("\361", '&#326;', $string);
  462. $string = str_replace ("\362", '&#333;', $string);
  463. $string = str_replace ("\363", '&#311;', $string);
  464. $string = str_replace ("\371", '&#371;', $string);
  465. $string = str_replace ("\375", '&#361;', $string);
  466. $string = str_replace ("\376", '&#363;', $string);
  467. $string = str_replace ("\377", '&#729;', $string);
  468. // rest of charset is the same as ISO-8859-1
  469. return (charset_decode_iso_8859_1($string));
  470. }
  471. /* iso-8859-7 is Greek. */
  472. function charset_decode_iso_8859_7 ($string) {
  473. global $default_charset;
  474. if (strtolower($default_charset) == 'iso-8859-7') {
  475. return $string;
  476. }
  477. /* Only do the slow convert if there are 8-bit characters */
  478. if (!ereg("[\200-\377]", $string)) {
  479. return $string;
  480. }
  481. /* Some diverse characters in the beginning */
  482. $string = str_replace("\240", '&#160;', $string);
  483. $string = str_replace("\241", '&#8216;', $string);
  484. $string = str_replace("\242", '&#8217;', $string);
  485. $string = str_replace("\243", '&#163;', $string);
  486. $string = str_replace("\246", '&#166;', $string);
  487. $string = str_replace("\247", '&#167;', $string);
  488. $string = str_replace("\250", '&#168;', $string);
  489. $string = str_replace("\251", '&#169;', $string);
  490. $string = str_replace("\253", '&#171;', $string);
  491. $string = str_replace("\254", '&#172;', $string);
  492. $string = str_replace("\255", '&#173;', $string);
  493. $string = str_replace("\257", '&#8213;', $string);
  494. $string = str_replace("\260", '&#176;', $string);
  495. $string = str_replace("\261", '&#177;', $string);
  496. $string = str_replace("\262", '&#178;', $string);
  497. $string = str_replace("\263", '&#179;', $string);
  498. /* Horizontal bar (parentheki pavla) */
  499. $string = str_replace ("\257", '&#8213;', $string);
  500. /*
  501. * ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6)
  502. * These are Unicode 900-902
  503. */
  504. $string = preg_replace("/([\264-\266])/e","'&#' . (ord('\\1')+720);",$string);
  505. /* 11/07 (0xB7) Middle dot is the same in iso-8859-1 */
  506. $string = str_replace("\267", '&#183;', $string);
  507. /*
  508. * ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA)
  509. * These are Unicode 900-902
  510. */
  511. $string = preg_replace("/([\270-\272])/e","'&#' . (ord('\\1')+720);",$string);
  512. /*
  513. * 11/11 (0xBB) Right angle quotation mark is the same as in
  514. * iso-8859-1
  515. */
  516. $string = str_replace("\273", '&#187;', $string);
  517. /* And now the rest of the charset */
  518. $string = preg_replace("/([\274-\376])/e","'&#'.(ord('\\1')+720);",$string);
  519. return $string;
  520. }
  521. /*
  522. ISOIEC 8859-9:1999 Latin Alphabet No. 5
  523. */
  524. function charset_decode_iso_8859_9 ($string) {
  525. global $default_charset;
  526. if (strtolower($default_charset) == 'iso-8859-9')
  527. return $string;
  528. /* Only do the slow convert if there are 8-bit characters */
  529. if (! ereg("[\200-\377]", $string))
  530. return $string;
  531. // latin capital letter g with breve 208->286
  532. $string = str_replace("\320", '&#286;', $string);
  533. // latin capital letter i with dot above 221->304
  534. $string = str_replace("\335", '&#304;', $string);
  535. // latin capital letter s with cedilla 222->350
  536. $string = str_replace("\336", '&#350;', $string);
  537. // latin small letter g with breve 240->287
  538. $string = str_replace("\360", '&#287;', $string);
  539. // latin small letter dotless i 253->305
  540. $string = str_replace("\375", '&#305;', $string);
  541. // latin small letter s with cedilla 254->351
  542. $string = str_replace("\376", '&#351;', $string);
  543. // rest of charset is the same as ISO-8859-1
  544. return (charset_decode_iso_8859_1($string));
  545. }
  546. /*
  547. ISO/IEC 8859-13:1998 Latin Alphabet No. 7 (Baltic Rim)
  548. */
  549. function charset_decode_iso_8859_13 ($string) {
  550. global $default_charset;
  551. if (strtolower($default_charset) == 'iso-8859-13')
  552. return $string;
  553. /* Only do the slow convert if there are 8-bit characters */
  554. if (! ereg("[\200-\377]", $string))
  555. return $string;
  556. $string = str_replace ("\241", '&#8221;', $string);
  557. $string = str_replace ("\245", '&#8222;', $string);
  558. $string = str_replace ("\250", '&#216;', $string);
  559. $string = str_replace ("\252", '&#342;', $string);
  560. $string = str_replace ("\257", '&#198;', $string);
  561. $string = str_replace ("\264", '&#8220;', $string);
  562. $string = str_replace ("\270", '&#248;', $string);
  563. $string = str_replace ("\272", '&#343;', $string);
  564. $string = str_replace ("\277", '&#230;', $string);
  565. $string = str_replace ("\300", '&#260;', $string);
  566. $string = str_replace ("\301", '&#302;', $string);
  567. $string = str_replace ("\302", '&#256;', $string);
  568. $string = str_replace ("\303", '&#262;', $string);
  569. $string = str_replace ("\306", '&#280;', $string);
  570. $string = str_replace ("\307", '&#274;', $string);
  571. $string = str_replace ("\310", '&#268;', $string);
  572. $string = str_replace ("\312", '&#377;', $string);
  573. $string = str_replace ("\313", '&#278;', $string);
  574. $string = str_replace ("\314", '&#290;', $string);
  575. $string = str_replace ("\315", '&#310;', $string);
  576. $string = str_replace ("\316", '&#298;', $string);
  577. $string = str_replace ("\317", '&#315;', $string);
  578. $string = str_replace ("\320", '&#352;', $string);
  579. $string = str_replace ("\321", '&#323;', $string);
  580. $string = str_replace ("\322", '&#325;', $string);
  581. $string = str_replace ("\324", '&#332;', $string);
  582. $string = str_replace ("\330", '&#370;', $string);
  583. $string = str_replace ("\331", '&#321;', $string);
  584. $string = str_replace ("\332", '&#346;', $string);
  585. $string = str_replace ("\333", '&#362;', $string);
  586. $string = str_replace ("\335", '&#379;', $string);
  587. $string = str_replace ("\336", '&#381;', $string);
  588. $string = str_replace ("\340", '&#261;', $string);
  589. $string = str_replace ("\341", '&#303;', $string);
  590. $string = str_replace ("\342", '&#257;', $string);
  591. $string = str_replace ("\343", '&#263;', $string);
  592. $string = str_replace ("\346", '&#281;', $string);
  593. $string = str_replace ("\347", '&#275;', $string);
  594. $string = str_replace ("\350", '&#269;', $string);
  595. $string = str_replace ("\352", '&#378;', $string);
  596. $string = str_replace ("\353", '&#279;', $string);
  597. $string = str_replace ("\354", '&#291;', $string);
  598. $string = str_replace ("\355", '&#311;', $string);
  599. $string = str_replace ("\356", '&#299;', $string);
  600. $string = str_replace ("\357", '&#316;', $string);
  601. $string = str_replace ("\360", '&#353;', $string);
  602. $string = str_replace ("\361", '&#324;', $string);
  603. $string = str_replace ("\362", '&#326;', $string);
  604. $string = str_replace ("\364", '&#333;', $string);
  605. $string = str_replace ("\370", '&#371;', $string);
  606. $string = str_replace ("\371", '&#322;', $string);
  607. $string = str_replace ("\372", '&#347;', $string);
  608. $string = str_replace ("\373", '&#363;', $string);
  609. $string = str_replace ("\375", '&#380;', $string);
  610. $string = str_replace ("\376", '&#382;', $string);
  611. $string = str_replace ("\377", '&#8217;', $string);
  612. // rest of charset is the same as ISO-8859-1
  613. return (charset_decode_iso_8859_1($string));
  614. }
  615. /*
  616. * iso-8859-15 is Latin 9 and has very much the same use as Latin 1
  617. * but has the Euro symbol and some characters needed for French.
  618. */
  619. function charset_decode_iso_8859_15 ($string) {
  620. // Euro sign
  621. $string = str_replace ("\244", '&#8364;', $string);
  622. // Latin capital letter S with caron
  623. $string = str_replace ("\246", '&#352;', $string);
  624. // Latin small letter s with caron
  625. $string = str_replace ("\250", '&#353;', $string);
  626. // Latin capital letter Z with caron
  627. $string = str_replace ("\264", '&#381;', $string);
  628. // Latin small letter z with caron
  629. $string = str_replace ("\270", '&#382;', $string);
  630. // Latin capital ligature OE
  631. $string = str_replace ("\274", '&#338;', $string);
  632. // Latin small ligature oe
  633. $string = str_replace ("\275", '&#339;', $string);
  634. // Latin capital letter Y with diaeresis
  635. $string = str_replace ("\276", '&#376;', $string);
  636. return (charset_decode_iso_8859_1($string));
  637. }
  638. /* ISO-8859-5 is Cyrillic */
  639. function charset_decode_iso_8859_5 ($string) {
  640. // Convert to KOI8-R, then return this decoded.
  641. $string = convert_cyr_string($string, 'i', 'k');
  642. return charset_decode_koi8r($string);
  643. }
  644. /* Remove all 8 bit characters from all other ISO-8859 character sets */
  645. function charset_decode_iso_8859_default ($string) {
  646. return (strtr($string, "\240\241\242\243\244\245\246\247".
  647. "\250\251\252\253\254\255\256\257".
  648. "\260\261\262\263\264\265\266\267".
  649. "\270\271\272\273\274\275\276\277".
  650. "\300\301\302\303\304\305\306\307".
  651. "\310\311\312\313\314\315\316\317".
  652. "\320\321\322\323\324\325\326\327".
  653. "\330\331\332\333\334\335\336\337".
  654. "\340\341\342\343\344\345\346\347".
  655. "\350\351\352\353\354\355\356\357".
  656. "\360\361\362\363\364\365\366\367".
  657. "\370\371\372\373\374\375\376\377",
  658. "????????????????????????????????????????".
  659. "????????????????????????????????????????".
  660. "????????????????????????????????????????".
  661. "????????"));
  662. }
  663. /*
  664. * This is the same as ISO-646-NO and is used by some
  665. * Microsoft programs when sending Norwegian characters
  666. */
  667. function charset_decode_ns_4551_1 ($string) {
  668. /*
  669. * These characters are:
  670. * Latin capital letter AE
  671. * Latin capital letter O with stroke
  672. * Latin capital letter A with ring above
  673. * and the same as small letters
  674. */
  675. return strtr ($string, "[\\]{|}", "ÆØÅæøå");
  676. }
  677. /*
  678. * KOI8-R is used to encode Russian mail (Cyrrilic). Defined in RFC
  679. * 1489.
  680. */
  681. function charset_decode_koi8r ($string) {
  682. global $default_charset;
  683. if ($default_charset == 'koi8-r') {
  684. return $string;
  685. }
  686. /*
  687. * Convert to Unicode HTML entities.
  688. * This code is rather ineffective.
  689. */
  690. $string = str_replace("\200", '&#9472;', $string);
  691. $string = str_replace("\201", '&#9474;', $string);
  692. $string = str_replace("\202", '&#9484;', $string);
  693. $string = str_replace("\203", '&#9488;', $string);
  694. $string = str_replace("\204", '&#9492;', $string);
  695. $string = str_replace("\205", '&#9496;', $string);
  696. $string = str_replace("\206", '&#9500;', $string);
  697. $string = str_replace("\207", '&#9508;', $string);
  698. $string = str_replace("\210", '&#9516;', $string);
  699. $string = str_replace("\211", '&#9524;', $string);
  700. $string = str_replace("\212", '&#9532;', $string);
  701. $string = str_replace("\213", '&#9600;', $string);
  702. $string = str_replace("\214", '&#9604;', $string);
  703. $string = str_replace("\215", '&#9608;', $string);
  704. $string = str_replace("\216", '&#9612;', $string);
  705. $string = str_replace("\217", '&#9616;', $string);
  706. $string = str_replace("\220", '&#9617;', $string);
  707. $string = str_replace("\221", '&#9618;', $string);
  708. $string = str_replace("\222", '&#9619;', $string);
  709. $string = str_replace("\223", '&#8992;', $string);
  710. $string = str_replace("\224", '&#9632;', $string);
  711. $string = str_replace("\225", '&#8729;', $string);
  712. $string = str_replace("\226", '&#8730;', $string);
  713. $string = str_replace("\227", '&#8776;', $string);
  714. $string = str_replace("\230", '&#8804;', $string);
  715. $string = str_replace("\231", '&#8805;', $string);
  716. $string = str_replace("\232", '&#160;', $string);
  717. $string = str_replace("\233", '&#8993;', $string);
  718. $string = str_replace("\234", '&#176;', $string);
  719. $string = str_replace("\235", '&#178;', $string);
  720. $string = str_replace("\236", '&#183;', $string);
  721. $string = str_replace("\237", '&#247;', $string);
  722. $string = str_replace("\240", '&#9552;', $string);
  723. $string = str_replace("\241", '&#9553;', $string);
  724. $string = str_replace("\242", '&#9554;', $string);
  725. $string = str_replace("\243", '&#1105;', $string);
  726. $string = str_replace("\244", '&#9555;', $string);
  727. $string = str_replace("\245", '&#9556;', $string);
  728. $string = str_replace("\246", '&#9557;', $string);
  729. $string = str_replace("\247", '&#9558;', $string);
  730. $string = str_replace("\250", '&#9559;', $string);
  731. $string = str_replace("\251", '&#9560;', $string);
  732. $string = str_replace("\252", '&#9561;', $string);
  733. $string = str_replace("\253", '&#9562;', $string);
  734. $string = str_replace("\254", '&#9563;', $string);
  735. $string = str_replace("\255", '&#9564;', $string);
  736. $string = str_replace("\256", '&#9565;', $string);
  737. $string = str_replace("\257", '&#9566;', $string);
  738. $string = str_replace("\260", '&#9567;', $string);
  739. $string = str_replace("\261", '&#9568;', $string);
  740. $string = str_replace("\262", '&#9569;', $string);
  741. $string = str_replace("\263", '&#1025;', $string);
  742. $string = str_replace("\264", '&#9570;', $string);
  743. $string = str_replace("\265", '&#9571;', $string);
  744. $string = str_replace("\266", '&#9572;', $string);
  745. $string = str_replace("\267", '&#9573;', $string);
  746. $string = str_replace("\270", '&#9574;', $string);
  747. $string = str_replace("\271", '&#9575;', $string);
  748. $string = str_replace("\272", '&#9576;', $string);
  749. $string = str_replace("\273", '&#9577;', $string);
  750. $string = str_replace("\274", '&#9578;', $string);
  751. $string = str_replace("\275", '&#9579;', $string);
  752. $string = str_replace("\276", '&#9580;', $string);
  753. $string = str_replace("\277", '&#169;', $string);
  754. $string = str_replace("\300", '&#1102;', $string);
  755. $string = str_replace("\301", '&#1072;', $string);
  756. $string = str_replace("\302", '&#1073;', $string);
  757. $string = str_replace("\303", '&#1094;', $string);
  758. $string = str_replace("\304", '&#1076;', $string);
  759. $string = str_replace("\305", '&#1077;', $string);
  760. $string = str_replace("\306", '&#1092;', $string);
  761. $string = str_replace("\307", '&#1075;', $string);
  762. $string = str_replace("\310", '&#1093;', $string);
  763. $string = str_replace("\311", '&#1080;', $string);
  764. $string = str_replace("\312", '&#1081;', $string);
  765. $string = str_replace("\313", '&#1082;', $string);
  766. $string = str_replace("\314", '&#1083;', $string);
  767. $string = str_replace("\315", '&#1084;', $string);
  768. $string = str_replace("\316", '&#1085;', $string);
  769. $string = str_replace("\317", '&#1086;', $string);
  770. $string = str_replace("\320", '&#1087;', $string);
  771. $string = str_replace("\321", '&#1103;', $string);
  772. $string = str_replace("\322", '&#1088;', $string);
  773. $string = str_replace("\323", '&#1089;', $string);
  774. $string = str_replace("\324", '&#1090;', $string);
  775. $string = str_replace("\325", '&#1091;', $string);
  776. $string = str_replace("\326", '&#1078;', $string);
  777. $string = str_replace("\327", '&#1074;', $string);
  778. $string = str_replace("\330", '&#1100;', $string);
  779. $string = str_replace("\331", '&#1099;', $string);
  780. $string = str_replace("\332", '&#1079;', $string);
  781. $string = str_replace("\333", '&#1096;', $string);
  782. $string = str_replace("\334", '&#1101;', $string);
  783. $string = str_replace("\335", '&#1097;', $string);
  784. $string = str_replace("\336", '&#1095;', $string);
  785. $string = str_replace("\337", '&#1098;', $string);
  786. $string = str_replace("\340", '&#1070;', $string);
  787. $string = str_replace("\341", '&#1040;', $string);
  788. $string = str_replace("\342", '&#1041;', $string);
  789. $string = str_replace("\343", '&#1062;', $string);
  790. $string = str_replace("\344", '&#1044;', $string);
  791. $string = str_replace("\345", '&#1045;', $string);
  792. $string = str_replace("\346", '&#1060;', $string);
  793. $string = str_replace("\347", '&#1043;', $string);
  794. $string = str_replace("\350", '&#1061;', $string);
  795. $string = str_replace("\351", '&#1048;', $string);
  796. $string = str_replace("\352", '&#1049;', $string);
  797. $string = str_replace("\353", '&#1050;', $string);
  798. $string = str_replace("\354", '&#1051;', $string);
  799. $string = str_replace("\355", '&#1052;', $string);
  800. $string = str_replace("\356", '&#1053;', $string);
  801. $string = str_replace("\357", '&#1054;', $string);
  802. $string = str_replace("\360", '&#1055;', $string);
  803. $string = str_replace("\361", '&#1071;', $string);
  804. $string = str_replace("\362", '&#1056;', $string);
  805. $string = str_replace("\363", '&#1057;', $string);
  806. $string = str_replace("\364", '&#1058;', $string);
  807. $string = str_replace("\365", '&#1059;', $string);
  808. $string = str_replace("\366", '&#1046;', $string);
  809. $string = str_replace("\367", '&#1042;', $string);
  810. $string = str_replace("\370", '&#1068;', $string);
  811. $string = str_replace("\371", '&#1067;', $string);
  812. $string = str_replace("\372", '&#1047;', $string);
  813. $string = str_replace("\373", '&#1064;', $string);
  814. $string = str_replace("\374", '&#1069;', $string);
  815. $string = str_replace("\375", '&#1065;', $string);
  816. $string = str_replace("\376", '&#1063;', $string);
  817. $string = str_replace("\377", '&#1066;', $string);
  818. return $string;
  819. }
  820. /*
  821. windows-1254 (Turks)
  822. */
  823. function charset_decode_windows_1254 ($string) {
  824. global $default_charset;
  825. if (strtolower($default_charset) == 'windows-1254')
  826. return $string;
  827. /* Only do the slow convert if there are 8-bit characters */
  828. if (! ereg("[\200-\377]", $string))
  829. return $string;
  830. // Euro sign 128 -> 8364
  831. $string = str_replace("\200", '&#8364;', $string);
  832. // Single low-9 quotation mark 130 -> 8218
  833. $string = str_replace("\202", '&#8218;', $string);
  834. // latin small letter f with hook 131 -> 402
  835. $string = str_replace("\203", '&#402;', $string);
  836. // Double low-9 quotation mark 132 -> 8222
  837. $string = str_replace("\204", '&#8222;', $string);
  838. // horizontal ellipsis 133 -> 8230
  839. $string = str_replace("\205", '&#8230;', $string);
  840. // dagger 134 -> 8224
  841. $string = str_replace("\206", '&#8224;', $string);
  842. // double dagger 135 -> 8225
  843. $string = str_replace("\207", '&#8225;', $string);
  844. // modifier letter circumflex accent 136->710
  845. $string = str_replace("\210", '&#710;', $string);
  846. // per mille sign 137 -> 8240
  847. $string = str_replace("\211", '&#8240;', $string);
  848. // latin capital letter s with caron 138 -> 352
  849. $string = str_replace("\212", '&#352;', $string);
  850. // single left-pointing angle quotation mark 139 -> 8249
  851. $string = str_replace("\213", '&#8249;', $string);
  852. // latin capital ligature oe 140 -> 338
  853. $string = str_replace("\214", '&#338;', $string);
  854. // left single quotation mark 145 -> 8216
  855. $string = str_replace("\221", '&#8216;', $string);
  856. // right single quotation mark 146 -> 8217
  857. $string = str_replace("\222", '&#8217;', $string);
  858. // left double quotation mark 147 -> 8220
  859. $string = str_replace("\223", '&#8220;', $string);
  860. // right double quotation mark 148 -> 8221
  861. $string = str_replace("\224", '&#8221;', $string);
  862. // bullet 149 -> 8226
  863. $string = str_replace("\225", '&#8226;', $string);
  864. // en dash 150 -> 8211
  865. $string = str_replace("\226", '&#8211;', $string);
  866. // em dash 151 -> 8212
  867. $string = str_replace("\227", '&#8212;', $string);
  868. // small tilde 152 -> 732
  869. $string = str_replace("\230", '&#732;', $string);
  870. // trade mark sign 153 -> 8482
  871. $string = str_replace("\231", '&#8482;', $string);
  872. // latin small letter s with caron 154 -> 353
  873. $string = str_replace("\232", '&#353;', $string);
  874. // single right-pointing angle quotation mark 155 -> 8250
  875. $string = str_replace("\233", '&#8250;', $string);
  876. // latin small ligature oe 156 -> 339
  877. $string = str_replace("\234", '&#339;', $string);
  878. // latin capital letter y with diaresis 159->376
  879. $string = str_replace("\237", '&#376;', $string);
  880. // latin capital letter g with breve 208->286
  881. $string = str_replace("\320", '&#286;', $string);
  882. // latin capital letter i with dot above 221->304
  883. $string = str_replace("\335", '&#304;', $string);
  884. // latin capital letter s with cedilla 222->350
  885. $string = str_replace("\336", '&#350;', $string);
  886. // latin small letter g with breve 240->287
  887. $string = str_replace("\360", '&#287;', $string);
  888. // latin small letter dotless i 253->305
  889. $string = str_replace("\375", '&#305;', $string);
  890. // latin small letter s with cedilla 254->351
  891. $string = str_replace("\376", '&#351;', $string);
  892. // Rest of charset is like iso-8859-1
  893. return (charset_decode_iso_8859_1($string));
  894. }
  895. /*
  896. windows-1253 (Greek)
  897. */
  898. function charset_decode_windows_1253 ($string) {
  899. global $default_charset;
  900. if (strtolower($default_charset) == 'windows-1253')
  901. return $string;
  902. /* Only do the slow convert if there are 8-bit characters */
  903. if (! ereg("[\200-\377]", $string))
  904. return $string;
  905. $string = str_replace("\200", '&#8364;', $string);
  906. $string = str_replace("\202", '&#8218;', $string);
  907. $string = str_replace("\203", '&#402;', $string);
  908. $string = str_replace("\204", '&#8222;', $string);
  909. $string = str_replace("\205", '&#8230;', $string);
  910. $string = str_replace("\206", '&#8224;', $string);
  911. $string = str_replace("\207", '&#8225;', $string);
  912. $string = str_replace("\211", '&#8240;', $string);
  913. $string = str_replace("\213", '&#8249;', $string);
  914. $string = str_replace("\221", '&#8216;', $string);
  915. $string = str_replace("\222", '&#8217;', $string);
  916. $string = str_replace("\223", '&#8220;', $string);
  917. $string = str_replace("\224", '&#8221;', $string);
  918. $string = str_replace("\225", '&#8226;', $string);
  919. $string = str_replace("\226", '&#8211;', $string);
  920. $string = str_replace("\227", '&#8212;', $string);
  921. $string = str_replace("\231", '&#8482;', $string);
  922. $string = str_replace("\233", '&#8250;', $string);
  923. $string = str_replace("\241", '&#901;', $string);
  924. $string = str_replace("\242", '&#902;', $string);
  925. $string = str_replace ("\257", '&#8213;', $string);
  926. $string = str_replace("\264", '&#900;', $string);
  927. $string = str_replace("\270", '&#904;', $string);
  928. $string = str_replace ("\271", '&#905;', $string);
  929. $string = str_replace ("\272", '&#906;', $string);
  930. $string = str_replace ("\274", '&#908;', $string);
  931. // cycle for 190-254 symbols
  932. $string = preg_replace("/([\274-\376])/e","'&#' . (ord('\\1')+720);",$string);
  933. // Rest of charset is like iso-8859-1
  934. return (charset_decode_iso_8859_1($string));
  935. }
  936. /*
  937. windows-1257 (BaltRim)
  938. */
  939. function charset_decode_windows_1257 ($string) {
  940. global $default_charset;
  941. if (strtolower($default_charset) == 'windows-1257')
  942. return $string;
  943. /* Only do the slow convert if there are 8-bit characters */
  944. if (! ereg("[\200-\377]", $string))
  945. return $string;
  946. $string = str_replace("\200", '&#8364;', $string);
  947. $string = str_replace("\202", '&#8218;', $string);
  948. $string = str_replace("\204", '&#8222;', $string);
  949. $string = str_replace("\205", '&#8230;', $string);
  950. $string = str_replace("\206", '&#8224;', $string);
  951. $string = str_replace("\207", '&#8225;', $string);
  952. $string = str_replace("\211", '&#8240;', $string);
  953. $string = str_replace("\213", '&#8249;', $string);
  954. $string = str_replace("\215", '&#168;', $string);
  955. $string = str_replace("\216", '&#711;', $string);
  956. $string = str_replace("\217", '&#184;', $string);
  957. $string = str_replace("\221", '&#8216;', $string);
  958. $string = str_replace("\222", '&#8217;', $string);
  959. $string = str_replace("\223", '&#8220;', $string);
  960. $string = str_replace("\224", '&#8221;', $string);
  961. $string = str_replace("\225", '&#8226;', $string);
  962. $string = str_replace("\226", '&#8211;', $string);
  963. $string = str_replace("\227", '&#8212;', $string);
  964. $string = str_replace("\231", '&#8482;', $string);
  965. $string = str_replace("\233", '&#8250;', $string);
  966. $string = str_replace("\235", '&#175;', $string);
  967. $string = str_replace("\236", '&#731;', $string);
  968. $string = str_replace ("\250", '&#216;', $string);
  969. $string = str_replace ("\252", '&#342;', $string);
  970. $string = str_replace ("\257", '&#198;', $string);
  971. $string = str_replace ("\270", '&#248;', $string);
  972. $string = str_replace ("\272", '&#343;', $string);
  973. $string = str_replace ("\277", '&#230;', $string);
  974. $string = str_replace ("\300", '&#260;', $string);
  975. $string = str_replace ("\301", '&#302;', $string);
  976. $string = str_replace ("\302", '&#256;', $string);
  977. $string = str_replace ("\303", '&#262;', $string);
  978. $string = str_replace ("\306", '&#280;', $string);
  979. $string = str_replace ("\307", '&#274;', $string);
  980. $string = str_replace ("\310", '&#268;', $string);
  981. $string = str_replace ("\312", '&#377;', $string);
  982. $string = str_replace ("\313", '&#278;', $string);
  983. $string = str_replace ("\314", '&#290;', $string);
  984. $string = str_replace ("\315", '&#310;', $string);
  985. $string = str_replace ("\316", '&#298;', $string);
  986. $string = str_replace ("\317", '&#315;', $string);
  987. $string = str_replace ("\320", '&#352;', $string);
  988. $string = str_replace ("\321", '&#323;', $string);
  989. $string = str_replace ("\322", '&#325;', $string);
  990. $string = str_replace ("\324", '&#332;', $string);
  991. $string = str_replace ("\330", '&#370;', $string);
  992. $string = str_replace ("\331", '&#321;', $string);
  993. $string = str_replace ("\332", '&#340;', $string);
  994. $string = str_replace ("\333", '&#362;', $string);
  995. $string = str_replace ("\335", '&#379;', $string);
  996. $string = str_replace ("\336", '&#381;', $string);
  997. $string = str_replace ("\340", '&#261;', $string);
  998. $string = str_replace ("\341", '&#303;', $string);
  999. $string = str_replace ("\342", '&#257;', $string);
  1000. $string = str_replace ("\343", '&#263;', $string);
  1001. $string = str_replace ("\346", '&#281;', $string);
  1002. $string = str_replace ("\347", '&#275;', $string);
  1003. $string = str_replace ("\350", '&#269;', $string);
  1004. $string = str_replace ("\352", '&#378;', $string);
  1005. $string = str_replace ("\353", '&#279;', $string);
  1006. $string = str_replace ("\354", '&#291;', $string);
  1007. $string = str_replace ("\355", '&#311;', $string);
  1008. $string = str_replace ("\356", '&#299;', $string);
  1009. $string = str_replace ("\357", '&#316;', $string);
  1010. $string = str_replace ("\360", '&#353;', $string);
  1011. $string = str_replace ("\361", '&#324;', $string);
  1012. $string = str_replace ("\362", '&#326;', $string);
  1013. $string = str_replace ("\364", '&#333;', $string);
  1014. $string = str_replace ("\370", '&#371;', $string);
  1015. $string = str_replace ("\371", '&#322;', $string);
  1016. $string = str_replace ("\372", '&#347;', $string);
  1017. $string = str_replace ("\373", '&#363;', $string);
  1018. $string = str_replace ("\375", '&#380;', $string);
  1019. $string = str_replace ("\376", '&#382;', $string);
  1020. $string = str_replace ("\377", '&#729;', $string);
  1021. // Rest of charset is like iso-8859-1
  1022. return (charset_decode_iso_8859_1($string));
  1023. }
  1024. /* windows-1251 is Microsoft Cyrillic encoding */
  1025. function charset_decode_windows_1251 ($string) {
  1026. // Convert to KOI8-R, then return this decoded.
  1027. $string = convert_cyr_string($string, 'w', 'k');
  1028. return charset_decode_koi8r($string);
  1029. }
  1030. /*
  1031. * Set up the language to be output
  1032. * if $do_search is true, then scan the browser information
  1033. * for a possible language that we know
  1034. */
  1035. function set_up_language($sm_language, $do_search = false) {
  1036. static $SetupAlready = 0;
  1037. global $use_gettext, $languages,
  1038. $squirrelmail_language, $squirrelmail_default_language,
  1039. $sm_notAlias;
  1040. if ($SetupAlready) {
  1041. return;
  1042. }
  1043. $SetupAlready = TRUE;
  1044. if ($do_search && ! $sm_language && isset($_SERVER['HTTP_ACCEPT_LANGUAGE'])) {
  1045. $sm_language = substr($_SERVER['HTTP_ACCEPT_LANGUAGE'], 0, 2);
  1046. }
  1047. if (!$sm_language && isset($squirrelmail_default_language)) {
  1048. $squirrelmail_language = $squirrelmail_default_language;
  1049. $sm_language = $squirrelmail_default_language;
  1050. }
  1051. $sm_notAlias = $sm_language;
  1052. while (isset($languages[$sm_notAlias]['ALIAS'])) {
  1053. $sm_notAlias = $languages[$sm_notAlias]['ALIAS'];
  1054. }
  1055. if ( isset($sm_language) &&
  1056. $use_gettext &&
  1057. $sm_language != '' &&
  1058. isset($languages[$sm_notAlias]['CHARSET']) ) {
  1059. bindtextdomain( 'squirrelmail', SM_PATH . 'locale/' );
  1060. textdomain( 'squirrelmail' );
  1061. if ( !ini_get('safe_mode') &&
  1062. getenv( 'LC_ALL' ) != $sm_notAlias ) {
  1063. putenv( "LC_ALL=$sm_notAlias" );
  1064. putenv( "LANG=$sm_notAlias" );
  1065. putenv( "LANGUAGE=$sm_notAlias" );
  1066. }
  1067. setlocale(LC_ALL, $sm_notAlias);
  1068. $squirrelmail_language = $sm_notAlias;
  1069. if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) {
  1070. header ('Content-Type: text/html; charset=EUC-JP');
  1071. if (!function_exists('mb_internal_encoding')) {
  1072. echo _("You need to have php4 installed with the multibyte string function enabled (using configure option --with-mbstring).");
  1073. }
  1074. mb_internal_encoding('EUC-JP');
  1075. mb_http_output('pass');
  1076. } else {
  1077. header( 'Content-Type: text/html; charset=' . $languages[$sm_notAlias]['CHARSET'] );
  1078. }
  1079. }
  1080. }
  1081. function set_my_charset(){
  1082. /*
  1083. * There can be a $default_charset setting in the
  1084. * config.php file, but the user may have a different language
  1085. * selected for a user interface. This function checks the
  1086. * language selected by the user and tags the outgoing messages
  1087. * with the appropriate charset corresponding to the language
  1088. * selection. This is "more right" (tm), than just stamping the
  1089. * message blindly with the system-wide $default_charset.
  1090. */
  1091. global $data_dir, $username, $default_charset, $languages, $squirrelmail_default_language;
  1092. $my_language = getPref($data_dir, $username, 'language');
  1093. if (!$my_language) {
  1094. $my_language = $squirrelmail_default_language ;
  1095. }
  1096. while (isset($languages[$my_language]['ALIAS'])) {
  1097. $my_language = $languages[$my_language]['ALIAS'];
  1098. }
  1099. $my_charset = $languages[$my_language]['CHARSET'];
  1100. if ($my_charset) {
  1101. $default_charset = $my_charset;
  1102. }
  1103. }
  1104. /* ------------------------------ main --------------------------- */
  1105. global $squirrelmail_language, $languages, $use_gettext;
  1106. if (! isset($squirrelmail_language)) {
  1107. $squirrelmail_language = '';
  1108. }
  1109. /* This array specifies the available languages. */
  1110. // The glibc locale is ca_ES.
  1111. $languages['ca_ES']['NAME'] = 'Catalan';
  1112. $languages['ca_ES']['CHARSET'] = 'iso-8859-1';
  1113. $languages['ca']['ALIAS'] = 'ca_ES';
  1114. $languages['cs_CZ']['NAME'] = 'Czech';
  1115. $languages['cs_CZ']['CHARSET'] = 'iso-8859-2';
  1116. $languages['cs']['ALIAS'] = 'cs_CZ';
  1117. // Danish locale is da_DK.
  1118. $languages['da_DK']['NAME'] = 'Danish';
  1119. $languages['da_DK']['CHARSET'] = 'iso-8859-1';
  1120. $languages['da']['ALIAS'] = 'da_DK';
  1121. $languages['de_DE']['NAME'] = 'Deutsch';
  1122. $languages['de_DE']['CHARSET'] = 'iso-8859-1';
  1123. $languages['de']['ALIAS'] = 'de_DE';
  1124. // There is no en_EN! There is en_US, en_BR, en_AU, and so forth,
  1125. // but who cares about !US, right? Right? :)
  1126. $languages['el_GR']['NAME'] = 'Greek';
  1127. $languages['el_GR']['CHARSET'] = 'iso-8859-7';
  1128. $languages['el']['ALIAS'] = 'el_GR';
  1129. $languages['en_US']['NAME'] = 'English';
  1130. $languages['en_US']['CHARSET'] = 'iso-8859-1';
  1131. $languages['en']['ALIAS'] = 'en_US';
  1132. $languages['es_ES']['NAME'] = 'Spanish';
  1133. $languages['es_ES']['CHARSET'] = 'iso-8859-1';
  1134. $languages['es']['ALIAS'] = 'es_ES';
  1135. $languages['et_EE']['NAME'] = 'Estonian';
  1136. $languages['et_EE']['CHARSET'] = 'iso-8859-15';
  1137. $languages['et']['ALIAS'] = 'et_EE';
  1138. $languages['fi_FI']['NAME'] = 'Finnish';
  1139. $languages['fi_FI']['CHARSET'] = 'iso-8859-1';
  1140. $languages['fi']['ALIAS'] = 'fi_FI';
  1141. $languages['fr_FR']['NAME'] = 'French';
  1142. $languages['fr_FR']['CHARSET'] = 'iso-8859-1';
  1143. $languages['fr']['ALIAS'] = 'fr_FR';
  1144. $languages['hr_HR']['NAME'] = 'Croatian';
  1145. $languages['hr_HR']['CHARSET'] = 'iso-8859-2';
  1146. $languages['hr']['ALIAS'] = 'hr_HR';
  1147. $languages['hu_HU']['NAME'] = 'Hungarian';
  1148. $languages['hu_HU']['CHARSET'] = 'iso-8859-2';
  1149. $languages['hu']['ALIAS'] = 'hu_HU';
  1150. $languages['id_ID']['NAME'] = 'Indonesian';
  1151. $languages['id_ID']['CHARSET'] = 'iso-8859-1';
  1152. $languages['id']['ALIAS'] = 'id_ID';
  1153. $languages['is_IS']['NAME'] = 'Icelandic';
  1154. $languages['is_IS']['CHARSET'] = 'iso-8859-1';
  1155. $languages['is']['ALIAS'] = 'is_IS';
  1156. $languages['it_IT']['NAME'] = 'Italian';
  1157. $languages['it_IT']['CHARSET'] = 'iso-8859-1';
  1158. $languages['it']['ALIAS'] = 'it_IT';
  1159. $languages['ja_JP']['NAME'] = 'Japanese';
  1160. $languages['ja_JP']['CHARSET'] = 'iso-2022-jp';
  1161. $languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra';
  1162. $languages['ja']['ALIAS'] = 'ja_JP';
  1163. $languages['ko_KR']['NAME'] = 'Korean';
  1164. $languages['ko_KR']['CHARSET'] = 'euc-KR';
  1165. $languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra';
  1166. $languages['ko']['ALIAS'] = 'ko_KR';
  1167. $languages['nl_NL']['NAME'] = 'Dutch';
  1168. $languages['nl_NL']['CHARSET'] = 'iso-8859-1';
  1169. $languages['nl']['ALIAS'] = 'nl_NL';
  1170. $languages['no_NO']['NAME'] = 'Norwegian (Bokm&aring;l)';
  1171. $languages['no_NO']['CHARSET'] = 'iso-8859-1';
  1172. $languages['no']['ALIAS'] = 'no_NO';
  1173. $languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)';
  1174. $languages['nn_NO']['CHARSET'] = 'iso-8859-1';
  1175. $languages['pl_PL']['NAME'] = 'Polish';
  1176. $languages['pl_PL']['CHARSET'] = 'iso-8859-2';
  1177. $languages['pl']['ALIAS'] = 'pl_PL';
  1178. $languages['pt_PT']['NAME'] = 'Portuguese (Portugal)';
  1179. $languages['pt_PT']['CHARSET'] = 'iso-8859-1';
  1180. $languages['pt_BR']['NAME'] = 'Portuguese (Brazil)';
  1181. $languages['pt_BR']['CHARSET'] = 'iso-8859-1';
  1182. $languages['pt']['ALIAS'] = 'pt_PT';
  1183. $languages['ru_RU']['NAME'] = 'Russian';
  1184. $languages['ru_RU']['CHARSET'] = 'koi8-r';
  1185. $languages['ru']['ALIAS'] = 'ru_RU';
  1186. $languages['sr_YU']['NAME'] = 'Serbian';
  1187. $languages['sr_YU']['CHARSET'] = 'iso-8859-2';
  1188. $languages['sr']['ALIAS'] = 'sr_YU';
  1189. $languages['sv_SE']['NAME'] = 'Swedish';
  1190. $languages['sv_SE']['CHARSET'] = 'iso-8859-1';
  1191. $languages['sv']['ALIAS'] = 'sv_SE';
  1192. $languages['tr_TR']['NAME'] = 'Turkish';
  1193. $languages['tr_TR']['CHARSET'] = 'iso-8859-9';
  1194. $languages['tr']['ALIAS'] = 'tr_TR';
  1195. $languages['zh_TW']['NAME'] = 'Chinese Trad';
  1196. $languages['zh_TW']['CHARSET'] = 'big5';
  1197. $languages['tw']['ALIAS'] = 'zh_TW';
  1198. $languages['zh_CN']['NAME'] = 'Chinese Simp';
  1199. $languages['zh_CN']['CHARSET'] = 'gb2312';
  1200. $languages['cn']['ALIAS'] = 'zh_CN';
  1201. $languages['sk_SK']['NAME'] = 'Slovak';
  1202. $languages['sk_SK']['CHARSET'] = 'iso-8859-2';
  1203. $languages['sk']['ALIAS'] = 'sk_SK';
  1204. $languages['ro_RO']['NAME'] = 'Romanian';
  1205. $languages['ro_RO']['CHARSET'] = 'iso-8859-2';
  1206. $languages['ro']['ALIAS'] = 'ro_RO';
  1207. $languages['th_TH']['NAME'] = 'Thai';
  1208. $languages['th_TH']['CHARSET'] = 'tis-620';
  1209. $languages['th']['ALIAS'] = 'th_TH';
  1210. $languages['lt_LT']['NAME'] = 'Lithuanian';
  1211. $languages['lt_LT']['CHARSET'] = 'windows-1257';
  1212. $languages['lt']['ALIAS'] = 'lt_LT';
  1213. $languages['sl_SI']['NAME'] = 'Slovenian';
  1214. $languages['sl_SI']['CHARSET'] = 'iso-8859-2';
  1215. $languages['sl']['ALIAS'] = 'sl_SI';
  1216. $languages['bg_BG']['NAME'] = 'Bulgarian';
  1217. $languages['bg_BG']['CHARSET'] = 'windows-1251';
  1218. $languages['bg']['ALIAS'] = 'bg_BG';
  1219. $languages['uk_UA']['NAME'] = 'Ukrainian';
  1220. $languages['uk_UA']['CHARSET'] = 'koi8-u';
  1221. $languages['uk']['ALIAS'] = 'uk_UA';
  1222. // Right to left languages
  1223. $languages['ar']['NAME'] = 'Arabic';
  1224. $languages['ar']['CHARSET'] = 'windows-1256';
  1225. $languages['ar']['DIR'] = 'rtl';
  1226. $languages['he_IL']['NAME'] = 'Hebrew';
  1227. $languages['he_IL']['CHARSET'] = 'windows-1255';
  1228. $languages['he_IL']['DIR'] = 'rtl';
  1229. $languages['he']['ALIAS'] = 'he_IL';
  1230. /* Detect whether gettext is installed. */
  1231. $gettext_flags = 0;
  1232. if (function_exists('_')) {
  1233. $gettext_flags += 1;
  1234. }
  1235. if (function_exists('bindtextdomain')) {
  1236. $gettext_flags += 2;
  1237. }
  1238. if (function_exists('textdomain')) {
  1239. $gettext_flags += 4;
  1240. }
  1241. /* If gettext is fully loaded, cool */
  1242. if ($gettext_flags == 7) {
  1243. $use_gettext = true;
  1244. }
  1245. /* If we can fake gettext, try that */
  1246. elseif ($gettext_flags == 0) {
  1247. $use_gettext = true;
  1248. include_once(SM_PATH . 'functions/gettext.php');
  1249. } else {
  1250. /* Uh-ho. A weird install */
  1251. if (! $gettext_flags & 1) {
  1252. function _($str) {
  1253. return $str;
  1254. }
  1255. }
  1256. if (! $gettext_flags & 2) {
  1257. function bindtextdomain() {
  1258. return;
  1259. }
  1260. }
  1261. if (! $gettext_flags & 4) {
  1262. function textdomain() {
  1263. return;
  1264. }
  1265. }
  1266. }
  1267. function charset_decode_utf8 ($string) {
  1268. /*
  1269. Every decoded character consists of n bytes. First byte is octal
  1270. 300-375, other bytes - always octals 200-277.
  1271. \a\b characters are decoded to html code octdec(a-300)*64 + octdec(b-200)
  1272. \a\b\c characters are decoded to html code octdec(a-340)*64*64 + octdec(b-200)*64 + octdec(c-200)
  1273. decoding cycle is unfinished. please test and report problems to tokul@users.sourceforge.net
  1274. */
  1275. global $default_charset, $languages, $sm_notAlias;
  1276. if (strtolower($default_charset) == 'utf-8')
  1277. return $string;
  1278. if (strtolower($languages[$sm_notAlias]['CHARSET']) == 'utf-8')
  1279. return $string;
  1280. /* Only do the slow convert if there are 8-bit characters */
  1281. if (! ereg("[\200-\377]", $string))
  1282. return $string;
  1283. // decode three byte unicode characters
  1284. $string = preg_replace("/([\340-\357])([\200-\277])([\200-\277])/e",
  1285. "'&#'.((ord('\\1')-224)*4096+(ord('\\2')-128)*64+(ord('\\3')-128)).';'",
  1286. $string);
  1287. // decode two byte unicode characters
  1288. $string = preg_replace("/([\300-\337])([\200-\277])/e",
  1289. "'&#'.((ord('\\1')-192)*64+(ord('\\2')-128)).';'",
  1290. $string);
  1291. return $string;
  1292. }
  1293. /*
  1294. * Japanese charset extra function
  1295. *
  1296. */
  1297. function japanese_charset_xtra() {
  1298. $ret = func_get_arg(1); /* default return value */
  1299. if (function_exists('mb_detect_encoding')) {
  1300. switch (func_get_arg(0)) { /* action */
  1301. case 'decode':
  1302. $detect_encoding = mb_detect_encoding($ret);
  1303. if ($detect_encoding == 'JIS' ||
  1304. $detect_encoding == 'EUC-JP' ||
  1305. $detect_encoding == 'SJIS') {
  1306. $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
  1307. }
  1308. break;
  1309. case 'encode':
  1310. $detect_encoding = mb_detect_encoding($ret);
  1311. if ($detect_encoding == 'JIS' ||
  1312. $detect_encoding == 'EUC-JP' ||
  1313. $detect_encoding == 'SJIS') {
  1314. $ret = mb_convert_encoding($ret, 'JIS', 'AUTO');
  1315. }
  1316. break;
  1317. case 'strimwidth':
  1318. $width = func_get_arg(2);
  1319. $ret = mb_strimwidth($ret, 0, $width, '...');
  1320. break;
  1321. case 'encodeheader':
  1322. $result = '';
  1323. if (strlen($ret) > 0) {
  1324. $tmpstr = mb_substr($ret, 0, 1);
  1325. $prevcsize = strlen($tmpstr);
  1326. for ($i = 1; $i < mb_strlen($ret); $i++) {
  1327. $tmp = mb_substr($ret, $i, 1);
  1328. if (strlen($tmp) == $prevcsize) {
  1329. $tmpstr .= $tmp;
  1330. } else {
  1331. if ($prevcsize == 1) {
  1332. $result .= $tmpstr;
  1333. } else {
  1334. $result .= mb_encode_mimeheader($tmpstr);
  1335. }
  1336. $tmpstr = $tmp;
  1337. $prevcsize = strlen($tmp);
  1338. }
  1339. }
  1340. if (strlen($tmpstr)) {
  1341. if (strlen(mb_substr($tmpstr, 0, 1)) == 1)
  1342. $result .= $tmpstr;
  1343. else
  1344. $result .= mb_encode_mimeheader($tmpstr);
  1345. }
  1346. }
  1347. $ret = $result;
  1348. //$ret = mb_encode_mimeheader($ret);
  1349. break;
  1350. case 'decodeheader':
  1351. $ret = str_replace("\t", "", $ret);
  1352. if (eregi('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=', $ret))
  1353. $ret = mb_decode_mimeheader($ret);
  1354. $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
  1355. break;
  1356. case 'downloadfilename':
  1357. $useragent = func_get_arg(2);
  1358. if (strstr($useragent, 'Windows') !== false ||
  1359. strstr($useragent, 'Mac_') !== false) {
  1360. $ret = mb_convert_encoding($ret, 'SJIS', 'AUTO');
  1361. } else {
  1362. $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
  1363. }
  1364. break;
  1365. }
  1366. }
  1367. return $ret;
  1368. }
  1369. /*
  1370. * Korean charset extra function
  1371. * Hangul(Korean Character) Attached File Name Fix.
  1372. */
  1373. function korean_charset_xtra() {
  1374. $ret = func_get_arg(1); /* default return value */
  1375. if (func_get_arg(0) == 'downloadfilename') { /* action */
  1376. $ret = str_replace("\x0D\x0A", '', $ret); /* Hanmail's CR/LF Clear */
  1377. for ($i=0;$i<strlen($ret);$i++) {
  1378. if ($ret[$i] >= "\xA1" && $ret[$i] <= "\xFE") { /* 0xA1 - 0XFE are Valid */
  1379. $i++;
  1380. continue;
  1381. } else if (($ret[$i] >= 'a' && $ret[$i] <= 'z') || /* From Original ereg_replace in download.php */
  1382. ($ret[$i] >= 'A' && $ret[$i] <= 'Z') ||
  1383. ($ret[$i] == '.') || ($ret[$i] == '-')) {
  1384. continue;
  1385. } else {
  1386. $ret[$i] = '_';
  1387. }
  1388. }
  1389. }
  1390. return $ret;
  1391. }
  1392. ?>