
with mbstring overloading. P.S. SquirrelMail login fails with php_value mbstring.func_overload 2 php_value mbstring.internal_encoding utf-8
51 lines
No EOL
1.5 KiB
PHP
51 lines
No EOL
1.5 KiB
PHP
<?php
|
|
/**
|
|
* decode/utf-8.php
|
|
*
|
|
* Copyright (c) 2003-2004 The SquirrelMail Project Team
|
|
* Licensed under the GNU GPL. For full terms see the file COPYING.
|
|
*
|
|
* This file contains utf-8 decoding function that is needed to read
|
|
* utf-8 encoded mails in non-utf-8 locale.
|
|
*
|
|
* Every decoded character consists of n bytes. First byte is octal
|
|
* 300-375, other bytes - always octals 200-277.
|
|
*
|
|
* \a\b characters are decoded to html code octdec(a-300)*64 + octdec(b-200)
|
|
* \a\b\c characters are decoded to html code octdec(a-340)*64*64 + octdec(b-200)*64 + octdec(c-200)
|
|
*
|
|
* decoding cycle is unfinished. please test and report problems to tokul@users.sourceforge.net
|
|
*
|
|
* @version $Id$
|
|
* @package squirrelmail
|
|
* @subpackage decode
|
|
*/
|
|
|
|
/**
|
|
* Decode utf-8 strings
|
|
* @param string $string Encoded string
|
|
* @return string Decoded string
|
|
*/
|
|
function charset_decode_utf_8 ($string) {
|
|
global $default_charset,$squirrelmail_language;
|
|
|
|
if ($squirrelmail_language == 'ja_JP')
|
|
return $string;
|
|
|
|
// don't do decoding when there are no 8bit symbols
|
|
if (! sq_is8bit($string,'utf-8'))
|
|
return $string;
|
|
|
|
// decode three byte unicode characters
|
|
$string = preg_replace("/([\340-\357])([\200-\277])([\200-\277])/e",
|
|
"'&#'.((ord('\\1')-224)*4096+(ord('\\2')-128)*64+(ord('\\3')-128)).';'",
|
|
$string);
|
|
|
|
// decode two byte unicode characters
|
|
$string = preg_replace("/([\300-\337])([\200-\277])/e",
|
|
"'&#'.((ord('\\1')-192)*64+(ord('\\2')-128)).';'",
|
|
$string);
|
|
|
|
return $string;
|
|
}
|
|
?>
|