X-Git-Url: https://vcs.fsf.org/?p=squirrelmail.git;a=blobdiff_plain;f=functions%2Fi18n.php;h=3d99ed0690253bba2e694310d8c7161a30a71720;hp=061ad1ef9890b55f1337862e68cbbd1421c7dd2e;hb=d6c32258c05219670ab3b4ae2d460d844ea9a247;hpb=c48a8ca7d6f39d2a109da30fa6ea861dffdb1023 diff --git a/functions/i18n.php b/functions/i18n.php index 061ad1ef..3d99ed06 100644 --- a/functions/i18n.php +++ b/functions/i18n.php @@ -13,66 +13,206 @@ * encoded using Unicode entities according to HTML 4.0. * * $Id$ + * @package squirrelmail */ +/** Everything uses global.php... */ require_once(SM_PATH . 'functions/global.php'); -/* Decodes a string to the internal encoding from the given charset */ +/** + * Decodes a string to the internal encoding from the given charset + * + * @param string $charset + * @param string $string Text to be decoded + * @return string Decoded text + */ function charset_decode ($charset, $string) { - global $languages, $squirrelmail_language; + global $languages, $squirrelmail_language, $default_charset; + global $use_php_recode, $use_php_iconv, $agresive_decoding; if (isset($languages[$squirrelmail_language]['XTRA_CODE']) && function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) { $string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string); } + $charset = strtolower($charset); + + set_my_charset(); + + // Variables that allow to use functions without function_exist() calls + if (! isset($use_php_recode) || $use_php_recode=="" ) { + $use_php_recode=false; } + if (! isset($use_php_iconv) || $use_php_iconv=="" ) { + $use_php_iconv=false; } + + // Don't do conversion if charset is the same. + if ( $charset == strtolower($default_charset) ) + return htmlspecialchars($string); + + // catch iso-8859-8-i thing + if ( $charset == "iso-8859-8-i" ) + $charset = "iso-8859-8"; + + /* + * Recode converts html special characters automatically if you use + * 'charset..html' decoding. 
There is no documented way to put -d option + * into php recode function call. + */ + if ( $use_php_recode ) { + if ( $default_charset == "utf-8" ) { + // other charsets can be converted to utf-8 without loss. + // and output string is smaller + $string = recode_string($charset . "..utf-8",$string); + return htmlspecialchars($string); + } else { + $string = recode_string($charset . "..html",$string); + // recode does not convert single quote, htmlspecialchars does. + $string = str_replace("'", ''', $string); + return $string; + } + } + + // iconv functions does not have html target and can be used only with utf-8 + if ( $use_php_iconv && $default_charset=='utf-8') { + $string = iconv($charset,$default_charset,$string); + return htmlspecialchars($string); + } + + // If we don't use recode and iconv, we'll do it old way. + /* All HTML special characters are 7 bit and can be replaced first */ $string = htmlspecialchars ($string); - $charset = strtolower($charset); - - set_my_charset() ; + /* controls cpu and memory intensive decoding cycles */ + if (! isset($agresive_decoding) || $agresive_decoding=="" ) { + $agresive_decoding=false; } if (ereg('iso-8859-([[:digit:]]+)', $charset, $res)) { if ($res[1] == '1') { - $ret = charset_decode_iso_8859_1 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-1.php'); + $ret = charset_decode_iso8859_1 ($string); } else if ($res[1] == '2') { - $ret = charset_decode_iso_8859_2 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-2.php'); + $ret = charset_decode_iso8859_2 ($string); + } else if ($res[1] == '3') { + include_once(SM_PATH . 'functions/decode/iso8859-3.php'); + $ret = charset_decode_iso8859_3 ($string); } else if ($res[1] == '4') { - $ret = charset_decode_iso_8859_4 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-4.php'); + $ret = charset_decode_iso8859_4 ($string); } else if ($res[1] == '5') { - $ret = charset_decode_iso_8859_5 ($string); + include_once(SM_PATH . 
'functions/decode/iso8859-5.php'); + $ret = charset_decode_iso8859_5 ($string); + } else if ($res[1] == '6') { + include_once(SM_PATH . 'functions/decode/iso8859-6.php'); + $ret = charset_decode_iso8859_6 ($string); } else if ($res[1] == '7') { - $ret = charset_decode_iso_8859_7 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-7.php'); + $ret = charset_decode_iso8859_7 ($string); + } else if ($res[1] == '8') { + include_once(SM_PATH . 'functions/decode/iso8859-8.php'); + $ret = charset_decode_iso8859_8 ($string); } else if ($res[1] == '9') { - $ret = charset_decode_iso_8859_9 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-9.php'); + $ret = charset_decode_iso8859_9 ($string); + } else if ($res[1] == '10') { + include_once(SM_PATH . 'functions/decode/iso8859-10.php'); + $ret = charset_decode_iso8859_10 ($string); + } else if ($res[1] == '11') { + include_once(SM_PATH . 'functions/decode/iso8859-11.php'); + $ret = charset_decode_iso8859_11 ($string); } else if ($res[1] == '13') { - $ret = charset_decode_iso_8859_13 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-13.php'); + $ret = charset_decode_iso8859_13 ($string); + } else if ($res[1] == '14') { + include_once(SM_PATH . 'functions/decode/iso8859-14.php'); + $ret = charset_decode_iso8859_14 ($string); } else if ($res[1] == '15') { - $ret = charset_decode_iso_8859_15 ($string); + include_once(SM_PATH . 'functions/decode/iso8859-15.php'); + $ret = charset_decode_iso8859_15 ($string); + } else if ($res[1] == '16') { + include_once(SM_PATH . 'functions/decode/iso8859-16.php'); + $ret = charset_decode_iso8859_16 ($string); } else { $ret = charset_decode_iso_8859_default ($string); } } else if ($charset == 'ns_4551-1') { $ret = charset_decode_ns_4551_1 ($string); } else if ($charset == 'koi8-r') { + include_once(SM_PATH . 'functions/decode/koi8-r.php'); $ret = charset_decode_koi8r ($string); } else if ($charset == 'koi8-u') { + include_once(SM_PATH . 
'functions/decode/koi8-u.php'); $ret = charset_decode_koi8u ($string); + } else if ($charset == 'windows-1250') { + include_once(SM_PATH . 'functions/decode/cp1250.php'); + $ret = charset_decode_cp1250 ($string); } else if ($charset == 'windows-1251') { - $ret = charset_decode_windows_1251 ($string); + include_once(SM_PATH . 'functions/decode/cp1251.php'); + $ret = charset_decode_cp1251 ($string); + } else if ($charset == 'windows-1252') { + include_once(SM_PATH . 'functions/decode/cp1252.php'); + $ret = charset_decode_cp1252 ($string); } else if ($charset == 'windows-1253') { - $ret = charset_decode_windows_1253 ($string); + include_once(SM_PATH . 'functions/decode/cp1253.php'); + $ret = charset_decode_cp1253 ($string); } else if ($charset == 'windows-1254') { - $ret = charset_decode_windows_1254 ($string); + include_once(SM_PATH . 'functions/decode/cp1254.php'); + $ret = charset_decode_cp1254 ($string); } else if ($charset == 'windows-1255') { - $ret = charset_decode_windows_1255 ($string); + include_once(SM_PATH . 'functions/decode/cp1255.php'); + $ret = charset_decode_cp1255 ($string); } else if ($charset == 'windows-1256') { - $ret = charset_decode_windows_1256 ($string); + include_once(SM_PATH . 'functions/decode/cp1256.php'); + $ret = charset_decode_cp1256 ($string); } else if ($charset == 'windows-1257') { - $ret = charset_decode_windows_1257 ($string); - } else if ($charset == 'utf-8') { + include_once(SM_PATH . 'functions/decode/cp1257.php'); + $ret = charset_decode_cp1257 ($string); + } else if ($charset == 'windows-1258') { + include_once(SM_PATH . 'functions/decode/cp1258.php'); + $ret = charset_decode_cp1258 ($string); + } else if ($charset == 'x-mac-roman') { + include_once(SM_PATH . 'functions/decode/cp10000.php'); + $ret = charset_decode_cp10000 ($string); + } else if ($charset == 'x-mac-greek') { + include_once(SM_PATH . 
'functions/decode/cp10006.php'); + $ret = charset_decode_cp10006 ($string); + } else if ($charset == 'x-mac-cyrillic') { + include_once(SM_PATH . 'functions/decode/cp10007.php'); + $ret = charset_decode_cp10007 ($string); + } else if ($charset == 'x-mac-ukrainian') { + include_once(SM_PATH . 'functions/decode/cp10017.php'); + $ret = charset_decode_cp10017 ($string); + } else if ($charset == 'x-mac-centraleurroman') { + include_once(SM_PATH . 'functions/decode/cp10029.php'); + $ret = charset_decode_cp10029 ($string); + } else if ($charset == 'x-mac-icelandic') { + include_once(SM_PATH . 'functions/decode/cp10079.php'); + $ret = charset_decode_cp10079 ($string); + } else if ($charset == 'x-mac-turkish') { + include_once(SM_PATH . 'functions/decode/cp10081.php'); + $ret = charset_decode_cp10081 ($string); + } else if ($charset == 'ibm855') { + include_once(SM_PATH . 'functions/decode/cp855.php'); + $ret = charset_decode_cp855 ($string); + } else if ($charset == 'ibm866') { + include_once(SM_PATH . 'functions/decode/cp866.php'); + $ret = charset_decode_cp866 ($string); + } else if ($charset == 'iso-ir-111') { + include_once(SM_PATH . 'functions/decode/iso-ir-111.php'); + $ret = charset_decode_iso_ir_111 ($string); + } else if ($charset == 'tis-620') { + include_once(SM_PATH . 'functions/decode/tis620.php'); + $ret = charset_decode_tis620 ($string); + } else if ($charset == 'big5' and $agresive_decoding ) { + include_once(SM_PATH . 'functions/decode/big5.php'); + $ret = charset_decode_big5 ($string); + } else if ($charset == 'gb2312' and $agresive_decoding ) { + include_once(SM_PATH . 'functions/decode/gb2312.php'); + $ret = charset_decode_gb2312 ($string); + } else if ($charset == 'utf-8' && $squirrelmail_language != 'ja_JP') { + include_once(SM_PATH . 
'functions/decode/utf-8.php'); $ret = charset_decode_utf8 ($string); } else { $ret = $string; @@ -80,651 +220,6 @@ function charset_decode ($charset, $string) { return( $ret ); } -/* - iso-8859-1 is the same as Latin 1 and is normally used - in western europe. - */ -function charset_decode_iso_8859_1 ($string) { - global $default_charset; - - if (strtolower($default_charset) <> 'iso-8859-1') { - /* Only do the slow convert if there are 8-bit characters */ - if (ereg("[\200-\377]", $string)) { - $string = str_replace("\201", '', $string); - $string = str_replace("\202", '‚', $string); - $string = str_replace("\203", 'ƒ', $string); - $string = str_replace("\204", '„', $string); - $string = str_replace("\205", '…', $string); - $string = str_replace("\206", '†', $string); - $string = str_replace("\207", '‡', $string); - $string = str_replace("\210", 'ˆ', $string); - $string = str_replace("\211", '‰', $string); - $string = str_replace("\212", 'Š', $string); - $string = str_replace("\213", '‹', $string); - $string = str_replace("\214", 'Œ', $string); - $string = str_replace("\215", '', $string); - $string = str_replace("\216", 'Ž', $string); - $string = str_replace("\217", '', $string); - $string = str_replace("\220", '', $string); - $string = str_replace("\221", '‘', $string); - $string = str_replace("\222", '’', $string); - $string = str_replace("\223", '“', $string); - $string = str_replace("\224", '”', $string); - $string = str_replace("\225", '•', $string); - $string = str_replace("\226", '–', $string); - $string = str_replace("\227", '—', $string); - $string = str_replace("\230", '˜', $string); - $string = str_replace("\231", '™', $string); - $string = str_replace("\232", 'š', $string); - $string = str_replace("\233", '›', $string); - $string = str_replace("\234", 'œ', $string); - $string = str_replace("\235", '', $string); - $string = str_replace("\236", 'ž', $string); - $string = str_replace("\237", 'Ÿ', $string); - $string = str_replace("\240", ' ', 
$string); - $string = str_replace("\241", '¡', $string); - $string = str_replace("\242", '¢', $string); - $string = str_replace("\243", '£', $string); - $string = str_replace("\244", '¤', $string); - $string = str_replace("\245", '¥', $string); - $string = str_replace("\246", '¦', $string); - $string = str_replace("\247", '§', $string); - $string = str_replace("\250", '¨', $string); - $string = str_replace("\251", '©', $string); - $string = str_replace("\252", 'ª', $string); - $string = str_replace("\253", '«', $string); - $string = str_replace("\254", '¬', $string); - $string = str_replace("\255", '­', $string); - $string = str_replace("\256", '®', $string); - $string = str_replace("\257", '¯', $string); - $string = str_replace("\260", '°', $string); - $string = str_replace("\261", '±', $string); - $string = str_replace("\262", '²', $string); - $string = str_replace("\263", '³', $string); - $string = str_replace("\264", '´', $string); - $string = str_replace("\265", 'µ', $string); - $string = str_replace("\266", '¶', $string); - $string = str_replace("\267", '·', $string); - $string = str_replace("\270", '¸', $string); - $string = str_replace("\271", '¹', $string); - $string = str_replace("\272", 'º', $string); - $string = str_replace("\273", '»', $string); - $string = str_replace("\274", '¼', $string); - $string = str_replace("\275", '½', $string); - $string = str_replace("\276", '¾', $string); - $string = str_replace("\277", '¿', $string); - $string = str_replace("\300", 'À', $string); - $string = str_replace("\301", 'Á', $string); - $string = str_replace("\302", 'Â', $string); - $string = str_replace("\303", 'Ã', $string); - $string = str_replace("\304", 'Ä', $string); - $string = str_replace("\305", 'Å', $string); - $string = str_replace("\306", 'Æ', $string); - $string = str_replace("\307", 'Ç', $string); - $string = str_replace("\310", 'È', $string); - $string = str_replace("\311", 'É', $string); - $string = str_replace("\312", 'Ê', $string); - $string = 
str_replace("\313", 'Ë', $string); - $string = str_replace("\314", 'Ì', $string); - $string = str_replace("\315", 'Í', $string); - $string = str_replace("\316", 'Î', $string); - $string = str_replace("\317", 'Ï', $string); - $string = str_replace("\320", 'Ð', $string); - $string = str_replace("\321", 'Ñ', $string); - $string = str_replace("\322", 'Ò', $string); - $string = str_replace("\323", 'Ó', $string); - $string = str_replace("\324", 'Ô', $string); - $string = str_replace("\325", 'Õ', $string); - $string = str_replace("\326", 'Ö', $string); - $string = str_replace("\327", '×', $string); - $string = str_replace("\330", 'Ø', $string); - $string = str_replace("\331", 'Ù', $string); - $string = str_replace("\332", 'Ú', $string); - $string = str_replace("\333", 'Û', $string); - $string = str_replace("\334", 'Ü', $string); - $string = str_replace("\335", 'Ý', $string); - $string = str_replace("\336", 'Þ', $string); - $string = str_replace("\337", 'ß', $string); - $string = str_replace("\340", 'à', $string); - $string = str_replace("\341", 'á', $string); - $string = str_replace("\342", 'â', $string); - $string = str_replace("\343", 'ã', $string); - $string = str_replace("\344", 'ä', $string); - $string = str_replace("\345", 'å', $string); - $string = str_replace("\346", 'æ', $string); - $string = str_replace("\347", 'ç', $string); - $string = str_replace("\350", 'è', $string); - $string = str_replace("\351", 'é', $string); - $string = str_replace("\352", 'ê', $string); - $string = str_replace("\353", 'ë', $string); - $string = str_replace("\354", 'ì', $string); - $string = str_replace("\355", 'í', $string); - $string = str_replace("\356", 'î', $string); - $string = str_replace("\357", 'ï', $string); - $string = str_replace("\360", 'ð', $string); - $string = str_replace("\361", 'ñ', $string); - $string = str_replace("\362", 'ò', $string); - $string = str_replace("\363", 'ó', $string); - $string = str_replace("\364", 'ô', $string); - $string = str_replace("\365", 'õ', 
$string); - $string = str_replace("\366", 'ö', $string); - $string = str_replace("\367", '÷', $string); - $string = str_replace("\370", 'ø', $string); - $string = str_replace("\371", 'ù', $string); - $string = str_replace("\372", 'ú', $string); - $string = str_replace("\373", 'û', $string); - $string = str_replace("\374", 'ü', $string); - $string = str_replace("\375", 'ý', $string); - $string = str_replace("\376", 'þ', $string); - $string = str_replace("\377", 'ÿ', $string); - } - } - - return ($string); -} - -/* iso-8859-2 is used for some eastern European languages */ -function charset_decode_iso_8859_2 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-2') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! ereg("[\200-\377]", $string)) - return $string; - - /* NO-BREAK SPACE */ - $string = str_replace("\240", ' ', $string); - /* LATIN CAPITAL LETTER A WITH OGONEK */ - $string = str_replace("\241", 'Ą', $string); - /* BREVE */ - $string = str_replace("\242", '˘', $string); - // LATIN CAPITAL LETTER L WITH STROKE - $string = str_replace("\243", 'Ł', $string); - // CURRENCY SIGN - $string = str_replace("\244", '¤', $string); - // LATIN CAPITAL LETTER L WITH CARON - $string = str_replace("\245", 'Ľ', $string); - // LATIN CAPITAL LETTER S WITH ACUTE - $string = str_replace("\246", 'Ś', $string); - // SECTION SIGN - $string = str_replace("\247", '§', $string); - // DIAERESIS - $string = str_replace("\250", '¨', $string); - // LATIN CAPITAL LETTER S WITH CARON - $string = str_replace("\251", 'Š', $string); - // LATIN CAPITAL LETTER S WITH CEDILLA - $string = str_replace("\252", 'Ş', $string); - // LATIN CAPITAL LETTER T WITH CARON - $string = str_replace("\253", 'Ť', $string); - // LATIN CAPITAL LETTER Z WITH ACUTE - $string = str_replace("\254", 'Ź', $string); - // SOFT HYPHEN - $string = str_replace("\255", '­', $string); - // LATIN CAPITAL LETTER Z WITH CARON - $string = 
str_replace("\256", 'Ž', $string); - // LATIN CAPITAL LETTER Z WITH DOT ABOVE - $string = str_replace("\257", 'Ż', $string); - // DEGREE SIGN - $string = str_replace("\260", '°', $string); - // LATIN SMALL LETTER A WITH OGONEK - $string = str_replace("\261", 'ą', $string); - // OGONEK - $string = str_replace("\262", '˛', $string); - // LATIN SMALL LETTER L WITH STROKE - $string = str_replace("\263", 'ł', $string); - // ACUTE ACCENT - $string = str_replace("\264", '´', $string); - // LATIN SMALL LETTER L WITH CARON - $string = str_replace("\265", 'ľ', $string); - // LATIN SMALL LETTER S WITH ACUTE - $string = str_replace("\266", 'ś', $string); - // CARON - $string = str_replace("\267", 'ˇ', $string); - // CEDILLA - $string = str_replace("\270", '¸', $string); - // LATIN SMALL LETTER S WITH CARON - $string = str_replace("\271", 'š', $string); - // LATIN SMALL LETTER S WITH CEDILLA - $string = str_replace("\272", 'ş', $string); - // LATIN SMALL LETTER T WITH CARON - $string = str_replace("\273", 'ť', $string); - // LATIN SMALL LETTER Z WITH ACUTE - $string = str_replace("\274", 'ź', $string); - // DOUBLE ACUTE ACCENT - $string = str_replace("\275", '˝', $string); - // LATIN SMALL LETTER Z WITH CARON - $string = str_replace("\276", 'ž', $string); - // LATIN SMALL LETTER Z WITH DOT ABOVE - $string = str_replace("\277", 'ż', $string); - // LATIN CAPITAL LETTER R WITH ACUTE - $string = str_replace("\300", 'Ŕ', $string); - // LATIN CAPITAL LETTER A WITH ACUTE - $string = str_replace("\301", 'Á', $string); - // LATIN CAPITAL LETTER A WITH CIRCUMFLEX - $string = str_replace("\302", 'Â', $string); - // LATIN CAPITAL LETTER A WITH BREVE - $string = str_replace("\303", 'Ă', $string); - // LATIN CAPITAL LETTER A WITH DIAERESIS - $string = str_replace("\304", 'Ä', $string); - // LATIN CAPITAL LETTER L WITH ACUTE - $string = str_replace("\305", 'Ĺ', $string); - // LATIN CAPITAL LETTER C WITH ACUTE - $string = str_replace("\306", 'Ć', $string); - // LATIN CAPITAL LETTER C WITH 
CEDILLA - $string = str_replace("\307", 'Ç', $string); - // LATIN CAPITAL LETTER C WITH CARON - $string = str_replace("\310", 'Č', $string); - // LATIN CAPITAL LETTER E WITH ACUTE - $string = str_replace("\311", 'É', $string); - // LATIN CAPITAL LETTER E WITH OGONEK - $string = str_replace("\312", 'Ę', $string); - // LATIN CAPITAL LETTER E WITH DIAERESIS - $string = str_replace("\313", 'Ë', $string); - // LATIN CAPITAL LETTER E WITH CARON - $string = str_replace("\314", 'Ě', $string); - // LATIN CAPITAL LETTER I WITH ACUTE - $string = str_replace("\315", 'Í', $string); - // LATIN CAPITAL LETTER I WITH CIRCUMFLEX - $string = str_replace("\316", 'Î', $string); - // LATIN CAPITAL LETTER D WITH CARON - $string = str_replace("\317", 'Ď', $string); - // LATIN CAPITAL LETTER D WITH STROKE - $string = str_replace("\320", 'Đ', $string); - // LATIN CAPITAL LETTER N WITH ACUTE - $string = str_replace("\321", 'Ń', $string); - // LATIN CAPITAL LETTER N WITH CARON - $string = str_replace("\322", 'Ň', $string); - // LATIN CAPITAL LETTER O WITH ACUTE - $string = str_replace("\323", 'Ó', $string); - // LATIN CAPITAL LETTER O WITH CIRCUMFLEX - $string = str_replace("\324", 'Ô', $string); - // LATIN CAPITAL LETTER O WITH DOUBLE ACUTE - $string = str_replace("\325", 'Ő', $string); - // LATIN CAPITAL LETTER O WITH DIAERESIS - $string = str_replace("\326", 'Ö', $string); - // MULTIPLICATION SIGN - $string = str_replace("\327", '×', $string); - // LATIN CAPITAL LETTER R WITH CARON - $string = str_replace("\330", 'Ř', $string); - // LATIN CAPITAL LETTER U WITH RING ABOVE - $string = str_replace("\331", 'Ů', $string); - // LATIN CAPITAL LETTER U WITH ACUTE - $string = str_replace("\332", 'Ú', $string); - // LATIN CAPITAL LETTER U WITH DOUBLE ACUTE - $string = str_replace("\333", 'Ű', $string); - // LATIN CAPITAL LETTER U WITH DIAERESIS - $string = str_replace("\334", 'Ü', $string); - // LATIN CAPITAL LETTER Y WITH ACUTE - $string = str_replace("\335", 'Ý', $string); - // LATIN CAPITAL 
LETTER T WITH CEDILLA - $string = str_replace("\336", 'Ţ', $string); - // LATIN SMALL LETTER SHARP S - $string = str_replace("\337", 'ß', $string); - // LATIN SMALL LETTER R WITH ACUTE - $string = str_replace("\340", 'ŕ', $string); - // LATIN SMALL LETTER A WITH ACUTE - $string = str_replace("\341", 'á', $string); - // LATIN SMALL LETTER A WITH CIRCUMFLEX - $string = str_replace("\342", 'â', $string); - // LATIN SMALL LETTER A WITH BREVE - $string = str_replace("\343", 'ă', $string); - // LATIN SMALL LETTER A WITH DIAERESIS - $string = str_replace("\344", 'ä', $string); - // LATIN SMALL LETTER L WITH ACUTE - $string = str_replace("\345", 'ĺ', $string); - // LATIN SMALL LETTER C WITH ACUTE - $string = str_replace("\346", 'ć', $string); - // LATIN SMALL LETTER C WITH CEDILLA - $string = str_replace("\347", 'ç', $string); - // LATIN SMALL LETTER C WITH CARON - $string = str_replace("\350", 'č', $string); - // LATIN SMALL LETTER E WITH ACUTE - $string = str_replace("\351", 'é', $string); - // LATIN SMALL LETTER E WITH OGONEK - $string = str_replace("\352", 'ę', $string); - // LATIN SMALL LETTER E WITH DIAERESIS - $string = str_replace("\353", 'ë', $string); - // LATIN SMALL LETTER E WITH CARON - $string = str_replace("\354", 'ě', $string); - // LATIN SMALL LETTER I WITH ACUTE - $string = str_replace("\355", 'í', $string); - // LATIN SMALL LETTER I WITH CIRCUMFLEX - $string = str_replace("\356", 'î', $string); - // LATIN SMALL LETTER D WITH CARON - $string = str_replace("\357", 'ď', $string); - // LATIN SMALL LETTER D WITH STROKE - $string = str_replace("\360", 'đ', $string); - // LATIN SMALL LETTER N WITH ACUTE - $string = str_replace("\361", 'ń', $string); - // LATIN SMALL LETTER N WITH CARON - $string = str_replace("\362", 'ň', $string); - // LATIN SMALL LETTER O WITH ACUTE - $string = str_replace("\363", 'ó', $string); - // LATIN SMALL LETTER O WITH CIRCUMFLEX - $string = str_replace("\364", 'ô', $string); - // LATIN SMALL LETTER O WITH DOUBLE ACUTE - $string = 
str_replace("\365", 'ő', $string); - // LATIN SMALL LETTER O WITH DIAERESIS - $string = str_replace("\366", 'ö', $string); - // DIVISION SIGN - $string = str_replace("\367", '÷', $string); - // LATIN SMALL LETTER R WITH CARON - $string = str_replace("\370", 'ř', $string); - // LATIN SMALL LETTER U WITH RING ABOVE - $string = str_replace("\371", 'ů', $string); - // LATIN SMALL LETTER U WITH ACUTE - $string = str_replace("\372", 'ú', $string); - // LATIN SMALL LETTER U WITH DOUBLE ACUTE - $string = str_replace("\373", 'ű', $string); - // LATIN SMALL LETTER U WITH DIAERESIS - $string = str_replace("\374", 'ü', $string); - // LATIN SMALL LETTER Y WITH ACUTE - $string = str_replace("\375", 'ý', $string); - // LATIN SMALL LETTER T WITH CEDILLA - $string = str_replace("\376", 'ţ', $string); - // DOT ABOVE - $string = str_replace("\377", '˙', $string); - - return $string; -} - -/* - ISO/IEC 8859-4:1998 Latin Alphabet No. 4 -*/ - -function charset_decode_iso_8859_4 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-4') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace ("\241", 'Ą', $string); - $string = str_replace ("\242", 'ĸ', $string); - $string = str_replace ("\243", 'Ŗ', $string); - $string = str_replace ("\245", 'Ĩ', $string); - $string = str_replace ("\246", 'Ļ', $string); - $string = str_replace ("\251", 'Š', $string); - $string = str_replace ("\252", 'Ē', $string); - $string = str_replace ("\253", 'Ģ', $string); - $string = str_replace ("\254", 'Ŧ', $string); - $string = str_replace ("\256", 'Ž', $string); - $string = str_replace ("\261", 'ą', $string); - $string = str_replace ("\262", '˛', $string); - $string = str_replace ("\263", 'ŗ', $string); - $string = str_replace ("\265", 'ĩ', $string); - $string = str_replace ("\266", 'ļ', $string); - $string = str_replace ("\267", 'ˇ', $string); - $string = str_replace ("\271", 'š', $string); - $string = str_replace ("\272", 'ē', $string); - $string = str_replace ("\273", 'ģ', $string); - $string = str_replace ("\274", 'ŧ', $string); - $string = str_replace ("\275", 'Ŋ', $string); - $string = str_replace ("\276", 'ž', $string); - $string = str_replace ("\277", 'ŋ', $string); - $string = str_replace ("\300", 'Ā', $string); - $string = str_replace ("\307", 'Į', $string); - $string = str_replace ("\310", 'Č', $string); - $string = str_replace ("\312", 'Ę', $string); - $string = str_replace ("\314", 'Ė', $string); - $string = str_replace ("\317", 'Ī', $string); - $string = str_replace ("\320", 'Đ', $string); - $string = str_replace ("\321", 'Ņ', $string); - $string = str_replace ("\322", 'Ō', $string); - $string = str_replace ("\323", 'Ķ', $string); - $string = str_replace ("\331", 'Ų', $string); - $string = str_replace ("\335", 'Ũ', $string); - $string = str_replace ("\336", 'Ū', $string); - $string = str_replace ("\340", 'ā', $string); - $string = str_replace ("\347", 'į', $string); - $string = str_replace ("\350", 'č', $string); - $string = str_replace ("\352", 'ę', $string); - $string = str_replace 
("\354", 'ė', $string); - $string = str_replace ("\357", 'ī', $string); - $string = str_replace ("\360", 'đ', $string); - $string = str_replace ("\361", 'ņ', $string); - $string = str_replace ("\362", 'ō', $string); - $string = str_replace ("\363", 'ķ', $string); - $string = str_replace ("\371", 'ų', $string); - $string = str_replace ("\375", 'ũ', $string); - $string = str_replace ("\376", 'ū', $string); - $string = str_replace ("\377", '˙', $string); - - // rest of charset is the same as ISO-8859-1 - return (charset_decode_iso_8859_1($string)); -} - -/* ISO-8859-5 is Cyrillic */ -function charset_decode_iso_8859_5 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-5') { - return $string; - } - - /* Only do the slow convert if there are 8-bit characters */ - if (! ereg("[\200-\377]", $string)) - return $string; - - // NO-BREAK SPACE - $string = str_replace("\240", ' ', $string); - // 161-172 -> 1025-1036 (+864) - $string = preg_replace("/([\241-\254])/e","'&#' . (ord('\\1')+864) . ';'",$string); - // SOFT HYPHEN - $string = str_replace("\255", '­', $string); - // 174-239 -> 1038-1103 (+864) - $string = preg_replace("/([\256-\357])/e","'&#' . (ord('\\1')+864) . ';'",$string); - // NUMERO SIGN - $string = str_replace("\360", '№', $string); - // 241-252 -> 1105-1116 (+864) - $string = preg_replace("/([\361-\374])/e","'&#' . (ord('\\1')+864) . ';'",$string); - // SECTION SIGN - $string = str_replace("\375", '§', $string); - // CYRILLIC SMALL LETTER SHORT U (Byelorussian) - $string = str_replace("\376", 'ў', $string); - // CYRILLIC SMALL LETTER DZHE - $string = str_replace("\377", 'џ', $string); - - return $string; -} - -/* iso-8859-7 is Greek. 
*/ -function charset_decode_iso_8859_7 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-7') { - return $string; - } - - /* Only do the slow convert if there are 8-bit characters */ - if (!ereg("[\200-\377]", $string)) { - return $string; - } - - /* Some diverse characters in the beginning */ - $string = str_replace("\240", ' ', $string); - $string = str_replace("\241", '‘', $string); - $string = str_replace("\242", '’', $string); - $string = str_replace("\243", '£', $string); - $string = str_replace("\246", '¦', $string); - $string = str_replace("\247", '§', $string); - $string = str_replace("\250", '¨', $string); - $string = str_replace("\251", '©', $string); - $string = str_replace("\253", '«', $string); - $string = str_replace("\254", '¬', $string); - $string = str_replace("\255", '­', $string); - $string = str_replace("\257", '―', $string); - $string = str_replace("\260", '°', $string); - $string = str_replace("\261", '±', $string); - $string = str_replace("\262", '²', $string); - $string = str_replace("\263", '³', $string); - - /* Horizontal bar (parentheki pavla) */ - $string = str_replace ("\257", '―', $string); - - /* - * ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6) - * These are Unicode 900-902 - */ - $string = preg_replace("/([\264-\266])/e","'&#' . (ord('\\1')+720);",$string); - - /* 11/07 (0xB7) Middle dot is the same in iso-8859-1 */ - $string = str_replace("\267", '·', $string); - - /* - * ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA) - * These are Unicode 900-902 - */ - $string = preg_replace("/([\270-\272])/e","'&#' . (ord('\\1')+720);",$string); - - /* - * 11/11 (0xBB) Right angle quotation mark is the same as in - * iso-8859-1 - */ - $string = str_replace("\273", '»', $string); - - /* And now the rest of the charset */ - $string = preg_replace("/([\274-\376])/e","'&#'.(ord('\\1')+720);",$string); - - return $string; -} - -/* - ISOIEC 8859-9:1999 Latin Alphabet No. 
5 - -*/ -function charset_decode_iso_8859_9 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-9') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! ereg("[\200-\377]", $string)) - return $string; - - // latin capital letter g with breve 208->286 - $string = str_replace("\320", 'Ğ', $string); - // latin capital letter i with dot above 221->304 - $string = str_replace("\335", 'İ', $string); - // latin capital letter s with cedilla 222->350 - $string = str_replace("\336", 'Ş', $string); - // latin small letter g with breve 240->287 - $string = str_replace("\360", 'ğ', $string); - // latin small letter dotless i 253->305 - $string = str_replace("\375", 'ı', $string); - // latin small letter s with cedilla 254->351 - $string = str_replace("\376", 'ş', $string); - - // rest of charset is the same as ISO-8859-1 - return (charset_decode_iso_8859_1($string)); -} - - -/* - ISO/IEC 8859-13:1998 Latin Alphabet No. 7 (Baltic Rim) -*/ -function charset_decode_iso_8859_13 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'iso-8859-13') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace ("\241", '”', $string); - $string = str_replace ("\245", '„', $string); - $string = str_replace ("\250", 'Ø', $string); - $string = str_replace ("\252", 'Ŗ', $string); - $string = str_replace ("\257", 'Æ', $string); - $string = str_replace ("\264", '“', $string); - $string = str_replace ("\270", 'ø', $string); - $string = str_replace ("\272", 'ŗ', $string); - $string = str_replace ("\277", 'æ', $string); - $string = str_replace ("\300", 'Ą', $string); - $string = str_replace ("\301", 'Į', $string); - $string = str_replace ("\302", 'Ā', $string); - $string = str_replace ("\303", 'Ć', $string); - $string = str_replace ("\306", 'Ę', $string); - $string = str_replace ("\307", 'Ē', $string); - $string = str_replace ("\310", 'Č', $string); - $string = str_replace ("\312", 'Ź', $string); - $string = str_replace ("\313", 'Ė', $string); - $string = str_replace ("\314", 'Ģ', $string); - $string = str_replace ("\315", 'Ķ', $string); - $string = str_replace ("\316", 'Ī', $string); - $string = str_replace ("\317", 'Ļ', $string); - $string = str_replace ("\320", 'Š', $string); - $string = str_replace ("\321", 'Ń', $string); - $string = str_replace ("\322", 'Ņ', $string); - $string = str_replace ("\324", 'Ō', $string); - $string = str_replace ("\330", 'Ų', $string); - $string = str_replace ("\331", 'Ł', $string); - $string = str_replace ("\332", 'Ś', $string); - $string = str_replace ("\333", 'Ū', $string); - $string = str_replace ("\335", 'Ż', $string); - $string = str_replace ("\336", 'Ž', $string); - $string = str_replace ("\340", 'ą', $string); - $string = str_replace ("\341", 'į', $string); - $string = str_replace ("\342", 'ā', $string); - $string = str_replace ("\343", 'ć', $string); - $string = str_replace ("\346", 'ę', $string); - $string = str_replace ("\347", 'ē', $string); - $string = str_replace ("\350", 'č', $string); - $string = str_replace ("\352", 'ź', $string); - $string = str_replace 
("\353", 'ė', $string); - $string = str_replace ("\354", 'ģ', $string); - $string = str_replace ("\355", 'ķ', $string); - $string = str_replace ("\356", 'ī', $string); - $string = str_replace ("\357", 'ļ', $string); - $string = str_replace ("\360", 'š', $string); - $string = str_replace ("\361", 'ń', $string); - $string = str_replace ("\362", 'ņ', $string); - $string = str_replace ("\364", 'ō', $string); - $string = str_replace ("\370", 'ų', $string); - $string = str_replace ("\371", 'ł', $string); - $string = str_replace ("\372", 'ś', $string); - $string = str_replace ("\373", 'ū', $string); - $string = str_replace ("\375", 'ż', $string); - $string = str_replace ("\376", 'ž', $string); - $string = str_replace ("\377", '’', $string); - - // rest of charset is the same as ISO-8859-1 - return (charset_decode_iso_8859_1($string)); -} - -/* - * iso-8859-15 is Latin 9 and has very much the same use as Latin 1 - * but has the Euro symbol and some characters needed for French. - */ -function charset_decode_iso_8859_15 ($string) { - // Euro sign - $string = str_replace ("\244", '€', $string); - // Latin capital letter S with caron - $string = str_replace ("\246", 'Š', $string); - // Latin small letter s with caron - $string = str_replace ("\250", 'š', $string); - // Latin capital letter Z with caron - $string = str_replace ("\264", 'Ž', $string); - // Latin small letter z with caron - $string = str_replace ("\270", 'ž', $string); - // Latin capital ligature OE - $string = str_replace ("\274", 'Œ', $string); - // Latin small ligature oe - $string = str_replace ("\275", 'œ', $string); - // Latin capital letter Y with diaeresis - $string = str_replace ("\276", 'Ÿ', $string); - - return (charset_decode_iso_8859_1($string)); -} - /* Remove all 8 bit characters from all other ISO-8859 character sets */ function charset_decode_iso_8859_default ($string) { @@ -762,935 +257,13 @@ function charset_decode_ns_4551_1 ($string) { return strtr ($string, "[\\]{|}", "ÆØÅæøå"); } -/* - * 
KOI8-R is used to encode Russian mail (Cyrrilic). Defined in RFC - * 1489. - */ -function charset_decode_koi8r ($string) { - global $default_charset; - - if ($default_charset == 'koi8-r') { - return $string; - } - - /* - * Convert to Unicode HTML entities. - * This code is rather ineffective. - */ - $string = str_replace("\200", '─', $string); - $string = str_replace("\201", '│', $string); - $string = str_replace("\202", '┌', $string); - $string = str_replace("\203", '┐', $string); - $string = str_replace("\204", '└', $string); - $string = str_replace("\205", '┘', $string); - $string = str_replace("\206", '├', $string); - $string = str_replace("\207", '┤', $string); - $string = str_replace("\210", '┬', $string); - $string = str_replace("\211", '┴', $string); - $string = str_replace("\212", '┼', $string); - $string = str_replace("\213", '▀', $string); - $string = str_replace("\214", '▄', $string); - $string = str_replace("\215", '█', $string); - $string = str_replace("\216", '▌', $string); - $string = str_replace("\217", '▐', $string); - $string = str_replace("\220", '░', $string); - $string = str_replace("\221", '▒', $string); - $string = str_replace("\222", '▓', $string); - $string = str_replace("\223", '⌠', $string); - $string = str_replace("\224", '■', $string); - $string = str_replace("\225", '∙', $string); - $string = str_replace("\226", '√', $string); - $string = str_replace("\227", '≈', $string); - $string = str_replace("\230", '≤', $string); - $string = str_replace("\231", '≥', $string); - $string = str_replace("\232", ' ', $string); - $string = str_replace("\233", '⌡', $string); - $string = str_replace("\234", '°', $string); - $string = str_replace("\235", '²', $string); - $string = str_replace("\236", '·', $string); - $string = str_replace("\237", '÷', $string); - $string = str_replace("\240", '═', $string); - $string = str_replace("\241", '║', $string); - $string = str_replace("\242", '╒', $string); - $string = str_replace("\243", 'ё', $string); - 
$string = str_replace("\244", '╓', $string); - $string = str_replace("\245", '╔', $string); - $string = str_replace("\246", '╕', $string); - $string = str_replace("\247", '╖', $string); - $string = str_replace("\250", '╗', $string); - $string = str_replace("\251", '╘', $string); - $string = str_replace("\252", '╙', $string); - $string = str_replace("\253", '╚', $string); - $string = str_replace("\254", '╛', $string); - $string = str_replace("\255", '╜', $string); - $string = str_replace("\256", '╝', $string); - $string = str_replace("\257", '╞', $string); - $string = str_replace("\260", '╟', $string); - $string = str_replace("\261", '╠', $string); - $string = str_replace("\262", '╡', $string); - $string = str_replace("\263", 'Ё', $string); - $string = str_replace("\264", '╢', $string); - $string = str_replace("\265", '╣', $string); - $string = str_replace("\266", '╤', $string); - $string = str_replace("\267", '╥', $string); - $string = str_replace("\270", '╦', $string); - $string = str_replace("\271", '╧', $string); - $string = str_replace("\272", '╨', $string); - $string = str_replace("\273", '╩', $string); - $string = str_replace("\274", '╪', $string); - $string = str_replace("\275", '╫', $string); - $string = str_replace("\276", '╬', $string); - $string = str_replace("\277", '©', $string); - $string = str_replace("\300", 'ю', $string); - $string = str_replace("\301", 'а', $string); - $string = str_replace("\302", 'б', $string); - $string = str_replace("\303", 'ц', $string); - $string = str_replace("\304", 'д', $string); - $string = str_replace("\305", 'е', $string); - $string = str_replace("\306", 'ф', $string); - $string = str_replace("\307", 'г', $string); - $string = str_replace("\310", 'х', $string); - $string = str_replace("\311", 'и', $string); - $string = str_replace("\312", 'й', $string); - $string = str_replace("\313", 'к', $string); - $string = str_replace("\314", 'л', $string); - $string = str_replace("\315", 'м', $string); - $string = 
str_replace("\316", 'н', $string); - $string = str_replace("\317", 'о', $string); - $string = str_replace("\320", 'п', $string); - $string = str_replace("\321", 'я', $string); - $string = str_replace("\322", 'р', $string); - $string = str_replace("\323", 'с', $string); - $string = str_replace("\324", 'т', $string); - $string = str_replace("\325", 'у', $string); - $string = str_replace("\326", 'ж', $string); - $string = str_replace("\327", 'в', $string); - $string = str_replace("\330", 'ь', $string); - $string = str_replace("\331", 'ы', $string); - $string = str_replace("\332", 'з', $string); - $string = str_replace("\333", 'ш', $string); - $string = str_replace("\334", 'э', $string); - $string = str_replace("\335", 'щ', $string); - $string = str_replace("\336", 'ч', $string); - $string = str_replace("\337", 'ъ', $string); - $string = str_replace("\340", 'Ю', $string); - $string = str_replace("\341", 'А', $string); - $string = str_replace("\342", 'Б', $string); - $string = str_replace("\343", 'Ц', $string); - $string = str_replace("\344", 'Д', $string); - $string = str_replace("\345", 'Е', $string); - $string = str_replace("\346", 'Ф', $string); - $string = str_replace("\347", 'Г', $string); - $string = str_replace("\350", 'Х', $string); - $string = str_replace("\351", 'И', $string); - $string = str_replace("\352", 'Й', $string); - $string = str_replace("\353", 'К', $string); - $string = str_replace("\354", 'Л', $string); - $string = str_replace("\355", 'М', $string); - $string = str_replace("\356", 'Н', $string); - $string = str_replace("\357", 'О', $string); - $string = str_replace("\360", 'П', $string); - $string = str_replace("\361", 'Я', $string); - $string = str_replace("\362", 'Р', $string); - $string = str_replace("\363", 'С', $string); - $string = str_replace("\364", 'Т', $string); - $string = str_replace("\365", 'У', $string); - $string = str_replace("\366", 'Ж', $string); - $string = str_replace("\367", 'В', $string); - $string = str_replace("\370", 'Ь', 
$string); - $string = str_replace("\371", 'Ы', $string); - $string = str_replace("\372", 'З', $string); - $string = str_replace("\373", 'Ш', $string); - $string = str_replace("\374", 'Э', $string); - $string = str_replace("\375", 'Щ', $string); - $string = str_replace("\376", 'Ч', $string); - $string = str_replace("\377", 'Ъ', $string); - - return $string; -} - -/* - * KOI8-U is used to encode Ukrainian mail (Cyrrilic). Defined in RFC - * 2319. - */ -function charset_decode_koi8u ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'koi8-u') { - return $string; - } - - /* Only do the slow convert if there are 8-bit characters */ - if (! ereg("[\200-\377]", $string)) - return $string; - - // BOX DRAWINGS LIGHT HORIZONTAL - $string = str_replace("\200", '─', $string); - // BOX DRAWINGS LIGHT VERTICAL - $string = str_replace("\201", '│', $string); - // BOX DRAWINGS LIGHT DOWN AND RIGHT - $string = str_replace("\202", '┌', $string); - // BOX DRAWINGS LIGHT DOWN AND LEFT - $string = str_replace("\203", '┐', $string); - // BOX DRAWINGS LIGHT UP AND RIGHT - $string = str_replace("\204", '└', $string); - // BOX DRAWINGS LIGHT UP AND LEFT - $string = str_replace("\205", '┘', $string); - // BOX DRAWINGS LIGHT VERTICAL AND RIGHT - $string = str_replace("\206", '├', $string); - // BOX DRAWINGS LIGHT VERTICAL AND LEFT - $string = str_replace("\207", '┤', $string); - // BOX DRAWINGS LIGHT DOWN AND HORIZONTAL - $string = str_replace("\210", '┬', $string); - // BOX DRAWINGS LIGHT UP AND HORIZONTAL - $string = str_replace("\211", '┴', $string); - // BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL - $string = str_replace("\212", '┼', $string); - // UPPER HALF BLOCK - $string = str_replace("\213", '▀', $string); - // LOWER HALF BLOCK - $string = str_replace("\214", '▄', $string); - // FULL BLOCK - $string = str_replace("\215", '█', $string); - // LEFT HALF BLOCK - $string = str_replace("\216", '▌', $string); - // RIGHT HALF BLOCK - $string = str_replace("\217", 
'▐', $string); - // LIGHT SHADE - $string = str_replace("\220", '░', $string); - // MEDIUM SHADE - $string = str_replace("\221", '▒', $string); - // DARK SHADE - $string = str_replace("\222", '▓', $string); - // TOP HALF INTEGRAL - $string = str_replace("\223", '⌠', $string); - // BLACK SQUARE - $string = str_replace("\224", '■', $string); - // BULLET OPERATOR - $string = str_replace("\225", '∙', $string); - // SQUARE ROOT - $string = str_replace("\226", '√', $string); - // ALMOST EQUAL TO - $string = str_replace("\227", '≈', $string); - // LESS THAN OR EQUAL TO - $string = str_replace("\230", '≤', $string); - // GREATER THAN OR EQUAL TO - $string = str_replace("\231", '≥', $string); - // NO-BREAK SPACE - $string = str_replace("\232", ' ', $string); - // BOTTOM HALF INTEGRAL - $string = str_replace("\233", '⌡', $string); - // DEGREE SIGN - $string = str_replace("\234", '°', $string); - // SUPERSCRIPT DIGIT TWO - $string = str_replace("\235", '²', $string); - // MIDDLE DOT - $string = str_replace("\236", '·', $string); - // DIVISION SIGN - $string = str_replace("\237", '÷', $string); - // BOX DRAWINGS DOUBLE HORIZONTAL - $string = str_replace("\240", '═', $string); - // BOX DRAWINGS DOUBLE VERTICAL - $string = str_replace("\241", '║', $string); - // BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE - $string = str_replace("\242", '╒', $string); - // CYRILLIC SMALL LETTER IO - $string = str_replace("\243", 'ё', $string); - // CYRILLIC SMALL LETTER UKRAINIAN IE - $string = str_replace("\244", 'є', $string); - // BOX DRAWINGS DOUBLE DOWN AND RIGHT - $string = str_replace("\245", '╔', $string); - // CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I - $string = str_replace("\246", 'і', $string); - // CYRILLIC SMALL LETTER YI (Ukrainian) - $string = str_replace("\247", 'ї', $string); - // BOX DRAWINGS DOUBLE DOWN AND LEFT - $string = str_replace("\250", '╗', $string); - // BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE - $string = str_replace("\251", '╘', $string); - // BOX DRAWINGS UP 
DOUBLE AND RIGHT SINGLE - $string = str_replace("\252", '╙', $string); - // BOX DRAWINGS DOUBLE UP AND RIGHT - $string = str_replace("\253", '╚', $string); - // BOX DRAWINGS UP SINGLE AND LEFT DOUBLE - $string = str_replace("\254", '╛', $string); - // CYRILLIC SMALL LETTER GHE WITH UPTURN - $string = str_replace("\255", 'ґ', $string); - // BOX DRAWINGS DOUBLE UP AND LEFT - $string = str_replace("\256", '╝', $string); - // BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE - $string = str_replace("\257", '╞', $string); - // BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE - $string = str_replace("\260", '╟', $string); - // BOX DRAWINGS DOUBLE VERTICAL AND RIGHT - $string = str_replace("\261", '╠', $string); - // BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE - $string = str_replace("\262", '╡', $string); - // CYRILLIC CAPITAL LETTER IO - $string = str_replace("\263", 'Ё', $string); - // CYRILLIC CAPITAL LETTER UKRAINIAN IE - $string = str_replace("\264", 'Є', $string); - // DOUBLE VERTICAL AND LEFT - $string = str_replace("\265", '╣', $string); - // CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I - $string = str_replace("\266", 'І', $string); - // CYRILLIC CAPITAL LETTER YI (Ukrainian) - $string = str_replace("\267", 'Ї', $string); - // BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL - $string = str_replace("\270", '╦', $string); - // BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE - $string = str_replace("\271", '╧', $string); - // BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE - $string = str_replace("\272", '╨', $string); - // BOX DRAWINGS DOUBLE UP AND HORIZONTAL - $string = str_replace("\273", '╩', $string); - // BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE - $string = str_replace("\274", '╪', $string); - // CYRILLIC CAPITAL LETTER GHE WITH UPTURN - $string = str_replace("\275", 'Ґ', $string); - // BOX DRAWINGS DOUBLE VERTICAL AND HORIZONTAL - $string = str_replace("\276", '╬', $string); - // COPYRIGHT SIGN - $string = str_replace("\277", '©', $string); - // CYRILLIC SMALL 
LETTER YU - $string = str_replace("\300", 'ю', $string); - // CYRILLIC SMALL LETTER A - $string = str_replace("\301", 'а', $string); - // CYRILLIC SMALL LETTER BE - $string = str_replace("\302", 'б', $string); - // CYRILLIC SMALL LETTER TSE - $string = str_replace("\303", 'ц', $string); - // CYRILLIC SMALL LETTER DE - $string = str_replace("\304", 'д', $string); - // CYRILLIC SMALL LETTER IE - $string = str_replace("\305", 'е', $string); - // CYRILLIC SMALL LETTER EF - $string = str_replace("\306", 'ф', $string); - // CYRILLIC SMALL LETTER GHE - $string = str_replace("\307", 'г', $string); - // CYRILLIC SMALL LETTER HA - $string = str_replace("\310", 'х', $string); - // CYRILLIC SMALL LETTER I - $string = str_replace("\311", 'и', $string); - // CYRILLIC SMALL LETTER SHORT I - $string = str_replace("\312", 'й', $string); - // CYRILLIC SMALL LETTER KA - $string = str_replace("\313", 'к', $string); - // CYRILLIC SMALL LETTER EL - $string = str_replace("\314", 'л', $string); - // CYRILLIC SMALL LETTER EM - $string = str_replace("\315", 'м', $string); - // CYRILLIC SMALL LETTER EN - $string = str_replace("\316", 'н', $string); - // CYRILLIC SMALL LETTER O - $string = str_replace("\317", 'о', $string); - // CYRILLIC SMALL LETTER PE - $string = str_replace("\320", 'п', $string); - // CYRILLIC SMALL LETTER YA - $string = str_replace("\321", 'я', $string); - // CYRILLIC SMALL LETTER ER - $string = str_replace("\322", 'р', $string); - // CYRILLIC SMALL LETTER ES - $string = str_replace("\323", 'с', $string); - // CYRILLIC SMALL LETTER TE - $string = str_replace("\324", 'т', $string); - // CYRILLIC SMALL LETTER U - $string = str_replace("\325", 'у', $string); - // CYRILLIC SMALL LETTER ZHE - $string = str_replace("\326", 'ж', $string); - // CYRILLIC SMALL LETTER VE - $string = str_replace("\327", 'в', $string); - // CYRILLIC SMALL LETTER SOFT SIGN - $string = str_replace("\330", 'ь', $string); - // CYRILLIC SMALL LETTER YERU - $string = str_replace("\331", 'ы', $string); - // 
CYRILLIC SMALL LETTER ZE - $string = str_replace("\332", 'з', $string); - // CYRILLIC SMALL LETTER SHA - $string = str_replace("\333", 'ш', $string); - // CYRILLIC SMALL LETTER E - $string = str_replace("\334", 'э', $string); - // CYRILLIC SMALL LETTER SHCHA - $string = str_replace("\335", 'щ', $string); - // CYRILLIC SMALL LETTER CHE - $string = str_replace("\336", 'ч', $string); - // CYRILLIC SMALL LETTER HARD SIGN - $string = str_replace("\337", 'ъ', $string); - // CYRILLIC CAPITAL LETTER YU - $string = str_replace("\340", 'Ю', $string); - // CYRILLIC CAPITAL LETTER A - $string = str_replace("\341", 'А', $string); - // CYRILLIC CAPITAL LETTER BE - $string = str_replace("\342", 'Б', $string); - // CYRILLIC CAPITAL LETTER TSE - $string = str_replace("\343", 'Ц', $string); - // CYRILLIC CAPITAL LETTER DE - $string = str_replace("\344", 'Д', $string); - // CYRILLIC CAPITAL LETTER IE - $string = str_replace("\345", 'Е', $string); - // CYRILLIC CAPITAL LETTER EF - $string = str_replace("\346", 'Ф', $string); - // CYRILLIC CAPITAL LETTER GHE - $string = str_replace("\347", 'Г', $string); - // CYRILLIC CAPITAL LETTER HA - $string = str_replace("\350", 'Х', $string); - // CYRILLIC CAPITAL LETTER I - $string = str_replace("\351", 'И', $string); - // CYRILLIC CAPITAL LETTER SHORT I - $string = str_replace("\352", 'Й', $string); - // CYRILLIC CAPITAL LETTER KA - $string = str_replace("\353", 'К', $string); - // CYRILLIC CAPITAL LETTER EL - $string = str_replace("\354", 'Л', $string); - // CYRILLIC CAPITAL LETTER EM - $string = str_replace("\355", 'М', $string); - // CYRILLIC CAPITAL LETTER EN - $string = str_replace("\356", 'Н', $string); - // CYRILLIC CAPITAL LETTER O - $string = str_replace("\357", 'О', $string); - // CYRILLIC CAPITAL LETTER PE - $string = str_replace("\360", 'П', $string); - // CYRILLIC CAPITAL LETTER YA - $string = str_replace("\361", 'Я', $string); - // CYRILLIC CAPITAL LETTER ER - $string = str_replace("\362", 'Р', $string); - // CYRILLIC CAPITAL 
LETTER ES - $string = str_replace("\363", 'С', $string); - // CYRILLIC CAPITAL LETTER TE - $string = str_replace("\364", 'Т', $string); - // CYRILLIC CAPITAL LETTER U - $string = str_replace("\365", 'У', $string); - // CYRILLIC CAPITAL LETTER ZHE - $string = str_replace("\366", 'Ж', $string); - // CYRILLIC CAPITAL LETTER VE - $string = str_replace("\367", 'В', $string); - // CYRILLIC CAPITAL LETTER SOFT SIGN - $string = str_replace("\370", 'Ь', $string); - // CYRILLIC CAPITAL LETTER YERU - $string = str_replace("\371", 'Ы', $string); - // CYRILLIC CAPITAL LETTER ZE - $string = str_replace("\372", 'З', $string); - // CYRILLIC CAPITAL LETTER SHA - $string = str_replace("\373", 'Ш', $string); - // CYRILLIC CAPITAL LETTER E - $string = str_replace("\374", 'Э', $string); - // CYRILLIC CAPITAL LETTER SHCHA - $string = str_replace("\375", 'Щ', $string); - // CYRILLIC CAPITAL LETTER CHE - $string = str_replace("\376", 'Ч', $string); - // CYRILLIC CAPITAL LETTER HARD SIGN - $string = str_replace("\377", 'Ъ', $string); - - return $string; -} - -/* - * windows-1251 is used to encode Bulgarian mail (Cyrrilic). - */ -function charset_decode_windows_1251 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1251') { - return $string; - } - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - // CYRILLIC CAPITAL LETTER DJE (Serbocroatian) - $string = str_replace("\200", 'Ђ', $string); - // CYRILLIC CAPITAL LETTER GJE - $string = str_replace("\201", 'Ѓ', $string); - // SINGLE LOW-9 QUOTATION MARK - $string = str_replace("\202", '‚', $string); - // CYRILLIC SMALL LETTER GJE - $string = str_replace("\203", 'ѓ', $string); - // DOUBLE LOW-9 QUOTATION MARK - $string = str_replace("\204", '„', $string); - // HORIZONTAL ELLIPSIS - $string = str_replace("\205", '…', $string); - // DAGGER - $string = str_replace("\206", '†', $string); - // DOUBLE DAGGER - $string = str_replace("\207", '‡', $string); - // EURO SIGN - $string = str_replace("\210", '€', $string); - // PER MILLE SIGN - $string = str_replace("\211", '‰', $string); - // CYRILLIC CAPITAL LETTER LJE - $string = str_replace("\212", 'Љ', $string); - // SINGLE LEFT-POINTING ANGLE QUOTATION MARK - $string = str_replace("\213", '‹', $string); - // CYRILLIC CAPITAL LETTER NJE - $string = str_replace("\214", 'Њ', $string); - // CYRILLIC CAPITAL LETTER KJE - $string = str_replace("\215", 'Ќ', $string); - // CYRILLIC CAPITAL LETTER TSHE (Serbocroatian) - $string = str_replace("\216", 'Ћ', $string); - // CYRILLIC CAPITAL LETTER DZHE - $string = str_replace("\217", 'Џ', $string); - // CYRILLIC SMALL LETTER DJE (Serbocroatian) - $string = str_replace("\220", 'ђ', $string); - // LEFT SINGLE QUOTATION MARK - $string = str_replace("\221", '‘', $string); - // RIGHT SINGLE QUOTATION MARK - $string = str_replace("\222", '’', $string); - // LEFT DOUBLE QUOTATION MARK - $string = str_replace("\223", '“', $string); - // RIGHT DOUBLE QUOTATION MARK - $string = str_replace("\224", '”', $string); - // BULLET - $string = str_replace("\225", '•', $string); - // EN DASH - $string = str_replace("\226", '–', $string); - // EM DASH - $string = str_replace("\227", '—', $string); - // TRADE MARK SIGN - $string = str_replace("\231", '™', $string); - // CYRILLIC SMALL LETTER LJE - 
$string = str_replace("\232", 'љ', $string); - // SINGLE RIGHT-POINTING ANGLE QUOTATION MARK - $string = str_replace("\233", '›', $string); - // CYRILLIC SMALL LETTER NJE - $string = str_replace("\234", 'њ', $string); - // CYRILLIC SMALL LETTER KJE - $string = str_replace("\235", 'ќ', $string); - // CYRILLIC SMALL LETTER TSHE (Serbocroatian) - $string = str_replace("\236", 'ћ', $string); - // CYRILLIC SMALL LETTER DZHE - $string = str_replace("\237", 'џ', $string); - // NO-BREAK SPACE - $string = str_replace("\240", ' ', $string); - // CYRILLIC CAPITAL LETTER SHORT U (Byelorussian) - $string = str_replace("\241", 'Ў', $string); - // CYRILLIC SMALL LETTER SHORT U (Byelorussian) - $string = str_replace("\242", 'ў', $string); - // CYRILLIC CAPITAL LETTER JE - $string = str_replace("\243", 'Ј', $string); - // CURRENCY SIGN - $string = str_replace("\244", '¤', $string); - // CYRILLIC CAPITAL LETTER GHE WITH UPTURN - $string = str_replace("\245", 'Ґ', $string); - // BROKEN BAR - $string = str_replace("\246", '¦', $string); - // SECTION SIGN - $string = str_replace("\247", '§', $string); - // CYRILLIC CAPITAL LETTER IO - $string = str_replace("\250", 'Ё', $string); - // COPYRIGHT SIGN - $string = str_replace("\251", '©', $string); - // CYRILLIC CAPITAL LETTER UKRAINIAN IE - $string = str_replace("\252", 'Є', $string); - // LEFT-POINTING DOUBLE ANGLE QUOTATION MARK - $string = str_replace("\253", '«', $string); - // NOT SIGN - $string = str_replace("\254", '¬', $string); - // SOFT HYPHEN - $string = str_replace("\255", '­', $string); - // REGISTERED SIGN - $string = str_replace("\256", '®', $string); - // CYRILLIC CAPITAL LETTER YI (Ukrainian) - $string = str_replace("\257", 'Ї', $string); - // DEGREE SIGN - $string = str_replace("\260", '°', $string); - // PLUS-MINUS SIGN - $string = str_replace("\261", '±', $string); - // CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I - $string = str_replace("\262", 'І', $string); - // CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I - 
$string = str_replace("\263", 'і', $string); - // CYRILLIC SMALL LETTER GHE WITH UPTURN - $string = str_replace("\264", 'ґ', $string); - // MICRO SIGN - $string = str_replace("\265", 'µ', $string); - // PILCROW SIGN - $string = str_replace("\266", '¶', $string); - // MIDDLE DOT - $string = str_replace("\267", '·', $string); - // CYRILLIC SMALL LETTER IO - $string = str_replace("\270", 'ё', $string); - // NUMERO SIGN - $string = str_replace("\271", '№', $string); - // CYRILLIC SMALL LETTER UKRAINIAN IE - $string = str_replace("\272", 'є', $string); - // RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK - $string = str_replace("\273", '»', $string); - // CYRILLIC SMALL LETTER JE - $string = str_replace("\274", 'ј', $string); - // CYRILLIC CAPITAL LETTER DZE - $string = str_replace("\275", 'Ѕ', $string); - // CYRILLIC SMALL LETTER DZE - $string = str_replace("\276", 'ѕ', $string); - // CYRILLIC SMALL LETTER YI (Ukrainian) - $string = str_replace("\277", 'ї', $string); - - // 192-255 > 1040-1103 (+848) - $string = preg_replace("/([\300-\377])/e","'&#' . (ord('\\1')+848) . ';'",$string); - - return $string; -} - -/* - windows-1253 (Greek) - */ -function charset_decode_windows_1253 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1253') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace("\200", '€', $string); - $string = str_replace("\202", '‚', $string); - $string = str_replace("\203", 'ƒ', $string); - $string = str_replace("\204", '„', $string); - $string = str_replace("\205", '…', $string); - $string = str_replace("\206", '†', $string); - $string = str_replace("\207", '‡', $string); - $string = str_replace("\211", '‰', $string); - $string = str_replace("\213", '‹', $string); - $string = str_replace("\221", '‘', $string); - $string = str_replace("\222", '’', $string); - $string = str_replace("\223", '“', $string); - $string = str_replace("\224", '”', $string); - $string = str_replace("\225", '•', $string); - $string = str_replace("\226", '–', $string); - $string = str_replace("\227", '—', $string); - $string = str_replace("\231", '™', $string); - $string = str_replace("\233", '›', $string); - $string = str_replace("\241", '΅', $string); - $string = str_replace("\242", 'Ά', $string); - $string = str_replace ("\257", '―', $string); - $string = str_replace("\264", '΄', $string); - $string = str_replace("\270", 'Έ', $string); - $string = str_replace ("\271", 'Ή', $string); - $string = str_replace ("\272", 'Ί', $string); - $string = str_replace ("\274", 'Ό', $string); - // cycle for 190-254 symbols - $string = preg_replace("/([\274-\376])/e","'&#' . (ord('\\1')+720);",$string); - - // Rest of charset is like iso-8859-1 - return (charset_decode_iso_8859_1($string)); -} - -/* - windows-1254 (Turks) - */ -function charset_decode_windows_1254 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1254') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - // Euro sign 128 -> 8364 - $string = str_replace("\200", '€', $string); - // Single low-9 quotation mark 130 -> 8218 - $string = str_replace("\202", '‚', $string); - // latin small letter f with hook 131 -> 402 - $string = str_replace("\203", 'ƒ', $string); - // Double low-9 quotation mark 132 -> 8222 - $string = str_replace("\204", '„', $string); - // horizontal ellipsis 133 -> 8230 - $string = str_replace("\205", '…', $string); - // dagger 134 -> 8224 - $string = str_replace("\206", '†', $string); - // double dagger 135 -> 8225 - $string = str_replace("\207", '‡', $string); - // modifier letter circumflex accent 136->710 - $string = str_replace("\210", 'ˆ', $string); - // per mille sign 137 -> 8240 - $string = str_replace("\211", '‰', $string); - // latin capital letter s with caron 138 -> 352 - $string = str_replace("\212", 'Š', $string); - // single left-pointing angle quotation mark 139 -> 8249 - $string = str_replace("\213", '‹', $string); - // latin capital ligature oe 140 -> 338 - $string = str_replace("\214", 'Œ', $string); - // left single quotation mark 145 -> 8216 - $string = str_replace("\221", '‘', $string); - // right single quotation mark 146 -> 8217 - $string = str_replace("\222", '’', $string); - // left double quotation mark 147 -> 8220 - $string = str_replace("\223", '“', $string); - // right double quotation mark 148 -> 8221 - $string = str_replace("\224", '”', $string); - // bullet 149 -> 8226 - $string = str_replace("\225", '•', $string); - // en dash 150 -> 8211 - $string = str_replace("\226", '–', $string); - // em dash 151 -> 8212 - $string = str_replace("\227", '—', $string); - // small tilde 152 -> 732 - $string = str_replace("\230", '˜', $string); - // trade mark sign 153 -> 8482 - $string = str_replace("\231", '™', $string); - // latin small letter s with caron 154 -> 353 - $string = str_replace("\232", 'š', $string); - // single right-pointing angle quotation mark 155 -> 8250 - 
$string = str_replace("\233", '›', $string); - // latin small ligature oe 156 -> 339 - $string = str_replace("\234", 'œ', $string); - // latin capital letter y with diaresis 159->376 - $string = str_replace("\237", 'Ÿ', $string); - // latin capital letter g with breve 208->286 - $string = str_replace("\320", 'Ğ', $string); - // latin capital letter i with dot above 221->304 - $string = str_replace("\335", 'İ', $string); - // latin capital letter s with cedilla 222->350 - $string = str_replace("\336", 'Ş', $string); - // latin small letter g with breve 240->287 - $string = str_replace("\360", 'ğ', $string); - // latin small letter dotless i 253->305 - $string = str_replace("\375", 'ı', $string); - // latin small letter s with cedilla 254->351 - $string = str_replace("\376", 'ş', $string); - - // Rest of charset is like iso-8859-1 - return (charset_decode_iso_8859_1($string)); -} - -/* - windows-1255 (Hebr) - */ -function charset_decode_windows_1255 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1255') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace("\200", '€', $string); - $string = str_replace("\202", '‚', $string); - $string = str_replace("\203", 'ƒ', $string); - $string = str_replace("\204", '„', $string); - $string = str_replace("\205", '…', $string); - $string = str_replace("\206", '†', $string); - $string = str_replace("\207", '‡', $string); - $string = str_replace("\211", '‰', $string); - $string = str_replace("\213", '‹', $string); - $string = str_replace("\221", '‘', $string); - $string = str_replace("\222", '’', $string); - $string = str_replace("\223", '“', $string); - $string = str_replace("\224", '”', $string); - $string = str_replace("\225", '•', $string); - $string = str_replace("\226", '–', $string); - $string = str_replace("\227", '—', $string); - $string = str_replace("\231", '™', $string); - $string = str_replace("\233", '›', $string); - $string = str_replace("\240", ' ', $string); - // 162-169 - $string = preg_replace("/([\242-\251])/e","'&#' . ord('\\1') . ';'",$string); - $string = str_replace("\252", '×', $string); - // 171-174 - $string = preg_replace("/([\253-\256])/e","'&#' . ord('\\1') . ';'",$string); - $string = str_replace ("\257", '̍', $string); - // 176-185 - $string = preg_replace("/([\260-\271])/e","'&#' . ord('\\1') . ';'",$string); - $string = str_replace ("\272", '÷', $string); - // 187-190 - $string = preg_replace("/([\273-\276])/e","'&#' . ord('\\1') . ';'",$string); - $string = str_replace ("\337", '‗', $string); - // 224-250 1488-1514 (+1264) - $string = preg_replace("/([\340-\372])/e","'&#' . (ord('\\1')+1264) . ';'",$string); - - return ($string); -} - -/* - windows-1256 (Arab) - */ -function charset_decode_windows_1256 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1256') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace("\200", '،', $string); - $string = str_replace("\202", '‚', $string); - $string = str_replace("\204", '„', $string); - $string = str_replace("\205", '…', $string); - $string = str_replace("\206", '†', $string); - $string = str_replace("\207", '‡', $string); - $string = str_replace("\211", '‰', $string); - $string = str_replace("\213", '‹', $string); - $string = str_replace("\221", '‘', $string); - $string = str_replace("\222", '’', $string); - $string = str_replace("\223", '“', $string); - $string = str_replace("\224", '”', $string); - $string = str_replace("\225", '•', $string); - $string = str_replace("\226", '–', $string); - $string = str_replace("\227", '—', $string); - $string = str_replace("\230", '؜', $string); - $string = str_replace("\231", '™', $string); - $string = str_replace("\232", '؟', $string); - $string = str_replace("\233", '›', $string); - $string = str_replace("\234", 'ء', $string); - $string = str_replace("\235", 'آ', $string); - $string = str_replace("\236", 'أ', $string); - $string = str_replace("\237", 'Ÿ', $string); - $string = str_replace("\241", 'ؤ', $string); - $string = str_replace("\242", 'إ', $string); - $string = str_replace("\245", 'ئ', $string); - $string = str_replace ("\250", 'ا', $string); - $string = str_replace ("\252", 'ب', $string); - $string = str_replace ("\262", 'ة', $string); - $string = str_replace ("\263", 'ت', $string); - $string = str_replace ("\264", 'ث', $string); - $string = str_replace ("\270", 'ج', $string); - $string = str_replace ("\272", 'ح', $string); - $string = str_replace ("\274", 'خ', $string); - $string = str_replace ("\275", 'د', $string); - $string = str_replace ("\276", 'ذ', $string); - $string = str_replace ("\277", 'ر', $string); - $string = str_replace ("\301", 'ز', $string); - $string = str_replace ("\304", 'س', $string); - $string = str_replace ("\305", 'ش', $string); - $string = str_replace ("\306", 'ص', $string); - 
$string = str_replace ("\314", 'ض', $string); - $string = str_replace ("\315", 'ط', $string); - $string = str_replace ("\320", 'ظ', $string); - $string = str_replace ("\321", 'ع', $string); - $string = str_replace ("\322", 'غ', $string); - $string = str_replace ("\323", 'ـ', $string); - $string = str_replace ("\325", 'ف', $string); - $string = str_replace ("\326", 'ق', $string); - $string = str_replace ("\330", 'ك', $string); - $string = str_replace ("\332", 'گ', $string); - $string = str_replace ("\335", 'ل', $string); - $string = str_replace ("\336", 'م', $string); - $string = str_replace ("\337", 'ن', $string); - $string = str_replace ("\341", 'ه', $string); - $string = str_replace ("\344", 'و', $string); - $string = str_replace ("\345", 'ى', $string); - $string = str_replace ("\346", 'ي', $string); - $string = str_replace ("\354", 'ً', $string); - $string = str_replace ("\355", 'ٌ', $string); - $string = str_replace ("\360", 'ٍ', $string); - $string = str_replace ("\361", 'َ', $string); - $string = str_replace ("\362", 'ُ', $string); - $string = str_replace ("\363", 'ِ', $string); - $string = str_replace ("\365", 'ّ', $string); - $string = str_replace ("\366", 'ْ', $string); - - // Rest of charset is like iso-8859-1 - return (charset_decode_iso_8859_1($string)); -} - -/* - windows-1257 (BaltRim) - */ -function charset_decode_windows_1257 ($string) { - global $default_charset; - - if (strtolower($default_charset) == 'windows-1257') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! 
ereg("[\200-\377]", $string)) - return $string; - - $string = str_replace("\200", '€', $string); - $string = str_replace("\202", '‚', $string); - $string = str_replace("\204", '„', $string); - $string = str_replace("\205", '…', $string); - $string = str_replace("\206", '†', $string); - $string = str_replace("\207", '‡', $string); - $string = str_replace("\211", '‰', $string); - $string = str_replace("\213", '‹', $string); - $string = str_replace("\215", '¨', $string); - $string = str_replace("\216", 'ˇ', $string); - $string = str_replace("\217", '¸', $string); - $string = str_replace("\221", '‘', $string); - $string = str_replace("\222", '’', $string); - $string = str_replace("\223", '“', $string); - $string = str_replace("\224", '”', $string); - $string = str_replace("\225", '•', $string); - $string = str_replace("\226", '–', $string); - $string = str_replace("\227", '—', $string); - $string = str_replace("\231", '™', $string); - $string = str_replace("\233", '›', $string); - $string = str_replace("\235", '¯', $string); - $string = str_replace("\236", '˛', $string); - $string = str_replace ("\250", 'Ø', $string); - $string = str_replace ("\252", 'Ŗ', $string); - $string = str_replace ("\257", 'Æ', $string); - $string = str_replace ("\270", 'ø', $string); - $string = str_replace ("\272", 'ŗ', $string); - $string = str_replace ("\277", 'æ', $string); - $string = str_replace ("\300", 'Ą', $string); - $string = str_replace ("\301", 'Į', $string); - $string = str_replace ("\302", 'Ā', $string); - $string = str_replace ("\303", 'Ć', $string); - $string = str_replace ("\306", 'Ę', $string); - $string = str_replace ("\307", 'Ē', $string); - $string = str_replace ("\310", 'Č', $string); - $string = str_replace ("\312", 'Ź', $string); - $string = str_replace ("\313", 'Ė', $string); - $string = str_replace ("\314", 'Ģ', $string); - $string = str_replace ("\315", 'Ķ', $string); - $string = str_replace ("\316", 'Ī', $string); - $string = str_replace ("\317", 'Ļ', $string); - 
$string = str_replace ("\320", 'Š', $string); - $string = str_replace ("\321", 'Ń', $string); - $string = str_replace ("\322", 'Ņ', $string); - $string = str_replace ("\324", 'Ō', $string); - $string = str_replace ("\330", 'Ų', $string); - $string = str_replace ("\331", 'Ł', $string); - $string = str_replace ("\332", 'Ŕ', $string); - $string = str_replace ("\333", 'Ū', $string); - $string = str_replace ("\335", 'Ż', $string); - $string = str_replace ("\336", 'Ž', $string); - $string = str_replace ("\340", 'ą', $string); - $string = str_replace ("\341", 'į', $string); - $string = str_replace ("\342", 'ā', $string); - $string = str_replace ("\343", 'ć', $string); - $string = str_replace ("\346", 'ę', $string); - $string = str_replace ("\347", 'ē', $string); - $string = str_replace ("\350", 'č', $string); - $string = str_replace ("\352", 'ź', $string); - $string = str_replace ("\353", 'ė', $string); - $string = str_replace ("\354", 'ģ', $string); - $string = str_replace ("\355", 'ķ', $string); - $string = str_replace ("\356", 'ī', $string); - $string = str_replace ("\357", 'ļ', $string); - $string = str_replace ("\360", 'š', $string); - $string = str_replace ("\361", 'ń', $string); - $string = str_replace ("\362", 'ņ', $string); - $string = str_replace ("\364", 'ō', $string); - $string = str_replace ("\370", 'ų', $string); - $string = str_replace ("\371", 'ł', $string); - $string = str_replace ("\372", 'ś', $string); - $string = str_replace ("\373", 'ū', $string); - $string = str_replace ("\375", 'ż', $string); - $string = str_replace ("\376", 'ž', $string); - $string = str_replace ("\377", '˙', $string); - - // Rest of charset is like iso-8859-1 - return (charset_decode_iso_8859_1($string)); -} - /* * Set up the language to be output * if $do_search is true, then scan the browser information * for a possible language that we know */ -function set_up_language($sm_language, $do_search = false) { +function set_up_language($sm_language, $do_search = false, $default = 
false) { static $SetupAlready = 0; global $use_gettext, $languages, @@ -1708,11 +281,20 @@ function set_up_language($sm_language, $do_search = false) { $sm_language = substr($accept_lang, 0, 2); } - if (!$sm_language && isset($squirrelmail_default_language)) { + if ((!$sm_language||$default) && isset($squirrelmail_default_language)) { $squirrelmail_language = $squirrelmail_default_language; $sm_language = $squirrelmail_default_language; } $sm_notAlias = $sm_language; + + // Catching removed translation + // System reverts to English translation if user prefs contain translation + // that is not available in $languages array (admin removed directory + // with that translation) + if (!isset($languages[$sm_notAlias])) { + $sm_notAlias="en_US"; + } + while (isset($languages[$sm_notAlias]['ALIAS'])) { $sm_notAlias = $languages[$sm_notAlias]['ALIAS']; } @@ -1726,14 +308,19 @@ function set_up_language($sm_language, $do_search = false) { if (function_exists('bind_textdomain_codeset')) { bind_textdomain_codeset ("squirrelmail", $languages[$sm_notAlias]['CHARSET'] ); } + if (isset($languages[$sm_notAlias]['LOCALE'])){ + $longlocale=$languages[$sm_notAlias]['LOCALE']; + } else { + $longlocale=$sm_notAlias; + } if ( !ini_get('safe_mode') && - getenv( 'LC_ALL' ) != $sm_notAlias ) { - putenv( "LC_ALL=$sm_notAlias" ); - putenv( "LANG=$sm_notAlias" ); - putenv( "LANGUAGE=$sm_notAlias" ); + getenv( 'LC_ALL' ) != $longlocale ) { + putenv( "LC_ALL=$longlocale" ); + putenv( "LANG=$longlocale" ); + putenv( "LANGUAGE=$longlocale" ); } - setlocale(LC_ALL, $sm_notAlias); - $squirrelmail_language = $sm_notAlias; + setlocale(LC_ALL, $longlocale); + $squirrelmail_language = $sm_notAlias; if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) { header ('Content-Type: text/html; charset=EUC-JP'); if (!function_exists('mb_internal_encoding')) { @@ -1767,6 +354,10 @@ function set_my_charset(){ if (!$my_language) { $my_language = $squirrelmail_default_language ; } + // 
Catch removed translation + if (!isset($languages[$my_language])) { + $my_language="en_US"; + } while (isset($languages[$my_language]['ALIAS'])) { $my_language = $languages[$my_language]['ALIAS']; } @@ -1785,39 +376,49 @@ if (! isset($squirrelmail_language)) { } /* This array specifies the available languages. */ - -// The glibc locale is ca_ES. +$languages['bg_BG']['NAME'] = 'Bulgarian'; +$languages['bg_BG']['ALTNAME'] = 'Български'; +$languages['bg_BG']['CHARSET'] = 'windows-1251'; +$languages['bg']['ALIAS'] = 'bg_BG'; $languages['ca_ES']['NAME'] = 'Catalan'; $languages['ca_ES']['CHARSET'] = 'iso-8859-1'; $languages['ca']['ALIAS'] = 'ca_ES'; $languages['cs_CZ']['NAME'] = 'Czech'; +$languages['cs_CZ']['ALTNAME'] = 'Čeština'; $languages['cs_CZ']['CHARSET'] = 'iso-8859-2'; $languages['cs']['ALIAS'] = 'cs_CZ'; -// Danish locale is da_DK. +$languages['cy_GB']['NAME'] = 'Welsh'; +$languages['cy_GB']['ALTNAME'] = 'Cymraeg'; +$languages['cy_GB']['CHARSET'] = 'iso-8859-1'; +$languages['cy']['ALIAS'] = 'cy_GB'; +// Danish locale is da_DK. $languages['da_DK']['NAME'] = 'Danish'; +$languages['da_DK']['ALTNAME'] = 'Dansk'; $languages['da_DK']['CHARSET'] = 'iso-8859-1'; $languages['da']['ALIAS'] = 'da_DK'; -$languages['de_DE']['NAME'] = 'Deutsch'; +$languages['de_DE']['NAME'] = 'German'; +$languages['de_DE']['ALTNAME'] = 'Deutsch'; $languages['de_DE']['CHARSET'] = 'iso-8859-1'; $languages['de']['ALIAS'] = 'de_DE'; -// There is no en_EN! There is en_US, en_BR, en_AU, and so forth, -// but who cares about !US, right? Right? :) - $languages['el_GR']['NAME'] = 'Greek'; +$languages['el_GR']['ALTNAME'] = 'Ελληνικά'; $languages['el_GR']['CHARSET'] = 'iso-8859-7'; $languages['el']['ALIAS'] = 'el_GR'; +// There is no en_EN! There is en_US, en_BR, en_AU, and so forth, +// but who cares about !US, right? Right? 
:) $languages['en_US']['NAME'] = 'English'; $languages['en_US']['CHARSET'] = 'iso-8859-1'; $languages['en']['ALIAS'] = 'en_US'; $languages['es_ES']['NAME'] = 'Spanish'; +$languages['es_ES']['ALTNAME'] = 'Español'; $languages['es_ES']['CHARSET'] = 'iso-8859-1'; $languages['es']['ALIAS'] = 'es_ES'; @@ -1830,10 +431,12 @@ $languages['fo_FO']['CHARSET'] = 'iso-8859-1'; $languages['fo']['ALIAS'] = 'fo_FO'; $languages['fi_FI']['NAME'] = 'Finnish'; +$languages['fi_FI']['ALTNAME'] = 'Suomi'; $languages['fi_FI']['CHARSET'] = 'iso-8859-1'; $languages['fi']['ALIAS'] = 'fi_FI'; $languages['fr_FR']['NAME'] = 'French'; +$languages['fr_FR']['ALTNAME'] = 'Français'; $languages['fr_FR']['CHARSET'] = 'iso-8859-1'; $languages['fr']['ALIAS'] = 'fr_FR'; @@ -1842,14 +445,17 @@ $languages['hr_HR']['CHARSET'] = 'iso-8859-2'; $languages['hr']['ALIAS'] = 'hr_HR'; $languages['hu_HU']['NAME'] = 'Hungarian'; +$languages['hu_HU']['ALTNAME'] = 'Magyar'; $languages['hu_HU']['CHARSET'] = 'iso-8859-2'; $languages['hu']['ALIAS'] = 'hu_HU'; -$languages['id_ID']['NAME'] = 'Bahasa Indonesia'; +$languages['id_ID']['NAME'] = 'Indonesian'; +$languages['id_ID']['ALTNAME'] = 'Bahasa Indonesia'; $languages['id_ID']['CHARSET'] = 'iso-8859-1'; $languages['id']['ALIAS'] = 'id_ID'; $languages['is_IS']['NAME'] = 'Icelandic'; +$languages['is_IS']['ALTNAME'] = 'Íslenska'; $languages['is_IS']['CHARSET'] = 'iso-8859-1'; $languages['is']['ALIAS'] = 'is_IS'; @@ -1858,6 +464,7 @@ $languages['it_IT']['CHARSET'] = 'iso-8859-1'; $languages['it']['ALIAS'] = 'it_IT'; $languages['ja_JP']['NAME'] = 'Japanese'; +$languages['ja_JP']['ALTNAME'] = '日本語'; $languages['ja_JP']['CHARSET'] = 'iso-2022-jp'; $languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra'; $languages['ja']['ALIAS'] = 'ja_JP'; @@ -1867,38 +474,78 @@ $languages['ko_KR']['CHARSET'] = 'euc-KR'; $languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra'; $languages['ko']['ALIAS'] = 'ko_KR'; +$languages['lt_LT']['NAME'] = 'Lithuanian'; +$languages['lt_LT']['ALTNAME'] 
= 'Lietuvių'; +$languages['lt_LT']['CHARSET'] = 'utf-8'; +$languages['lt_LT']['LOCALE'] = 'lt_LT.UTF-8'; +$languages['lt']['ALIAS'] = 'lt_LT'; + $languages['nl_NL']['NAME'] = 'Dutch'; +$languages['nl_NL']['ALTNAME'] = 'Nederlands'; $languages['nl_NL']['CHARSET'] = 'iso-8859-1'; $languages['nl']['ALIAS'] = 'nl_NL'; +$languages['ms_MY']['NAME'] = 'Malay'; +$languages['ms_MY']['ALTNAME'] = 'Bahasa Melayu'; +$languages['ms_MY']['CHARSET'] = 'iso-8859-1'; +$languages['my']['ALIAS'] = 'ms_MY'; + $languages['no_NO']['NAME'] = 'Norwegian (Bokmål)'; +$languages['no_NO']['ALTNAME'] = 'Norsk (Bokmål)'; $languages['no_NO']['CHARSET'] = 'iso-8859-1'; $languages['no']['ALIAS'] = 'no_NO'; + $languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)'; +$languages['nn_NO']['ALTNAME'] = 'Norsk (Nynorsk)'; $languages['nn_NO']['CHARSET'] = 'iso-8859-1'; $languages['pl_PL']['NAME'] = 'Polish'; +$languages['pl_PL']['ALTNAME'] = 'Polski'; $languages['pl_PL']['CHARSET'] = 'iso-8859-2'; $languages['pl']['ALIAS'] = 'pl_PL'; $languages['pt_PT']['NAME'] = 'Portuguese (Portugal)'; $languages['pt_PT']['CHARSET'] = 'iso-8859-1'; +$languages['pt']['ALIAS'] = 'pt_PT'; + $languages['pt_BR']['NAME'] = 'Portuguese (Brazil)'; +$languages['pt_BR']['ALTNAME'] = 'Português do Brasil'; $languages['pt_BR']['CHARSET'] = 'iso-8859-1'; -$languages['pt']['ALIAS'] = 'pt_PT'; + +$languages['ro_RO']['NAME'] = 'Romanian'; +$languages['ro_RO']['ALTNAME'] = 'Română'; +$languages['ro_RO']['CHARSET'] = 'iso-8859-2'; +$languages['ro']['ALIAS'] = 'ro_RO'; $languages['ru_RU']['NAME'] = 'Russian'; -$languages['ru_RU']['CHARSET'] = 'koi8-r'; +$languages['ru_RU']['ALTNAME'] = 'Русский'; +$languages['ru_RU']['CHARSET'] = 'utf-8'; +$languages['ru_RU']['LOCALE'] = 'ru_RU.UTF-8'; $languages['ru']['ALIAS'] = 'ru_RU'; +$languages['sk_SK']['NAME'] = 'Slovak'; +$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; +$languages['sk']['ALIAS'] = 'sk_SK'; + +$languages['sl_SI']['NAME'] = 'Slovenian'; +$languages['sl_SI']['ALTNAME'] = 'Slovenščina'; 
+$languages['sl_SI']['CHARSET'] = 'iso-8859-2'; +$languages['sl']['ALIAS'] = 'sl_SI'; + $languages['sr_YU']['NAME'] = 'Serbian'; +$languages['sr_YU']['ALTNAME'] = 'Srpski'; $languages['sr_YU']['CHARSET'] = 'iso-8859-2'; $languages['sr']['ALIAS'] = 'sr_YU'; $languages['sv_SE']['NAME'] = 'Swedish'; +$languages['sv_SE']['ALTNAME'] = 'Svenska'; $languages['sv_SE']['CHARSET'] = 'iso-8859-1'; $languages['sv']['ALIAS'] = 'sv_SE'; +$languages['th_TH']['NAME'] = 'Thai'; +$languages['th_TH']['CHARSET'] = 'tis-620'; +$languages['th']['ALIAS'] = 'th_TH'; + $languages['tr_TR']['NAME'] = 'Turkish'; $languages['tr_TR']['CHARSET'] = 'iso-8859-9'; $languages['tr']['ALIAS'] = 'tr_TR'; @@ -1911,44 +558,20 @@ $languages['zh_CN']['NAME'] = 'Chinese Simp'; $languages['zh_CN']['CHARSET'] = 'gb2312'; $languages['cn']['ALIAS'] = 'zh_CN'; -$languages['sk_SK']['NAME'] = 'Slovak'; -$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; -$languages['sk']['ALIAS'] = 'sk_SK'; - -$languages['ro_RO']['NAME'] = 'Romanian'; -$languages['ro_RO']['CHARSET'] = 'iso-8859-2'; -$languages['ro']['ALIAS'] = 'ro_RO'; - -$languages['th_TH']['NAME'] = 'Thai'; -$languages['th_TH']['CHARSET'] = 'tis-620'; -$languages['th']['ALIAS'] = 'th_TH'; - -$languages['lt_LT']['NAME'] = 'Lithuanian'; -$languages['lt_LT']['CHARSET'] = 'windows-1257'; -$languages['lt']['ALIAS'] = 'lt_LT'; - -$languages['sl_SI']['NAME'] = 'Slovenian'; -$languages['sl_SI']['CHARSET'] = 'iso-8859-2'; -$languages['sl']['ALIAS'] = 'sl_SI'; - -$languages['bg_BG']['NAME'] = 'Bulgarian'; -$languages['bg_BG']['CHARSET'] = 'windows-1251'; -$languages['bg']['ALIAS'] = 'bg_BG'; - +/* $languages['uk_UA']['NAME'] = 'Ukrainian'; $languages['uk_UA']['CHARSET'] = 'koi8-u'; $languages['uk']['ALIAS'] = 'uk_UA'; - -$languages['cy_GB']['NAME'] = 'Welsh'; -$languages['cy_GB']['CHARSET'] = 'iso-8859-1'; -$languages['cy']['ALIAS'] = 'cy_GB'; - -$languages['vi_VN']['NAME'] = 'Vietnamese'; -$languages['vi_VN']['CHARSET'] = 'utf-8'; -$languages['vi']['ALIAS'] = 'vi_VN'; +*/ 
+/* +if ( file_exists( SM_PATH . 'locale/vi_VN') ) { + $languages['vi_VN']['NAME'] = 'Vietnamese'; + $languages['vi_VN']['CHARSET'] = 'utf-8'; + $languages['vi']['ALIAS'] = 'vi_VN'; +} +*/ // Right to left languages - $languages['ar']['NAME'] = 'Arabic'; $languages['ar']['CHARSET'] = 'windows-1256'; $languages['ar']['DIR'] = 'rtl'; @@ -1997,39 +620,6 @@ elseif ($gettext_flags == 0) { } } -function charset_decode_utf8 ($string) { -/* - Every decoded character consists of n bytes. First byte is octal - 300-375, other bytes - always octals 200-277. - - \a\b characters are decoded to html code octdec(a-300)*64 + octdec(b-200) - \a\b\c characters are decoded to html code octdec(a-340)*64*64 + octdec(b-200)*64 + octdec(c-200) - - decoding cycle is unfinished. please test and report problems to tokul@users.sourceforge.net -*/ - global $default_charset, $languages, $sm_notAlias; - - if (strtolower($default_charset) == 'utf-8') - return $string; - if (strtolower($languages[$sm_notAlias]['CHARSET']) == 'utf-8') - return $string; - - /* Only do the slow convert if there are 8-bit characters */ - if (! ereg("[\200-\377]", $string)) - return $string; - - // decode three byte unicode characters - $string = preg_replace("/([\340-\357])([\200-\277])([\200-\277])/e", - "'&#'.((ord('\\1')-224)*4096+(ord('\\2')-128)*64+(ord('\\3')-128)).';'", - $string); - - // decode two byte unicode characters - $string = preg_replace("/([\300-\337])([\200-\277])/e", - "'&#'.((ord('\\1')-192)*64+(ord('\\2')-128)).';'", - $string); - - return $string; -} /* * Japanese charset extra function @@ -2189,4 +779,117 @@ function korean_charset_xtra() { return $ret; } -?> \ No newline at end of file +/* + * This function can be used to replace non-braking space symbols + * that are inserted in forms by some browsers instead of normal + * space symbol. 
/**
 * Replaces non-breaking space characters with ordinary spaces.
 *
 * Some browsers put non-breaking spaces into submitted form data instead
 * of the normal space symbol. Which byte sequence is looked for depends
 * on $charset:
 *   - iso-8859-*, windows-125* and iso-2022-jp: 0xA0
 *   - koi8*:                                    0x9A
 *   - utf-8:                                    0xC2 0xA0
 * For every other charset $string is returned unchanged.
 *
 * @param string $string  Text to clean up
 * @param string $charset Charset of $string (matched case-insensitively)
 * @return string Text with non-breaking spaces replaced by plain spaces
 */
function cleanup_nbsp($string,$charset) {
    $charset = strtolower($charset);

    // Reduce the number of case statements: fold charset families into a
    // single key. The charset name must START with the family prefix; a
    // substring search in the other direction would also accept fragments
    // such as 'iso', 'i' or an empty string.
    if (strncmp($charset, 'iso-8859-', 9) === 0) {
        $charset_family = 'iso-8859-x';
    } elseif (strncmp($charset, 'windows-125', 11) === 0) {
        $charset_family = 'cp125x';
    } elseif (strncmp($charset, 'koi8', 4) === 0) {
        $charset_family = 'koi8-x';
    } else {
        $charset_family = $charset;
    }

    // Where is the non-breaking space symbol in this charset?
    switch ($charset_family) {
        case 'iso-8859-x':
        case 'cp125x':
        case 'iso-2022-jp':
            $nbsp = "\xA0";
            break;
        case 'koi8-x':
            $nbsp = "\x9A";
            break;
        case 'utf-8':
            $nbsp = "\xC2\xA0";
            break;
        default:
            // Don't change the string if the charset is unmatched.
            return $string;
    }

    // Return a space instead of the non-breaking space.
    return str_replace($nbsp, ' ', $string);
}

/**
 * Tells whether $input_charset belongs to the same family of similar
 * charsets as the global $default_charset.
 *
 * Returns true when $default_charset is utf-8 (any input is accepted),
 * or when both charsets are different members of one of the families
 * listed in the function body. Returns false otherwise, including when
 * $input_charset equals a non-utf-8 $default_charset.
 *
 * Both charset names are compared case-insensitively; the global
 * $default_charset itself is not modified.
 *
 * @param string $input_charset Charset of the text to be converted
 * @return bool True if the charsets are considered similar
 */
function is_conversion_safe($input_charset) {
    global $default_charset;

    // Compare lower-cased copies so 'UTF-8' and 'utf-8' behave the same.
    $input_charset  = strtolower($input_charset);
    $output_charset = isset($default_charset) ? strtolower($default_charset) : '';

    // Is user's locale Unicode based?
    if ($output_charset === 'utf-8') {
        return true;
    }

    // A charset is never reported as "similar" to itself.
    if ($input_charset === $output_charset) {
        return false;
    }

    // Charsets that are similar, grouped into families.
    $similar_charsets = array(
        // Cyrillic
        array('windows-1251', 'iso-8859-5', 'koi8-r', 'koi8-u'),
        // Baltic
        array('windows-1257', 'iso-8859-4', 'iso-8859-13')
    );

    foreach ($similar_charsets as $family) {
        if (in_array($output_charset, $family, true)) {
            return in_array($input_charset, $family, true);
        }
    }

    return false;
}