X-Git-Url: https://vcs.fsf.org/?a=blobdiff_plain;f=functions%2Fi18n.php;h=10fe4e8e689d4792ceeb5710272379c3b10eea56;hb=dcc5c9134b5578c657f9f5c45e64c79eb46684c7;hp=791f0d99e3d1a5d624b140a58d391aff0cf4b610;hpb=5dd23dac87742f29bc491e3ae4dba699b8147fc0;p=squirrelmail.git diff --git a/functions/i18n.php b/functions/i18n.php index 791f0d99..10fe4e8e 100644 --- a/functions/i18n.php +++ b/functions/i18n.php @@ -19,23 +19,66 @@ require_once(SM_PATH . 'functions/global.php'); /* Decodes a string to the internal encoding from the given charset */ function charset_decode ($charset, $string) { - global $languages, $squirrelmail_language; + global $languages, $squirrelmail_language, $default_charset; + global $use_php_recode, $use_php_iconv, $agresive_decoding; if (isset($languages[$squirrelmail_language]['XTRA_CODE']) && function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) { $string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string); } + $charset = strtolower($charset); + + set_my_charset(); + + // Variables that allow to use functions without function_exist() calls + if (! isset($use_php_recode) || $use_php_recode=="" ) { + $use_php_recode=false; } + if (! isset($use_php_iconv) || $use_php_iconv=="" ) { + $use_php_iconv=false; } + + // Don't do conversion if charset is the same. + if ( $charset == strtolower($default_charset) ) + return htmlspecialchars($string); + + // catch iso-8859-8-i thing + if ( $charset == "iso-8859-8-i" ) + $charset = "iso-8859-8"; + + /* + * Recode converts html special characters automatically if you use + * 'charset..html' decoding. There is no documented way to put -d option + * into php recode function call. + */ + if ( $use_php_recode ) { + if ( $default_charset == "utf-8" ) { + // other charsets can be converted to utf-8 without loss. + // and output string is smaller + $string = recode_string($charset . "..utf-8",$string); + return htmlspecialchars($string); + } else { + $string = recode_string($charset . "..html",$string); + // recode does not convert single quote, htmlspecialchars does. + $string = str_replace("'", ''', $string); + return $string; + } + } + + // iconv functions does not have html target and can be used only with utf-8 + if ( $use_php_iconv && $default_charset=='utf-8') { + $string = iconv($charset,$default_charset,$string); + return htmlspecialchars($string); + } + + // If we don't use recode and iconv, we'll do it old way. + /* All HTML special characters are 7 bit and can be replaced first */ $string = htmlspecialchars ($string); - $charset = strtolower($charset); - - set_my_charset() ; - /* controls cpu and memory intensive decoding cycles */ - $agresive_decoding = false; + if (! isset($agresive_decoding) || $agresive_decoding=="" ) { + $agresive_decoding=false; } if (ereg('iso-8859-([[:digit:]]+)', $charset, $res)) { if ($res[1] == '1') { @@ -121,6 +164,39 @@ function charset_decode ($charset, $string) { } else if ($charset == 'windows-1258') { include_once(SM_PATH . 'functions/decode/cp1258.php'); $ret = charset_decode_cp1258 ($string); + } else if ($charset == 'x-mac-roman') { + include_once(SM_PATH . 'functions/decode/cp10000.php'); + $ret = charset_decode_cp10000 ($string); + } else if ($charset == 'x-mac-greek') { + include_once(SM_PATH . 'functions/decode/cp10006.php'); + $ret = charset_decode_cp10006 ($string); + } else if ($charset == 'x-mac-cyrillic') { + include_once(SM_PATH . 'functions/decode/cp10007.php'); + $ret = charset_decode_cp10007 ($string); + } else if ($charset == 'x-mac-ukrainian') { + include_once(SM_PATH . 'functions/decode/cp10017.php'); + $ret = charset_decode_cp10017 ($string); + } else if ($charset == 'x-mac-centraleurroman') { + include_once(SM_PATH . 'functions/decode/cp10029.php'); + $ret = charset_decode_cp10029 ($string); + } else if ($charset == 'x-mac-icelandic') { + include_once(SM_PATH . 'functions/decode/cp10079.php'); + $ret = charset_decode_cp10079 ($string); + } else if ($charset == 'x-mac-turkish') { + include_once(SM_PATH . 'functions/decode/cp10081.php'); + $ret = charset_decode_cp10081 ($string); + } else if ($charset == 'ibm855') { + include_once(SM_PATH . 'functions/decode/cp855.php'); + $ret = charset_decode_cp855 ($string); + } else if ($charset == 'ibm866') { + include_once(SM_PATH . 'functions/decode/cp866.php'); + $ret = charset_decode_cp866 ($string); + } else if ($charset == 'iso-ir-111') { + include_once(SM_PATH . 'functions/decode/iso-ir-111.php'); + $ret = charset_decode_iso_ir_111 ($string); + } else if ($charset == 'tis-620') { + include_once(SM_PATH . 'functions/decode/tis620.php'); + $ret = charset_decode_tis620 ($string); } else if ($charset == 'big5' and $agresive_decoding ) { include_once(SM_PATH . 'functions/decode/big5.php'); $ret = charset_decode_big5 ($string); @@ -179,7 +255,7 @@ function charset_decode_ns_4551_1 ($string) { * if $do_search is true, then scan the browser information * for a possible language that we know */ -function set_up_language($sm_language, $do_search = false) { +function set_up_language($sm_language, $do_search = false, $default = false) { static $SetupAlready = 0; global $use_gettext, $languages, @@ -197,11 +273,20 @@ function set_up_language($sm_language, $do_search = false) { $sm_language = substr($accept_lang, 0, 2); } - if (!$sm_language && isset($squirrelmail_default_language)) { + if ((!$sm_language||$default) && isset($squirrelmail_default_language)) { $squirrelmail_language = $squirrelmail_default_language; $sm_language = $squirrelmail_default_language; } $sm_notAlias = $sm_language; + + // Catching removed translation + // System reverts to English translation if user prefs contain translation + // that is not available in $languages array (admin removed directory + // with that translation) + if (!isset($languages[$sm_notAlias])) { + $sm_notAlias="en_US"; + } + while (isset($languages[$sm_notAlias]['ALIAS'])) { $sm_notAlias = $languages[$sm_notAlias]['ALIAS']; } @@ -215,14 +300,19 @@ function set_up_language($sm_language, $do_search = false) { if (function_exists('bind_textdomain_codeset')) { bind_textdomain_codeset ("squirrelmail", $languages[$sm_notAlias]['CHARSET'] ); } + if (isset($languages[$sm_notAlias]['LOCALE'])){ + $longlocale=$languages[$sm_notAlias]['LOCALE']; + } else { + $longlocale=$sm_notAlias; + } if ( !ini_get('safe_mode') && - getenv( 'LC_ALL' ) != $sm_notAlias ) { - putenv( "LC_ALL=$sm_notAlias" ); - putenv( "LANG=$sm_notAlias" ); - putenv( "LANGUAGE=$sm_notAlias" ); + getenv( 'LC_ALL' ) != $longlocale ) { + putenv( "LC_ALL=$longlocale" ); + putenv( "LANG=$longlocale" ); + putenv( "LANGUAGE=$longlocale" ); } - setlocale(LC_ALL, $sm_notAlias); - $squirrelmail_language = $sm_notAlias; + setlocale(LC_ALL, $longlocale); + $squirrelmail_language = $sm_notAlias; if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) { header ('Content-Type: text/html; charset=EUC-JP'); if (!function_exists('mb_internal_encoding')) { @@ -256,6 +346,10 @@ function set_my_charset(){ if (!$my_language) { $my_language = $squirrelmail_default_language ; } + // Catch removed translation + if (!isset($languages[$my_language])) { + $my_language="en_US"; + } while (isset($languages[$my_language]['ALIAS'])) { $my_language = $languages[$my_language]['ALIAS']; } @@ -274,39 +368,49 @@ if (! isset($squirrelmail_language)) { } /* This array specifies the available languages. */ - -// The glibc locale is ca_ES. +$languages['bg_BG']['NAME'] = 'Bulgarian'; +$languages['bg_BG']['ALTNAME'] = 'Български'; +$languages['bg_BG']['CHARSET'] = 'windows-1251'; +$languages['bg']['ALIAS'] = 'bg_BG'; $languages['ca_ES']['NAME'] = 'Catalan'; $languages['ca_ES']['CHARSET'] = 'iso-8859-1'; $languages['ca']['ALIAS'] = 'ca_ES'; $languages['cs_CZ']['NAME'] = 'Czech'; +$languages['cs_CZ']['ALTNAME'] = 'Čeština'; $languages['cs_CZ']['CHARSET'] = 'iso-8859-2'; $languages['cs']['ALIAS'] = 'cs_CZ'; -// Danish locale is da_DK. +$languages['cy_GB']['NAME'] = 'Welsh'; +$languages['cy_GB']['ALTNAME'] = 'Cymraeg'; +$languages['cy_GB']['CHARSET'] = 'iso-8859-1'; +$languages['cy']['ALIAS'] = 'cy_GB'; +// Danish locale is da_DK. $languages['da_DK']['NAME'] = 'Danish'; +$languages['da_DK']['ALTNAME'] = 'Dansk'; $languages['da_DK']['CHARSET'] = 'iso-8859-1'; $languages['da']['ALIAS'] = 'da_DK'; -$languages['de_DE']['NAME'] = 'Deutsch'; +$languages['de_DE']['NAME'] = 'German'; +$languages['de_DE']['ALTNAME'] = 'Deutsch'; $languages['de_DE']['CHARSET'] = 'iso-8859-1'; $languages['de']['ALIAS'] = 'de_DE'; -// There is no en_EN! There is en_US, en_BR, en_AU, and so forth, -// but who cares about !US, right? Right? :) - $languages['el_GR']['NAME'] = 'Greek'; +$languages['el_GR']['ALTNAME'] = 'Ελληνικά'; $languages['el_GR']['CHARSET'] = 'iso-8859-7'; $languages['el']['ALIAS'] = 'el_GR'; +// There is no en_EN! There is en_US, en_BR, en_AU, and so forth, +// but who cares about !US, right? Right? :) $languages['en_US']['NAME'] = 'English'; $languages['en_US']['CHARSET'] = 'iso-8859-1'; $languages['en']['ALIAS'] = 'en_US'; $languages['es_ES']['NAME'] = 'Spanish'; +$languages['es_ES']['ALTNAME'] = 'Español'; $languages['es_ES']['CHARSET'] = 'iso-8859-1'; $languages['es']['ALIAS'] = 'es_ES'; @@ -319,10 +423,12 @@ $languages['fo_FO']['CHARSET'] = 'iso-8859-1'; $languages['fo']['ALIAS'] = 'fo_FO'; $languages['fi_FI']['NAME'] = 'Finnish'; +$languages['fi_FI']['ALTNAME'] = 'Suomi'; $languages['fi_FI']['CHARSET'] = 'iso-8859-1'; $languages['fi']['ALIAS'] = 'fi_FI'; $languages['fr_FR']['NAME'] = 'French'; +$languages['fr_FR']['ALTNAME'] = 'Français'; $languages['fr_FR']['CHARSET'] = 'iso-8859-1'; $languages['fr']['ALIAS'] = 'fr_FR'; @@ -331,14 +437,17 @@ $languages['hr_HR']['CHARSET'] = 'iso-8859-2'; $languages['hr']['ALIAS'] = 'hr_HR'; $languages['hu_HU']['NAME'] = 'Hungarian'; +$languages['hu_HU']['ALTNAME'] = 'Magyar'; $languages['hu_HU']['CHARSET'] = 'iso-8859-2'; $languages['hu']['ALIAS'] = 'hu_HU'; -$languages['id_ID']['NAME'] = 'Bahasa Indonesia'; +$languages['id_ID']['NAME'] = 'Indonesian'; +$languages['id_ID']['ALTNAME'] = 'Bahasa Indonesia'; $languages['id_ID']['CHARSET'] = 'iso-8859-1'; $languages['id']['ALIAS'] = 'id_ID'; $languages['is_IS']['NAME'] = 'Icelandic'; +$languages['is_IS']['ALTNAME'] = 'Íslenska'; $languages['is_IS']['CHARSET'] = 'iso-8859-1'; $languages['is']['ALIAS'] = 'is_IS'; @@ -347,6 +456,7 @@ $languages['it_IT']['CHARSET'] = 'iso-8859-1'; $languages['it']['ALIAS'] = 'it_IT'; $languages['ja_JP']['NAME'] = 'Japanese'; +$languages['ja_JP']['ALTNAME'] = '日本語'; $languages['ja_JP']['CHARSET'] = 'iso-2022-jp'; $languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra'; $languages['ja']['ALIAS'] = 'ja_JP'; @@ -356,38 +466,78 @@ $languages['ko_KR']['CHARSET'] = 'euc-KR'; $languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra'; $languages['ko']['ALIAS'] = 'ko_KR'; +$languages['lt_LT']['NAME'] = 'Lithuanian'; +$languages['lt_LT']['ALTNAME'] = 'Lietuvių'; +$languages['lt_LT']['CHARSET'] = 'utf-8'; +$languages['lt_LT']['LOCALE'] = 'lt_LT.UTF-8'; +$languages['lt']['ALIAS'] = 'lt_LT'; + $languages['nl_NL']['NAME'] = 'Dutch'; +$languages['nl_NL']['ALTNAME'] = 'Nederlands'; $languages['nl_NL']['CHARSET'] = 'iso-8859-1'; $languages['nl']['ALIAS'] = 'nl_NL'; +$languages['ms_MY']['NAME'] = 'Malay'; +$languages['ms_MY']['ALTNAME'] = 'Bahasa Melayu'; +$languages['ms_MY']['CHARSET'] = 'iso-8859-1'; +$languages['my']['ALIAS'] = 'ms_MY'; + $languages['no_NO']['NAME'] = 'Norwegian (Bokmål)'; +$languages['no_NO']['ALTNAME'] = 'Norsk (Bokmål)'; $languages['no_NO']['CHARSET'] = 'iso-8859-1'; $languages['no']['ALIAS'] = 'no_NO'; + $languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)'; +$languages['nn_NO']['ALTNAME'] = 'Norsk (Nynorsk)'; $languages['nn_NO']['CHARSET'] = 'iso-8859-1'; $languages['pl_PL']['NAME'] = 'Polish'; +$languages['pl_PL']['ALTNAME'] = 'Polski'; $languages['pl_PL']['CHARSET'] = 'iso-8859-2'; $languages['pl']['ALIAS'] = 'pl_PL'; $languages['pt_PT']['NAME'] = 'Portuguese (Portugal)'; $languages['pt_PT']['CHARSET'] = 'iso-8859-1'; +$languages['pt']['ALIAS'] = 'pt_PT'; + $languages['pt_BR']['NAME'] = 'Portuguese (Brazil)'; +$languages['pt_BR']['ALTNAME'] = 'Português do Brasil'; $languages['pt_BR']['CHARSET'] = 'iso-8859-1'; -$languages['pt']['ALIAS'] = 'pt_PT'; + +$languages['ro_RO']['NAME'] = 'Romanian'; +$languages['ro_RO']['ALTNAME'] = 'Română'; +$languages['ro_RO']['CHARSET'] = 'iso-8859-2'; +$languages['ro']['ALIAS'] = 'ro_RO'; $languages['ru_RU']['NAME'] = 'Russian'; -$languages['ru_RU']['CHARSET'] = 'koi8-r'; +$languages['ru_RU']['ALTNAME'] = 'Русский'; +$languages['ru_RU']['CHARSET'] = 'utf-8'; +$languages['ru_RU']['LOCALE'] = 'ru_RU.UTF-8'; $languages['ru']['ALIAS'] = 'ru_RU'; +$languages['sk_SK']['NAME'] = 'Slovak'; +$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; +$languages['sk']['ALIAS'] = 'sk_SK'; + +$languages['sl_SI']['NAME'] = 'Slovenian'; +$languages['sl_SI']['ALTNAME'] = 'Slovenščina'; +$languages['sl_SI']['CHARSET'] = 'iso-8859-2'; +$languages['sl']['ALIAS'] = 'sl_SI'; + $languages['sr_YU']['NAME'] = 'Serbian'; +$languages['sr_YU']['ALTNAME'] = 'Srpski'; $languages['sr_YU']['CHARSET'] = 'iso-8859-2'; $languages['sr']['ALIAS'] = 'sr_YU'; $languages['sv_SE']['NAME'] = 'Swedish'; +$languages['sv_SE']['ALTNAME'] = 'Svenska'; $languages['sv_SE']['CHARSET'] = 'iso-8859-1'; $languages['sv']['ALIAS'] = 'sv_SE'; +$languages['th_TH']['NAME'] = 'Thai'; +$languages['th_TH']['CHARSET'] = 'tis-620'; +$languages['th']['ALIAS'] = 'th_TH'; + $languages['tr_TR']['NAME'] = 'Turkish'; $languages['tr_TR']['CHARSET'] = 'iso-8859-9'; $languages['tr']['ALIAS'] = 'tr_TR'; @@ -400,44 +550,20 @@ $languages['zh_CN']['NAME'] = 'Chinese Simp'; $languages['zh_CN']['CHARSET'] = 'gb2312'; $languages['cn']['ALIAS'] = 'zh_CN'; -$languages['sk_SK']['NAME'] = 'Slovak'; -$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; -$languages['sk']['ALIAS'] = 'sk_SK'; - -$languages['ro_RO']['NAME'] = 'Romanian'; -$languages['ro_RO']['CHARSET'] = 'iso-8859-2'; -$languages['ro']['ALIAS'] = 'ro_RO'; - -$languages['th_TH']['NAME'] = 'Thai'; -$languages['th_TH']['CHARSET'] = 'tis-620'; -$languages['th']['ALIAS'] = 'th_TH'; - -$languages['lt_LT']['NAME'] = 'Lithuanian'; -$languages['lt_LT']['CHARSET'] = 'windows-1257'; -$languages['lt']['ALIAS'] = 'lt_LT'; - -$languages['sl_SI']['NAME'] = 'Slovenian'; -$languages['sl_SI']['CHARSET'] = 'iso-8859-2'; -$languages['sl']['ALIAS'] = 'sl_SI'; - -$languages['bg_BG']['NAME'] = 'Bulgarian'; -$languages['bg_BG']['CHARSET'] = 'windows-1251'; -$languages['bg']['ALIAS'] = 'bg_BG'; - +/* $languages['uk_UA']['NAME'] = 'Ukrainian'; $languages['uk_UA']['CHARSET'] = 'koi8-u'; $languages['uk']['ALIAS'] = 'uk_UA'; - -$languages['cy_GB']['NAME'] = 'Welsh'; -$languages['cy_GB']['CHARSET'] = 'iso-8859-1'; -$languages['cy']['ALIAS'] = 'cy_GB'; - -$languages['vi_VN']['NAME'] = 'Vietnamese'; -$languages['vi_VN']['CHARSET'] = 'utf-8'; -$languages['vi']['ALIAS'] = 'vi_VN'; +*/ +/* +if ( file_exists( SM_PATH . 'locale/vi_VN') ) { + $languages['vi_VN']['NAME'] = 'Vietnamese'; + $languages['vi_VN']['CHARSET'] = 'utf-8'; + $languages['vi']['ALIAS'] = 'vi_VN'; +} +*/ // Right to left languages - $languages['ar']['NAME'] = 'Arabic'; $languages['ar']['CHARSET'] = 'windows-1256'; $languages['ar']['DIR'] = 'rtl'; @@ -645,4 +771,117 @@ function korean_charset_xtra() { return $ret; } -?> \ No newline at end of file +/* + * This function can be used to replace non-braking space symbols + * that are inserted in forms by some browsers instead of normal + * space symbol. + */ +function cleanup_nbsp($string,$charset) { + + // reduce number of case statements + if (stristr('iso-8859-',substr($charset,0,9))){ + $output_charset="iso-8859-x"; + } + if (stristr('windows-125',substr($charset,0,11))){ + $output_charset="cp125x"; + } + if (stristr('koi8',substr($charset,0,4))){ + $output_charset="koi8-x"; + } + if (! isset($output_charset)){ + $output_charset=strtolower($charset); + } + +// where is non-braking space symbol +switch($output_charset): + case "iso-8859-x": + case "cp125x": + case "iso-2022-jp": + $nbsp="\xA0"; + break; + case "koi8-x": + $nbsp="\x9A"; + break; + case "utf-8": + $nbsp="\xC2\xA0"; + break; + default: + // don't change string if charset is unmatched + return $string; +endswitch; + +// return space instead of non-braking space. + return str_replace($nbsp,' ',$string); +} + +function is_conversion_safe($input_charset) { + global $languages, $sm_notAlias, $default_charset; + + // convert to lower case + $input_charset = strtolower($input_charset); + + // Is user's locale Unicode based ? + if ( $default_charset == "utf-8" ) { + return true; + } + + // Charsets that are similar +switch ($default_charset): +case "windows-1251": + if ( $input_charset == "iso-8859-5" || + $input_charset == "koi8-r" || + $input_charset == "koi8-u" ) { + return true; + } else { + return false; + } +case "windows-1257": + if ( $input_charset == "iso-8859-13" || + $input_charset == "iso-8859-4" ) { + return true; + } else { + return false; + } +case "iso-8859-4": + if ( $input_charset == "iso-8859-13" || + $input_charset == "windows-1257" ) { + return true; + } else { + return false; + } +case "iso-8859-5": + if ( $input_charset == "windows-1251" || + $input_charset == "koi8-r" || + $input_charset == "koi8-u" ) { + return true; + } else { + return false; + } +case "iso-8859-13": + if ( $input_charset == "iso-8859-4" || + $input_charset == "windows-1257" ) { + return true; + } else { + return false; + } +case "koi8-r": + if ( $input_charset == "windows-1251" || + $input_charset == "iso-8859-5" || + $input_charset == "koi8-u" ) { + return true; + } else { + return false; + } +case "koi8-u": + if ( $input_charset == "windows-1251" || + $input_charset == "iso-8859-5" || + $input_charset == "koi8-r" ) { + return true; + } else { + return false; + } +default: + return false; +endswitch; +} +?>