/* Decodes a string to the internal encoding from the given charset */
function charset_decode ($charset, $string) {
- global $languages, $squirrelmail_language;
+ global $languages, $squirrelmail_language, $default_charset;
+ global $use_php_recode, $use_php_iconv, $agresive_decoding;
if (isset($languages[$squirrelmail_language]['XTRA_CODE']) &&
function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) {
$string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string);
}
+ $charset = strtolower($charset);
+
+ set_my_charset();
+
+ // Variables that allow to use functions without function_exist() calls
+ if (! isset($use_php_recode) || $use_php_recode=="" ) {
+ $use_php_recode=false; }
+ if (! isset($use_php_iconv) || $use_php_iconv=="" ) {
+ $use_php_iconv=false; }
+
+ // Don't do conversion if charset is the same.
+ if ( $charset == strtolower($default_charset) )
+ return htmlspecialchars($string);
+
+ // catch iso-8859-8-i thing
+ if ( $charset == "iso-8859-8-i" )
+ $charset = "iso-8859-8";
+
+ /*
+ * Recode converts html special characters automatically if you use
+ * 'charset..html' decoding. There is no documented way to put -d option
+ * into php recode function call.
+ */
+ if ( $use_php_recode ) {
+ if ( $default_charset == "utf-8" ) {
+ // other charsets can be converted to utf-8 without loss.
+ // and output string is smaller
+ $string = recode_string($charset . "..utf-8",$string);
+ return htmlspecialchars($string);
+ } else {
+ $string = recode_string($charset . "..html",$string);
+ // recode does not convert single quote, htmlspecialchars does.
+ $string = str_replace("'", ''', $string);
+ return $string;
+ }
+ }
+
+ // iconv functions does not have html target and can be used only with utf-8
+ if ( $use_php_iconv && $default_charset=='utf-8') {
+ $string = iconv($charset,$default_charset,$string);
+ return htmlspecialchars($string);
+ }
+
+ // If we don't use recode and iconv, we'll do it old way.
+
/* All HTML special characters are 7 bit and can be replaced first */
$string = htmlspecialchars ($string);
- $charset = strtolower($charset);
-
- set_my_charset() ;
-
/* controls cpu and memory intensive decoding cycles */
- $agresive_decoding = false;
+ if (! isset($agresive_decoding) || $agresive_decoding=="" ) {
+ $agresive_decoding=false; }
if (ereg('iso-8859-([[:digit:]]+)', $charset, $res)) {
if ($res[1] == '1') {
} else if ($charset == 'windows-1258') {
include_once(SM_PATH . 'functions/decode/cp1258.php');
$ret = charset_decode_cp1258 ($string);
+ } else if ($charset == 'x-mac-roman') {
+ include_once(SM_PATH . 'functions/decode/cp10000.php');
+ $ret = charset_decode_cp10000 ($string);
+ } else if ($charset == 'x-mac-greek') {
+ include_once(SM_PATH . 'functions/decode/cp10006.php');
+ $ret = charset_decode_cp10006 ($string);
+ } else if ($charset == 'x-mac-cyrillic') {
+ include_once(SM_PATH . 'functions/decode/cp10007.php');
+ $ret = charset_decode_cp10007 ($string);
+ } else if ($charset == 'x-mac-ukrainian') {
+ include_once(SM_PATH . 'functions/decode/cp10017.php');
+ $ret = charset_decode_cp10017 ($string);
+ } else if ($charset == 'x-mac-centraleurroman') {
+ include_once(SM_PATH . 'functions/decode/cp10029.php');
+ $ret = charset_decode_cp10029 ($string);
+ } else if ($charset == 'x-mac-icelandic') {
+ include_once(SM_PATH . 'functions/decode/cp10079.php');
+ $ret = charset_decode_cp10079 ($string);
+ } else if ($charset == 'x-mac-turkish') {
+ include_once(SM_PATH . 'functions/decode/cp10081.php');
+ $ret = charset_decode_cp10081 ($string);
+ } else if ($charset == 'ibm855') {
+ include_once(SM_PATH . 'functions/decode/cp855.php');
+ $ret = charset_decode_cp855 ($string);
+ } else if ($charset == 'ibm866') {
+ include_once(SM_PATH . 'functions/decode/cp866.php');
+ $ret = charset_decode_cp866 ($string);
+ } else if ($charset == 'iso-ir-111') {
+ include_once(SM_PATH . 'functions/decode/iso-ir-111.php');
+ $ret = charset_decode_iso_ir_111 ($string);
+ } else if ($charset == 'tis-620') {
+ include_once(SM_PATH . 'functions/decode/tis620.php');
+ $ret = charset_decode_tis620 ($string);
} else if ($charset == 'big5' and $agresive_decoding ) {
include_once(SM_PATH . 'functions/decode/big5.php');
$ret = charset_decode_big5 ($string);
} else if ($charset == 'gb2312' and $agresive_decoding ) {
include_once(SM_PATH . 'functions/decode/gb2312.php');
$ret = charset_decode_gb2312 ($string);
- } else if ($charset == 'utf-8') {
+ } else if ($charset == 'utf-8' && $squirrelmail_language != 'ja_JP') {
include_once(SM_PATH . 'functions/decode/utf-8.php');
$ret = charset_decode_utf8 ($string);
} else {
$sm_language = $squirrelmail_default_language;
}
$sm_notAlias = $sm_language;
+
+ // Catching removed translation
+ // System reverts to English translation if user prefs contain translation
+ // that is not available in $languages array (admin removed directory
+ // with that translation)
+ if (!isset($languages[$sm_notAlias])) {
+ $sm_notAlias="en_US";
+ }
+
while (isset($languages[$sm_notAlias]['ALIAS'])) {
$sm_notAlias = $languages[$sm_notAlias]['ALIAS'];
}
if (!$my_language) {
$my_language = $squirrelmail_default_language ;
}
+ // Catch removed translation
+ if (!isset($languages[$my_language])) {
+ $my_language="en_US";
+ }
while (isset($languages[$my_language]['ALIAS'])) {
$my_language = $languages[$my_language]['ALIAS'];
}
}
/* This array specifies the available languages. */
-
-// The glibc locale is ca_ES.
+$languages['bg_BG']['NAME'] = 'Bulgarian';
+$languages['bg_BG']['ALTNAME'] = 'Български';
+$languages['bg_BG']['CHARSET'] = 'windows-1251';
+$languages['bg']['ALIAS'] = 'bg_BG';
$languages['ca_ES']['NAME'] = 'Catalan';
$languages['ca_ES']['CHARSET'] = 'iso-8859-1';
$languages['ca']['ALIAS'] = 'ca_ES';
$languages['cs_CZ']['NAME'] = 'Czech';
+$languages['cs_CZ']['ALTNAME'] = 'Čeština';
$languages['cs_CZ']['CHARSET'] = 'iso-8859-2';
$languages['cs']['ALIAS'] = 'cs_CZ';
-// Danish locale is da_DK.
+$languages['cy_GB']['NAME'] = 'Welsh';
+$languages['cy_GB']['ALTNAME'] = 'Cymraeg';
+$languages['cy_GB']['CHARSET'] = 'iso-8859-1';
+$languages['cy']['ALIAS'] = 'cy_GB';
+// Danish locale is da_DK.
$languages['da_DK']['NAME'] = 'Danish';
+$languages['da_DK']['ALTNAME'] = 'Dansk';
$languages['da_DK']['CHARSET'] = 'iso-8859-1';
$languages['da']['ALIAS'] = 'da_DK';
-$languages['de_DE']['NAME'] = 'Deutsch';
+$languages['de_DE']['NAME'] = 'German';
+$languages['de_DE']['ALTNAME'] = 'Deutsch';
$languages['de_DE']['CHARSET'] = 'iso-8859-1';
$languages['de']['ALIAS'] = 'de_DE';
-// There is no en_EN! There is en_US, en_BR, en_AU, and so forth,
-// but who cares about !US, right? Right? :)
-
$languages['el_GR']['NAME'] = 'Greek';
+$languages['el_GR']['ALTNAME'] = 'Ελληνικά';
$languages['el_GR']['CHARSET'] = 'iso-8859-7';
$languages['el']['ALIAS'] = 'el_GR';
+// There is no en_EN! There is en_US, en_BR, en_AU, and so forth,
+// but who cares about !US, right? Right? :)
$languages['en_US']['NAME'] = 'English';
$languages['en_US']['CHARSET'] = 'iso-8859-1';
$languages['en']['ALIAS'] = 'en_US';
$languages['es_ES']['NAME'] = 'Spanish';
+$languages['es_ES']['ALTNAME'] = 'Español';
$languages['es_ES']['CHARSET'] = 'iso-8859-1';
$languages['es']['ALIAS'] = 'es_ES';
$languages['fo']['ALIAS'] = 'fo_FO';
$languages['fi_FI']['NAME'] = 'Finnish';
+$languages['fi_FI']['ALTNAME'] = 'Suomi';
$languages['fi_FI']['CHARSET'] = 'iso-8859-1';
$languages['fi']['ALIAS'] = 'fi_FI';
$languages['fr_FR']['NAME'] = 'French';
+$languages['fr_FR']['ALTNAME'] = 'Français';
$languages['fr_FR']['CHARSET'] = 'iso-8859-1';
$languages['fr']['ALIAS'] = 'fr_FR';
$languages['hr']['ALIAS'] = 'hr_HR';
$languages['hu_HU']['NAME'] = 'Hungarian';
+$languages['hu_HU']['ALTNAME'] = 'Magyar';
$languages['hu_HU']['CHARSET'] = 'iso-8859-2';
$languages['hu']['ALIAS'] = 'hu_HU';
-$languages['id_ID']['NAME'] = 'Bahasa Indonesia';
+$languages['id_ID']['NAME'] = 'Indonesian';
+$languages['id_ID']['ALTNAME'] = 'Bahasa Indonesia';
$languages['id_ID']['CHARSET'] = 'iso-8859-1';
$languages['id']['ALIAS'] = 'id_ID';
$languages['is_IS']['NAME'] = 'Icelandic';
+$languages['is_IS']['ALTNAME'] = 'Íslenska';
$languages['is_IS']['CHARSET'] = 'iso-8859-1';
$languages['is']['ALIAS'] = 'is_IS';
$languages['it']['ALIAS'] = 'it_IT';
$languages['ja_JP']['NAME'] = 'Japanese';
+$languages['ja_JP']['ALTNAME'] = '日本語';
$languages['ja_JP']['CHARSET'] = 'iso-2022-jp';
$languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra';
$languages['ja']['ALIAS'] = 'ja_JP';
$languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra';
$languages['ko']['ALIAS'] = 'ko_KR';
+$languages['lt_LT']['NAME'] = 'Lithuanian';
+$languages['lt_LT']['ALTNAME'] = 'Lietuvių';
+$languages['lt_LT']['CHARSET'] = 'utf-8';
+$languages['lt_LT']['LOCALE'] = 'lt_LT.UTF-8';
+$languages['lt']['ALIAS'] = 'lt_LT';
+
$languages['nl_NL']['NAME'] = 'Dutch';
+$languages['nl_NL']['ALTNAME'] = 'Nederlands';
$languages['nl_NL']['CHARSET'] = 'iso-8859-1';
$languages['nl']['ALIAS'] = 'nl_NL';
+$languages['ms_MY']['NAME'] = 'Malay';
+$languages['ms_MY']['ALTNAME'] = 'Bahasa Melayu';
+$languages['ms_MY']['CHARSET'] = 'iso-8859-1';
+$languages['my']['ALIAS'] = 'ms_MY';
+
$languages['no_NO']['NAME'] = 'Norwegian (Bokmål)';
+$languages['no_NO']['ALTNAME'] = 'Norsk (Bokmål)';
$languages['no_NO']['CHARSET'] = 'iso-8859-1';
$languages['no']['ALIAS'] = 'no_NO';
+
$languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)';
+$languages['nn_NO']['ALTNAME'] = 'Norsk (Nynorsk)';
$languages['nn_NO']['CHARSET'] = 'iso-8859-1';
$languages['pl_PL']['NAME'] = 'Polish';
+$languages['pl_PL']['ALTNAME'] = 'Polski';
$languages['pl_PL']['CHARSET'] = 'iso-8859-2';
$languages['pl']['ALIAS'] = 'pl_PL';
$languages['pt_PT']['NAME'] = 'Portuguese (Portugal)';
$languages['pt_PT']['CHARSET'] = 'iso-8859-1';
+$languages['pt']['ALIAS'] = 'pt_PT';
+
$languages['pt_BR']['NAME'] = 'Portuguese (Brazil)';
+$languages['pt_BR']['ALTNAME'] = 'Português do Brasil';
$languages['pt_BR']['CHARSET'] = 'iso-8859-1';
-$languages['pt']['ALIAS'] = 'pt_PT';
+
+$languages['ro_RO']['NAME'] = 'Romanian';
+$languages['ro_RO']['ALTNAME'] = 'Română';
+$languages['ro_RO']['CHARSET'] = 'iso-8859-2';
+$languages['ro']['ALIAS'] = 'ro_RO';
$languages['ru_RU']['NAME'] = 'Russian';
-$languages['ru_RU']['CHARSET'] = 'koi8-r';
-$languages['ru_RU']['LOCALE'] = 'ru_RU.KOI8-R';
+$languages['ru_RU']['ALTNAME'] = 'Русский';
+$languages['ru_RU']['CHARSET'] = 'utf-8';
+$languages['ru_RU']['LOCALE'] = 'ru_RU.UTF-8';
$languages['ru']['ALIAS'] = 'ru_RU';
+$languages['sk_SK']['NAME'] = 'Slovak';
+$languages['sk_SK']['CHARSET'] = 'iso-8859-2';
+$languages['sk']['ALIAS'] = 'sk_SK';
+
+$languages['sl_SI']['NAME'] = 'Slovenian';
+$languages['sl_SI']['ALTNAME'] = 'Slovenščina';
+$languages['sl_SI']['CHARSET'] = 'iso-8859-2';
+$languages['sl']['ALIAS'] = 'sl_SI';
+
$languages['sr_YU']['NAME'] = 'Serbian';
+$languages['sr_YU']['ALTNAME'] = 'Srpski';
$languages['sr_YU']['CHARSET'] = 'iso-8859-2';
$languages['sr']['ALIAS'] = 'sr_YU';
$languages['sv_SE']['NAME'] = 'Swedish';
+$languages['sv_SE']['ALTNAME'] = 'Svenska';
$languages['sv_SE']['CHARSET'] = 'iso-8859-1';
$languages['sv']['ALIAS'] = 'sv_SE';
+$languages['th_TH']['NAME'] = 'Thai';
+$languages['th_TH']['CHARSET'] = 'tis-620';
+$languages['th']['ALIAS'] = 'th_TH';
+
$languages['tr_TR']['NAME'] = 'Turkish';
$languages['tr_TR']['CHARSET'] = 'iso-8859-9';
$languages['tr']['ALIAS'] = 'tr_TR';
$languages['zh_CN']['CHARSET'] = 'gb2312';
$languages['cn']['ALIAS'] = 'zh_CN';
-$languages['sk_SK']['NAME'] = 'Slovak';
-$languages['sk_SK']['CHARSET'] = 'iso-8859-2';
-$languages['sk']['ALIAS'] = 'sk_SK';
-
-$languages['ro_RO']['NAME'] = 'Romanian';
-$languages['ro_RO']['CHARSET'] = 'iso-8859-2';
-$languages['ro']['ALIAS'] = 'ro_RO';
-
-$languages['th_TH']['NAME'] = 'Thai';
-$languages['th_TH']['CHARSET'] = 'tis-620';
-$languages['th']['ALIAS'] = 'th_TH';
-
-$languages['lt_LT']['NAME'] = 'Lithuanian';
-$languages['lt_LT']['CHARSET'] = 'windows-1257';
-$languages['lt_LT']['LOCALE'] = 'lt_LT.CP1257';
-$languages['lt']['ALIAS'] = 'lt_LT';
-
-$languages['sl_SI']['NAME'] = 'Slovenian';
-$languages['sl_SI']['CHARSET'] = 'iso-8859-2';
-$languages['sl']['ALIAS'] = 'sl_SI';
-
-$languages['bg_BG']['NAME'] = 'Bulgarian';
-$languages['bg_BG']['CHARSET'] = 'windows-1251';
-$languages['bg']['ALIAS'] = 'bg_BG';
-
+/*
$languages['uk_UA']['NAME'] = 'Ukrainian';
$languages['uk_UA']['CHARSET'] = 'koi8-u';
$languages['uk']['ALIAS'] = 'uk_UA';
-
-$languages['cy_GB']['NAME'] = 'Welsh';
-$languages['cy_GB']['CHARSET'] = 'iso-8859-1';
-$languages['cy']['ALIAS'] = 'cy_GB';
-
-$languages['vi_VN']['NAME'] = 'Vietnamese';
-$languages['vi_VN']['CHARSET'] = 'utf-8';
-$languages['vi']['ALIAS'] = 'vi_VN';
+*/
+/*
+if ( file_exists( SM_PATH . 'locale/vi_VN') ) {
+ $languages['vi_VN']['NAME'] = 'Vietnamese';
+ $languages['vi_VN']['CHARSET'] = 'utf-8';
+ $languages['vi']['ALIAS'] = 'vi_VN';
+}
+*/
// Right to left languages
-
$languages['ar']['NAME'] = 'Arabic';
$languages['ar']['CHARSET'] = 'windows-1256';
$languages['ar']['DIR'] = 'rtl';
return $ret;
}
-?>
\ No newline at end of file
+/*
+ * This function can be used to replace non-braking space symbols
+ * that are inserted in forms by some browsers instead of normal
+ * space symbol.
+ */
+function cleanup_nbsp($string,$charset) {
+
+ // reduce number of case statements
+ if (stristr('iso-8859-',substr($charset,0,9))){
+ $output_charset="iso-8859-x";
+ }
+ if (stristr('windows-125',substr($charset,0,11))){
+ $output_charset="cp125x";
+ }
+ if (stristr('koi8',substr($charset,0,4))){
+ $output_charset="koi8-x";
+ }
+ if (! isset($output_charset)){
+ $output_charset=strtolower($charset);
+ }
+
+// where is non-braking space symbol
+switch($output_charset):
+ case "iso-8859-x":
+ case "cp125x":
+ case "iso-2022-jp":
+ $nbsp="\xA0";
+ break;
+ case "koi8-x":
+ $nbsp="\x9A";
+ break;
+ case "utf-8":
+ $nbsp="\xC2\xA0";
+ break;
+ default:
+ // don't change string if charset is unmatched
+ return $string;
+endswitch;
+
+// return space instead of non-braking space.
+ return str_replace($nbsp,' ',$string);
+}
+
+function is_conversion_safe($input_charset) {
+ global $languages, $sm_notAlias, $default_charset;
+
+ // convert to lower case
+ $input_charset = strtolower($input_charset);
+
+ // Is user's locale Unicode based ?
+ if ( $default_charset == "utf-8" ) {
+ return true;
+ }
+
+ // Charsets that are similar
+switch ($default_charset):
+case "windows-1251":
+ if ( $input_charset == "iso-8859-5" ||
+ $input_charset == "koi8-r" ||
+ $input_charset == "koi8-u" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "windows-1257":
+ if ( $input_charset == "iso-8859-13" ||
+ $input_charset == "iso-8859-4" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "iso-8859-4":
+ if ( $input_charset == "iso-8859-13" ||
+ $input_charset == "windows-1257" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "iso-8859-5":
+ if ( $input_charset == "windows-1251" ||
+ $input_charset == "koi8-r" ||
+ $input_charset == "koi8-u" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "iso-8859-13":
+ if ( $input_charset == "iso-8859-4" ||
+ $input_charset == "windows-1257" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "koi8-r":
+ if ( $input_charset == "windows-1251" ||
+ $input_charset == "iso-8859-5" ||
+ $input_charset == "koi8-u" ) {
+ return true;
+ } else {
+ return false;
+ }
+case "koi8-u":
+ if ( $input_charset == "windows-1251" ||
+ $input_charset == "iso-8859-5" ||
+ $input_charset == "koi8-r" ) {
+ return true;
+ } else {
+ return false;
+ }
+default:
+ return false;
+endswitch;
+}
+?>