X-Git-Url: https://vcs.fsf.org/?a=blobdiff_plain;f=functions%2Fi18n.php;h=83dfe3063cef78140383525d1f661ba17bfc8c18;hb=7fcab811a919289459e616f0e47388c1cb27195a;hp=3d99ed0690253bba2e694310d8c7161a30a71720;hpb=d6c32258c05219670ab3b4ae2d460d844ea9a247;p=squirrelmail.git diff --git a/functions/i18n.php b/functions/i18n.php index 3d99ed06..83dfe306 100644 --- a/functions/i18n.php +++ b/functions/i18n.php @@ -1,9 +1,9 @@ ','<','"'),$string); + } + $encode=fixcharset($charset); + $encodefile=SM_PATH . 'functions/encode/' . $encode . '.php'; + if (file_exists($encodefile)) { + include_once($encodefile); + $ret = call_user_func('charset_encode_'.$encode, $string); + } else { + $ret = $string; + } + return( $ret ); } -/* - * This is the same as ISO-646-NO and is used by some - * Microsoft programs when sending Norwegian characters +/** + * Combined decoding and encoding functions + * + * If conversion is done to charset different than utf-8, unsupported symbols + * will be replaced with question marks. 
+ * @param string $in_charset initial charset + * @param string $string string that has to be converted + * @param string $out_charset final charset + * @param boolean $htmlencode keep htmlspecialchars encoding + * @return string converted string */ -function charset_decode_ns_4551_1 ($string) { - /* - * These characters are: - * Latin capital letter AE - * Latin capital letter O with stroke - * Latin capital letter A with ring above - * and the same as small letters - */ - return strtr ($string, "[\\]{|}", "ÆØÅæøå"); +function charset_convert($in_charset,$string,$out_charset,$htmlencode=true) { + $string=charset_decode($in_charset,$string); + $string=charset_encode($string,$out_charset,$htmlencode); + return $string; } +/** + * Makes charset name suitable for decoding cycles + * + * @param string $charset Name of charset + * @return string $charset Adjusted name of charset + */ +function fixcharset($charset) { + // minus removed from function names + $charset=str_replace('-','_',$charset); + + // windows-125x and cp125x charsets + $charset=str_replace('windows_','cp',$charset); + + // ibm > cp + $charset=str_replace('ibm','cp',$charset); -/* + // iso-8859-8-i -> iso-8859-8 + // use same cycle until I'll find differences + $charset=str_replace('iso_8859_8_i','iso_8859_8',$charset); + + return $charset; +} + +/** * Set up the language to be output * if $do_search is true, then scan the browser information * for a possible language that we know + * + * Function sets system locale environment (LC_ALL, LANG, LANGUAGE), + * gettext translation bindings and html header information. + * + * Function returns error codes, if there is some fatal error. + * 0 = no error, + * 1 = mbstring support is not present, + * 2 = mbstring support is not present, user's translation reverted to en_US. + * + * @param string $sm_language translation used by user's interface + * @param bool $do_search use browser's preferred language detection functions. Defaults to false. 
+ * @param bool $default set $sm_language to $squirrelmail_default_language if language detection fails or language is not set. Defaults to false. + * @return int function execution error codes. */ function set_up_language($sm_language, $do_search = false, $default = false) { static $SetupAlready = 0; global $use_gettext, $languages, $squirrelmail_language, $squirrelmail_default_language, - $sm_notAlias; + $sm_notAlias, $username, $data_dir; if ($SetupAlready) { return; @@ -289,8 +217,7 @@ function set_up_language($sm_language, $do_search = false, $default = false) { // Catching removed translation // System reverts to English translation if user prefs contain translation - // that is not available in $languages array (admin removed directory - // with that translation) + // that is not available in $languages array if (!isset($languages[$sm_notAlias])) { $sm_notAlias="en_US"; } @@ -305,26 +232,63 @@ function set_up_language($sm_language, $do_search = false, $default = false) { isset($languages[$sm_notAlias]['CHARSET']) ) { bindtextdomain( 'squirrelmail', SM_PATH . 
'locale/' ); textdomain( 'squirrelmail' ); - if (function_exists('bind_textdomain_codeset')) { - bind_textdomain_codeset ("squirrelmail", $languages[$sm_notAlias]['CHARSET'] ); - } - if (isset($languages[$sm_notAlias]['LOCALE'])){ - $longlocale=$languages[$sm_notAlias]['LOCALE']; - } else { - $longlocale=$sm_notAlias; - } + if (function_exists('bind_textdomain_codeset')) { + if ($sm_notAlias == 'ja_JP') { + bind_textdomain_codeset ("squirrelmail", 'EUC-JP'); + } else { + bind_textdomain_codeset ("squirrelmail", $languages[$sm_notAlias]['CHARSET'] ); + } + } + if (isset($languages[$sm_notAlias]['LOCALE'])){ + $longlocale=$languages[$sm_notAlias]['LOCALE']; + } else { + $longlocale=$sm_notAlias; + } if ( !ini_get('safe_mode') && getenv( 'LC_ALL' ) != $longlocale ) { putenv( "LC_ALL=$longlocale" ); putenv( "LANG=$longlocale" ); putenv( "LANGUAGE=$longlocale" ); } - setlocale(LC_ALL, $longlocale); - $squirrelmail_language = $sm_notAlias; - if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) { + setlocale(LC_ALL, $longlocale); + + // Set text direction/alignment variables + if (isset($languages[$sm_notAlias]['DIR']) && + $languages[$sm_notAlias]['DIR'] == 'rtl') { + /** + * Text direction + * @global string $text_direction + */ + $text_direction='rtl'; + /** + * Left alignment + * @global string $left_align + */ + $left_align='right'; + /** + * Right alignment + * @global string $right_align + */ + $right_align='left'; + } else { + $text_direction='ltr'; + $left_align='left'; + $right_align='right'; + } + + $squirrelmail_language = $sm_notAlias; + if ($squirrelmail_language == 'ja_JP') { header ('Content-Type: text/html; charset=EUC-JP'); if (!function_exists('mb_internal_encoding')) { - echo _("You need to have php4 installed with the multibyte string function enabled (using configure option --enable-mbstring)."); + // Error messages can't be displayed here + $error = 1; + // Revert to English if possible. 
+ if (function_exists('setPref') && $username!='' && $data_dir!="") { + setPref($data_dir, $username, 'language', "en_US"); + $error = 2; + } + // stop further execution in order not to get php errors on mb_internal_encoding(). + return $error; } if (function_exists('mb_language')) { mb_language('Japanese'); @@ -335,19 +299,25 @@ function set_up_language($sm_language, $do_search = false, $default = false) { header( 'Content-Type: text/html; charset=' . $languages[$sm_notAlias]['CHARSET'] ); } } + return 0; } +/** + * Sets default_charset variable according to the one that is used by user's translations. + * + * Function changes global $default_charset variable in order to be sure, that it + * contains charset used by user's translation. Sanity of $squirrelmail_default_language + * and $default_charset combination provided in SquirrelMail config is also tested. + * + * There can be a $default_charset setting in the + * config.php file, but the user may have a different language + * selected for a user interface. This function checks the + * language selected by the user and tags the outgoing messages + * with the appropriate charset corresponding to the language + * selection. This is "more right" (tm), than just stamping the + * message blindly with the system-wide $default_charset. + */ function set_my_charset(){ - - /* - * There can be a $default_charset setting in the - * config.php file, but the user may have a different language - * selected for a user interface. This function checks the - * language selected by the user and tags the outgoing messages - * with the appropriate charset corresponding to the language - * selection. This is "more right" (tm), than just stamping the - * message blindly with the system-wide $default_charset. - */ global $data_dir, $username, $default_charset, $languages, $squirrelmail_default_language; $my_language = getPref($data_dir, $username, 'language'); @@ -375,103 +345,149 @@ if (! 
isset($squirrelmail_language)) { $squirrelmail_language = ''; } -/* This array specifies the available languages. */ +/** + * Array specifies the available translations. + * + * Structure of array: + * $languages['language']['variable'] = 'value' + * + * Possible 'variable' names: + * NAME - Translation name in English + * CHARSET - Encoding used by translation + * ALIAS - used when 'language' is only short name and 'value' should provide long language name + * ALTNAME - Native translation name. Any 8bit symbols must be html encoded. + * LOCALE - Full locale name (in xx_XX.charset format) + * DIR - Text direction. Used to define Right-to-Left languages. Possible values 'rtl' or 'ltr'. If undefined - defaults to 'ltr' + * XTRA_CODE - translation uses special functions. See doc/i18n.txt + * + * Each 'language' definition requires NAME+CHARSET or ALIAS variables. + * + * @name $languages + * @global array $languages + */ $languages['bg_BG']['NAME'] = 'Bulgarian'; $languages['bg_BG']['ALTNAME'] = 'Български'; $languages['bg_BG']['CHARSET'] = 'windows-1251'; +$languages['bg_BG']['LOCALE'] = 'bg_BG.CP1251'; $languages['bg']['ALIAS'] = 'bg_BG'; $languages['ca_ES']['NAME'] = 'Catalan'; $languages['ca_ES']['CHARSET'] = 'iso-8859-1'; +$languages['ca_ES']['LOCALE'] = 'ca_ES.ISO8859-1'; $languages['ca']['ALIAS'] = 'ca_ES'; $languages['cs_CZ']['NAME'] = 'Czech'; $languages['cs_CZ']['ALTNAME'] = 'Čeština'; $languages['cs_CZ']['CHARSET'] = 'iso-8859-2'; +$languages['cs_CZ']['LOCALE'] = 'cs_CZ.ISO8859-2'; $languages['cs']['ALIAS'] = 'cs_CZ'; $languages['cy_GB']['NAME'] = 'Welsh'; $languages['cy_GB']['ALTNAME'] = 'Cymraeg'; $languages['cy_GB']['CHARSET'] = 'iso-8859-1'; +$languages['cy_GB']['LOCALE'] = 'cy_GB.ISO8859-1'; $languages['cy']['ALIAS'] = 'cy_GB'; // Danish locale is da_DK. 
$languages['da_DK']['NAME'] = 'Danish'; $languages['da_DK']['ALTNAME'] = 'Dansk'; $languages['da_DK']['CHARSET'] = 'iso-8859-1'; +$languages['da_DK']['LOCALE'] = 'da_DK.ISO8859-1'; $languages['da']['ALIAS'] = 'da_DK'; $languages['de_DE']['NAME'] = 'German'; $languages['de_DE']['ALTNAME'] = 'Deutsch'; $languages['de_DE']['CHARSET'] = 'iso-8859-1'; +$languages['de_DE']['LOCALE'] = 'de_DE.ISO8859-1'; $languages['de']['ALIAS'] = 'de_DE'; $languages['el_GR']['NAME'] = 'Greek'; $languages['el_GR']['ALTNAME'] = 'Ελληνικά'; $languages['el_GR']['CHARSET'] = 'iso-8859-7'; +$languages['el_GR']['LOCALE'] = 'el_GR.ISO8859-7'; $languages['el']['ALIAS'] = 'el_GR'; -// There is no en_EN! There is en_US, en_BR, en_AU, and so forth, -// but who cares about !US, right? Right? :) +$languages['en_GB']['NAME'] = 'British'; +$languages['en_GB']['CHARSET'] = 'iso-8859-15'; +$languages['en_GB']['LOCALE'] = 'en_GB.ISO8859-15'; + $languages['en_US']['NAME'] = 'English'; $languages['en_US']['CHARSET'] = 'iso-8859-1'; +$languages['en_US']['LOCALE'] = 'en_US.ISO8859-1'; $languages['en']['ALIAS'] = 'en_US'; $languages['es_ES']['NAME'] = 'Spanish'; $languages['es_ES']['ALTNAME'] = 'Español'; $languages['es_ES']['CHARSET'] = 'iso-8859-1'; +$languages['es_ES']['LOCALE'] = 'es_ES.ISO8859-1'; $languages['es']['ALIAS'] = 'es_ES'; $languages['et_EE']['NAME'] = 'Estonian'; $languages['et_EE']['CHARSET'] = 'iso-8859-15'; +$languages['et_EE']['LOCALE'] = 'et_EE.ISO8859-15'; $languages['et']['ALIAS'] = 'et_EE'; +$languages['eu_ES']['NAME'] = 'Basque'; +$languages['eu_ES']['CHARSET'] = 'iso-8859-1'; +$languages['eu_ES']['LOCALE'] = 'eu_ES.ISO8859-1'; +$languages['eu']['ALIAS'] = 'eu_ES'; + $languages['fo_FO']['NAME'] = 'Faroese'; $languages['fo_FO']['CHARSET'] = 'iso-8859-1'; +$languages['fo_FO']['LOCALE'] = 'fo_FO.ISO8859-1'; $languages['fo']['ALIAS'] = 'fo_FO'; $languages['fi_FI']['NAME'] = 'Finnish'; $languages['fi_FI']['ALTNAME'] = 'Suomi'; $languages['fi_FI']['CHARSET'] = 'iso-8859-1'; 
+$languages['fi_FI']['LOCALE'] = 'fi_FI.ISO8859-1'; $languages['fi']['ALIAS'] = 'fi_FI'; $languages['fr_FR']['NAME'] = 'French'; $languages['fr_FR']['ALTNAME'] = 'Français'; $languages['fr_FR']['CHARSET'] = 'iso-8859-1'; +$languages['fr_FR']['LOCALE'] = 'fr_FR.ISO8859-1'; $languages['fr']['ALIAS'] = 'fr_FR'; $languages['hr_HR']['NAME'] = 'Croatian'; $languages['hr_HR']['CHARSET'] = 'iso-8859-2'; +$languages['hr_HR']['LOCALE'] = 'hr_HR.ISO8859-2'; $languages['hr']['ALIAS'] = 'hr_HR'; $languages['hu_HU']['NAME'] = 'Hungarian'; $languages['hu_HU']['ALTNAME'] = 'Magyar'; $languages['hu_HU']['CHARSET'] = 'iso-8859-2'; +$languages['hu_HU']['LOCALE'] = 'hu_HU.ISO8859-2'; $languages['hu']['ALIAS'] = 'hu_HU'; $languages['id_ID']['NAME'] = 'Indonesian'; $languages['id_ID']['ALTNAME'] = 'Bahasa Indonesia'; $languages['id_ID']['CHARSET'] = 'iso-8859-1'; +$languages['id_ID']['LOCALE'] = 'id_ID.ISO8859-1'; $languages['id']['ALIAS'] = 'id_ID'; $languages['is_IS']['NAME'] = 'Icelandic'; $languages['is_IS']['ALTNAME'] = 'Íslenska'; $languages['is_IS']['CHARSET'] = 'iso-8859-1'; +$languages['is_IS']['LOCALE'] = 'is_IS.ISO8859-1'; $languages['is']['ALIAS'] = 'is_IS'; $languages['it_IT']['NAME'] = 'Italian'; $languages['it_IT']['CHARSET'] = 'iso-8859-1'; +$languages['it_IT']['LOCALE'] = 'it_IT.ISO8859-1'; $languages['it']['ALIAS'] = 'it_IT'; $languages['ja_JP']['NAME'] = 'Japanese'; $languages['ja_JP']['ALTNAME'] = '日本語'; $languages['ja_JP']['CHARSET'] = 'iso-2022-jp'; -$languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra'; +$languages['ja_JP']['LOCALE'] = 'ja_JP.EUC-JP'; +$languages['ja_JP']['XTRA_CODE'] = 'japanese_xtra'; $languages['ja']['ALIAS'] = 'ja_JP'; $languages['ko_KR']['NAME'] = 'Korean'; $languages['ko_KR']['CHARSET'] = 'euc-KR'; -$languages['ko_KR']['XTRA_CODE'] = 'korean_charset_xtra'; +$languages['ko_KR']['LOCALE'] = 'ko_KR.EUC-KR'; +$languages['ko_KR']['XTRA_CODE'] = 'korean_xtra'; $languages['ko']['ALIAS'] = 'ko_KR'; $languages['lt_LT']['NAME'] = 'Lithuanian'; @@ 
-483,92 +499,115 @@ $languages['lt']['ALIAS'] = 'lt_LT'; $languages['nl_NL']['NAME'] = 'Dutch'; $languages['nl_NL']['ALTNAME'] = 'Nederlands'; $languages['nl_NL']['CHARSET'] = 'iso-8859-1'; +$languages['nl_NL']['LOCALE'] = 'nl_NL.ISO8859-1'; $languages['nl']['ALIAS'] = 'nl_NL'; $languages['ms_MY']['NAME'] = 'Malay'; $languages['ms_MY']['ALTNAME'] = 'Bahasa Melayu'; $languages['ms_MY']['CHARSET'] = 'iso-8859-1'; +$languages['ms_MY']['LOCALE'] = 'ms_MY.ISO8859-1'; $languages['my']['ALIAS'] = 'ms_MY'; -$languages['no_NO']['NAME'] = 'Norwegian (Bokmål)'; -$languages['no_NO']['ALTNAME'] = 'Norsk (Bokmål)'; -$languages['no_NO']['CHARSET'] = 'iso-8859-1'; -$languages['no']['ALIAS'] = 'no_NO'; +$languages['nb_NO']['NAME'] = 'Norwegian (Bokmål)'; +$languages['nb_NO']['ALTNAME'] = 'Norsk (Bokmål)'; +$languages['nb_NO']['CHARSET'] = 'iso-8859-1'; +$languages['nb_NO']['LOCALE'] = 'nb_NO.ISO8859-1'; +$languages['nb']['ALIAS'] = 'nb_NO'; $languages['nn_NO']['NAME'] = 'Norwegian (Nynorsk)'; $languages['nn_NO']['ALTNAME'] = 'Norsk (Nynorsk)'; $languages['nn_NO']['CHARSET'] = 'iso-8859-1'; +$languages['nn_NO']['LOCALE'] = 'nn_NO.ISO8859-1'; $languages['pl_PL']['NAME'] = 'Polish'; $languages['pl_PL']['ALTNAME'] = 'Polski'; $languages['pl_PL']['CHARSET'] = 'iso-8859-2'; +$languages['pl_PL']['LOCALE'] = 'pl_PL.ISO8859-2'; $languages['pl']['ALIAS'] = 'pl_PL'; $languages['pt_PT']['NAME'] = 'Portuguese (Portugal)'; $languages['pt_PT']['CHARSET'] = 'iso-8859-1'; +$languages['pt_PT']['LOCALE'] = 'pt_PT.ISO8859-1'; $languages['pt']['ALIAS'] = 'pt_PT'; $languages['pt_BR']['NAME'] = 'Portuguese (Brazil)'; $languages['pt_BR']['ALTNAME'] = 'Português do Brasil'; $languages['pt_BR']['CHARSET'] = 'iso-8859-1'; +$languages['pt_BR']['LOCALE'] = 'pt_BR.ISO8859-1'; $languages['ro_RO']['NAME'] = 'Romanian'; $languages['ro_RO']['ALTNAME'] = 'Română'; $languages['ro_RO']['CHARSET'] = 'iso-8859-2'; +$languages['ro_RO']['LOCALE'] = 'ro_RO.ISO8859-2'; $languages['ro']['ALIAS'] = 'ro_RO'; 
$languages['ru_RU']['NAME'] = 'Russian'; $languages['ru_RU']['ALTNAME'] = 'Русский'; $languages['ru_RU']['CHARSET'] = 'utf-8'; -$languages['ru_RU']['LOCALE'] = 'ru_RU.UTF-8'; +$languages['ru_RU']['LOCALE'] = 'ru_RU.UTF-8'; $languages['ru']['ALIAS'] = 'ru_RU'; -$languages['sk_SK']['NAME'] = 'Slovak'; -$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; -$languages['sk']['ALIAS'] = 'sk_SK'; +$languages['sk_SK']['NAME'] = 'Slovak'; +$languages['sk_SK']['CHARSET'] = 'iso-8859-2'; +$languages['sk_SK']['LOCALE'] = 'sk_SK.ISO8859-2'; +$languages['sk']['ALIAS'] = 'sk_SK'; $languages['sl_SI']['NAME'] = 'Slovenian'; $languages['sl_SI']['ALTNAME'] = 'Slovenščina'; $languages['sl_SI']['CHARSET'] = 'iso-8859-2'; +$languages['sl_SI']['LOCALE'] = 'sl_SI.ISO8859-2'; $languages['sl']['ALIAS'] = 'sl_SI'; $languages['sr_YU']['NAME'] = 'Serbian'; $languages['sr_YU']['ALTNAME'] = 'Srpski'; $languages['sr_YU']['CHARSET'] = 'iso-8859-2'; +$languages['sr_YU']['LOCALE'] = 'sr_YU.ISO8859-2'; $languages['sr']['ALIAS'] = 'sr_YU'; $languages['sv_SE']['NAME'] = 'Swedish'; $languages['sv_SE']['ALTNAME'] = 'Svenska'; $languages['sv_SE']['CHARSET'] = 'iso-8859-1'; +$languages['sv_SE']['LOCALE'] = 'sv_SE.ISO8859-1'; $languages['sv']['ALIAS'] = 'sv_SE'; $languages['th_TH']['NAME'] = 'Thai'; $languages['th_TH']['CHARSET'] = 'tis-620'; +$languages['th_TH']['LOCALE'] = 'th_TH.TIS-620'; $languages['th']['ALIAS'] = 'th_TH'; +$languages['tl_PH']['NAME'] = 'Tagalog'; +$languages['tl_PH']['CHARSET'] = 'iso-8859-1'; +$languages['tl_PH']['LOCALE'] = 'tl_PH.ISO8859-1'; +$languages['tl']['ALIAS'] = 'tl_PH'; + $languages['tr_TR']['NAME'] = 'Turkish'; $languages['tr_TR']['CHARSET'] = 'iso-8859-9'; +$languages['tr_TR']['LOCALE'] = 'tr_TR.ISO8859-9'; $languages['tr']['ALIAS'] = 'tr_TR'; $languages['zh_TW']['NAME'] = 'Chinese Trad'; $languages['zh_TW']['CHARSET'] = 'big5'; +$languages['zh_TW']['LOCALE'] = 'zh_TW.BIG5'; $languages['tw']['ALIAS'] = 'zh_TW'; $languages['zh_CN']['NAME'] = 'Chinese Simp'; 
$languages['zh_CN']['CHARSET'] = 'gb2312'; +$languages['zh_CN']['LOCALE'] = 'zh_CN.GB2312'; $languages['cn']['ALIAS'] = 'zh_CN'; -/* $languages['uk_UA']['NAME'] = 'Ukrainian'; $languages['uk_UA']['CHARSET'] = 'koi8-u'; +$languages['uk_UA']['LOCALE'] = 'uk_UA.KOI8-U'; $languages['uk']['ALIAS'] = 'uk_UA'; -*/ + +$languages['ru_UA']['NAME'] = 'Russian (Ukrainian)'; +$languages['ru_UA']['CHARSET'] = 'koi8-r'; +$languages['ru_UA']['LOCALE'] = 'ru_UA.KOI8-R'; + /* -if ( file_exists( SM_PATH . 'locale/vi_VN') ) { - $languages['vi_VN']['NAME'] = 'Vietnamese'; - $languages['vi_VN']['CHARSET'] = 'utf-8'; - $languages['vi']['ALIAS'] = 'vi_VN'; -} +$languages['vi_VN']['NAME'] = 'Vietnamese'; +$languages['vi_VN']['CHARSET'] = 'utf-8'; +$languages['vi']['ALIAS'] = 'vi_VN'; */ // Right to left languages @@ -576,11 +615,22 @@ $languages['ar']['NAME'] = 'Arabic'; $languages['ar']['CHARSET'] = 'windows-1256'; $languages['ar']['DIR'] = 'rtl'; +$languages['fa_IR']['NAME'] = 'Farsi'; +$languages['fa_IR']['CHARSET'] = 'utf-8'; +$languages['fa_IR']['DIR'] = 'rtl'; +$languages['fa_IR']['LOCALE'] = 'fa_IR.UTF-8'; +$languages['fa']['ALIAS'] = 'fa_IR'; + $languages['he_IL']['NAME'] = 'Hebrew'; $languages['he_IL']['CHARSET'] = 'windows-1255'; +$languages['he_IL']['LOCALE'] = 'he_IL.CP1255'; $languages['he_IL']['DIR'] = 'rtl'; $languages['he']['ALIAS'] = 'he_IL'; +$languages['ug']['NAME'] = 'Uighur'; +$languages['ug']['CHARSET'] = 'utf-8'; +$languages['ug']['DIR'] = 'rtl'; + /* Detect whether gettext is installed. */ $gettext_flags = 0; if (function_exists('_')) { @@ -604,16 +654,28 @@ elseif ($gettext_flags == 0) { } else { /* Uh-ho. A weird install */ if (! $gettext_flags & 1) { + /** + * Function is used as replacement in broken installs + * @ignore + */ function _($str) { return $str; } } if (! $gettext_flags & 2) { + /** + * Function is used as replacement in broken installs + * @ignore + */ function bindtextdomain() { return; } } if (! 
$gettext_flags & 4) { + /** + * Function is used as replacement in broken installs + * @ignore + */ function textdomain() { return; } @@ -621,11 +683,27 @@ elseif ($gettext_flags == 0) { } -/* +/** * Japanese charset extra function * + * Action performed by function is defined by first argument. + * Default return value is defined by second argument. + * Use of third argument depends on action. + * + * @param string $action action performed by this function. + * possible values: + * decode - convert returned string to euc-jp. third argument unused + * encode - convert returned string to jis. third argument unused + * strimwidth - third argument=$width. trims string to $width symbols. + * encodeheader - create base64 encoded header in iso-2022-jp. third argument unused + * decodeheader - return human readable string from mime header. string is returned in euc-jp. third argument unused + * downloadfilename - third argument $useragent. Arguments provide browser info. Returns shift-jis or euc-jp encoded file name + * wordwrap - third argument=$wrap. wraps text at $wrap symbols + * utf7-imap_encode - returns string converted from euc-jp to utf7-imap. third argument unused + * utf7-imap_decode - returns string converted from utf7-imap to euc-jp. third argument unused + * @param string $ret default return value */ -function japanese_charset_xtra() { +function japanese_xtra() { $ret = func_get_arg(1); /* default return value */ if (function_exists('mb_detect_encoding')) { switch (func_get_arg(0)) { /* action */ @@ -751,38 +829,275 @@ function japanese_charset_xtra() { return $ret; } +/************************** + * Japanese extra functions + **************************/ -/* - * Korean charset extra function - * Hangul(Korean Character) Attached File Name Fix. +/** + * Japanese decoding function + * + * converts string to euc-jp, if string uses JIS, EUC-JP, ShiftJIS or UTF-8 + * charset. Needs mbstring support in php. 
+ * @param string $ret text, that has to be converted + * @return string converted string + * @since 1.5.1 */ -function korean_charset_xtra() { - - $ret = func_get_arg(1); /* default return value */ - if (func_get_arg(0) == 'downloadfilename') { /* action */ - $ret = str_replace("\x0D\x0A", '', $ret); /* Hanmail's CR/LF Clear */ - for ($i=0;$i<strlen($ret);$i++) { - if ($ret[$i] >= "\xA1" && $ret[$i] <= "\xFE") { /* 0xA1 - 0XFE are Valid */ - $i++; - continue; - } else if (($ret[$i] >= 'a' && $ret[$i] <= 'z') || /* From Original ereg_replace in download.php */ - ($ret[$i] >= 'A' && $ret[$i] <= 'Z') || - ($ret[$i] == '.') || ($ret[$i] == '-')) { - continue; - } else { - $ret[$i] = '_'; +function japanese_xtra_decode($ret) { + if (function_exists('mb_detect_encoding')) { + $detect_encoding = @mb_detect_encoding($ret); + if ($detect_encoding == 'JIS' || + $detect_encoding == 'EUC-JP' || + $detect_encoding == 'SJIS' || + $detect_encoding == 'UTF-8') { + + $ret = mb_convert_kana(mb_convert_encoding($ret, 'EUC-JP', 'AUTO'), "KV"); + } + } + return $ret; +} + +/** + * Japanese encoding function + * + * converts string to jis, if string uses JIS, EUC-JP, ShiftJIS or UTF-8 + * charset. Needs mbstring support in php. 
+ * @param string $ret text, that has to be converted + * @return string converted text + * @since 1.5.1 + */ +function japanese_xtra_encode($ret) { + if (function_exists('mb_detect_encoding')) { + $detect_encoding = @mb_detect_encoding($ret); + if ($detect_encoding == 'JIS' || + $detect_encoding == 'EUC-JP' || + $detect_encoding == 'SJIS' || + $detect_encoding == 'UTF-8') { + + $ret = mb_convert_encoding(mb_convert_kana($ret, "KV"), 'JIS', 'AUTO'); + } + } + return $ret; +} + +/** + * Japanese header encoding function + * + * creates base64 encoded header in iso-2022-jp charset + * @param string $ret text, that has to be converted + * @return string mime base64 encoded string + * @since 1.5.1 + */ +function japanese_xtra_encodeheader($ret) { + if (function_exists('mb_detect_encoding')) { + $result = ''; + if (strlen($ret) > 0) { + $tmpstr = mb_substr($ret, 0, 1); + $prevcsize = strlen($tmpstr); + for ($i = 1; $i < mb_strlen($ret); $i++) { + $tmp = mb_substr($ret, $i, 1); + if (strlen($tmp) == $prevcsize) { + $tmpstr .= $tmp; + } else { + if ($prevcsize == 1) { + $result .= $tmpstr; + } else { + $result .= str_replace(' ', '', + mb_encode_mimeheader($tmpstr,'iso-2022-jp','B','')); + } + $tmpstr = $tmp; + $prevcsize = strlen($tmp); + } + } + if (strlen($tmpstr)) { + if (strlen(mb_substr($tmpstr, 0, 1)) == 1) + $result .= $tmpstr; + else + $result .= str_replace(' ', '', + mb_encode_mimeheader($tmpstr,'iso-2022-jp','B','')); } } + $ret = $result; + } + return $ret; +} + +/** + * Japanese header decoding function + * + * return human readable string from mime header. string is returned in euc-jp + * charset. 
+ * @param string $ret header string + * @return string decoded header string + * @since 1.5.1 + */ +function japanese_xtra_decodeheader($ret) { + if (function_exists('mb_detect_encoding')) { + $ret = str_replace("\t", "", $ret); + if (eregi('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=', $ret)) + $ret = @mb_decode_mimeheader($ret); + $ret = @mb_convert_encoding($ret, 'EUC-JP', 'AUTO'); + } + return $ret; +} +/** + * Japanese downloaded filename processing function + * + * Returns shift-jis or euc-jp encoded file name + * @param string $ret string + * @param string $useragent browser + * @return string converted string + * @since 1.5.1 + */ +function japanese_xtra_downloadfilename($ret,$useragent) { + if (function_exists('mb_detect_encoding')) { + if (strstr($useragent, 'Windows') !== false || + strstr($useragent, 'Mac_') !== false) { + $ret = mb_convert_encoding($ret, 'SJIS', 'AUTO'); + } else { + $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO'); + } } + return $ret; +} +/** + * Japanese wordwrap function + * + * wraps text at set number of symbols + * @param string $ret text + * @param integer $wrap number of symbols per line + * @return string wrapped text + * @since 1.5.1 + */ +function japanese_xtra_wordwrap($ret,$wrap) { + if (function_exists('mb_detect_encoding')) { + $no_begin = "\x21\x25\x29\x2c\x2e\x3a\x3b\x3f\x5d\x7d\xa1\xf1\xa1\xeb\xa1" . + "\xc7\xa1\xc9\xa2\xf3\xa1\xec\xa1\xed\xa1\xee\xa1\xa2\xa1\xa3\xa1\xb9" . + "\xa1\xd3\xa1\xd5\xa1\xd7\xa1\xd9\xa1\xdb\xa1\xcd\xa4\xa1\xa4\xa3\xa4" . + "\xa5\xa4\xa7\xa4\xa9\xa4\xc3\xa4\xe3\xa4\xe5\xa4\xe7\xa4\xee\xa1\xab" . + "\xa1\xac\xa1\xb5\xa1\xb6\xa5\xa1\xa5\xa3\xa5\xa5\xa5\xa7\xa5\xa9\xa5" . + "\xc3\xa5\xe3\xa5\xe5\xa5\xe7\xa5\xee\xa5\xf5\xa5\xf6\xa1\xa6\xa1\xbc" . + "\xa1\xb3\xa1\xb4\xa1\xaa\xa1\xf3\xa1\xcb\xa1\xa4\xa1\xa5\xa1\xa7\xa1" . + "\xa8\xa1\xa9\xa1\xcf\xa1\xd1"; + $no_end = "\x5c\x24\x28\x5b\x7b\xa1\xf2\x5c\xa1\xc6\xa1\xc8\xa1\xd2\xa1" . 
+ "\xd4\xa1\xd6\xa1\xd8\xa1\xda\xa1\xcc\xa1\xf0\xa1\xca\xa1\xce\xa1\xd0\xa1\xef"; + + if (strlen($ret) >= $wrap && + substr($ret, 0, 1) != '>' && + strpos($ret, 'http://') === FALSE && + strpos($ret, 'https://') === FALSE && + strpos($ret, 'ftp://') === FALSE) { + + $ret = mb_convert_kana($ret, "KV"); + + $line_new = ''; + $ptr = 0; + + while ($ptr < strlen($ret) - 1) { + $l = mb_strcut($ret, $ptr, $wrap); + $ptr += strlen($l); + $tmp = $l; + + $l = mb_strcut($ret, $ptr, 2); + while (strlen($l) != 0 && mb_strpos($no_begin, $l) !== FALSE ) { + $tmp .= $l; + $ptr += strlen($l); + $l = mb_strcut($ret, $ptr, 1); + } + $line_new .= $tmp; + if ($ptr < strlen($ret) - 1) + $line_new .= "\n"; + } + $ret = $line_new; + } + } return $ret; } -/* +/** + * Japanese imap folder name encoding function + * + * converts folder name from euc-jp to utf7-imap + * @param string $ret folder name + * @return string converted folder name + * @since 1.5.1 + */ +function japanese_xtra_utf7_imap_encode($ret){ + if (function_exists('mb_detect_encoding')) { + $ret = mb_convert_encoding($ret, 'UTF7-IMAP', 'EUC-JP'); + } + return $ret; +} + +/** + * Japanese imap folder name decoding function + * + * converts folder name from utf7-imap to euc-jp. 
+ * @param string $ret folder name in utf7-imap + * @return string converted folder name + * @since 1.5.1 + */ +function japanese_xtra_utf7_imap_decode($ret) { + if (function_exists('mb_detect_encoding')) { + $ret = mb_convert_encoding($ret, 'EUC-JP', 'UTF7-IMAP'); + } + return $ret; +} + +/** + * Japanese string trimming function + * + * trims string to defined number of symbols + * @param string $ret string + * @param integer $width number of symbols + * @return string trimmed string + * @since 1.5.1 + */ +function japanese_xtra_strimwidth($ret,$width) { + if (function_exists('mb_detect_encoding')) { + $ret = mb_strimwidth($ret, 0, $width, '...'); + } + return $ret; +} + +/******************************** + * Korean charset extra functions + ********************************/ + +/** + * Korean downloaded filename processing functions + * + * @param string default return value + * @return string + */ +function korean_xtra_downloadfilename($ret) { + $ret = str_replace("\x0D\x0A", '', $ret); /* Hanmail's CR/LF Clear */ + for ($i=0;$i<strlen($ret);$i++) { + if ($ret[$i] >= "\xA1" && $ret[$i] <= "\xFE") { /* 0xA1 - 0XFE are Valid */ + $i++; + continue; + } else if (($ret[$i] >= 'a' && $ret[$i] <= 'z') || /* From Original ereg_replace in download.php */ + ($ret[$i] >= 'A' && $ret[$i] <= 'Z') || + ($ret[$i] == '.') || ($ret[$i] == '-')) { + continue; + } else { + $ret[$i] = '_'; + } + } + return $ret; +} + +/** + * Replaces non-breaking spaces inserted by some browsers with regular space + * * This function can be used to replace non-braking space symbols * that are inserted in forms by some browsers instead of normal * space symbol. + * + * @param string $string Text that needs to be cleaned + * @param string $charset Charset used in text + * @return string Cleaned text */ function cleanup_nbsp($string,$charset) { @@ -822,6 +1137,15 @@ endswitch; return str_replace($nbsp,' ',$string); } +/** + * Function informs if it is safe to convert given charset to the one that is used by user. 
+ * + * It is safe to use conversion only if user uses utf-8 encoding and when + * converted charset is similar to the one that is used by user. + * + * @param string $input_charset Charset of text that needs to be converted + * @return bool is it possible to convert to user's charset + */ function is_conversion_safe($input_charset) { global $languages, $sm_notAlias, $default_charset; @@ -837,30 +1161,30 @@ function is_conversion_safe($input_charset) { switch ($default_charset): case "windows-1251": if ( $input_charset == "iso-8859-5" || - $input_charset == "koi8-r" || - $input_charset == "koi8-u" ) { + $input_charset == "koi8-r" || + $input_charset == "koi8-u" ) { return true; } else { return false; } case "windows-1257": if ( $input_charset == "iso-8859-13" || - $input_charset == "iso-8859-4" ) { + $input_charset == "iso-8859-4" ) { return true; } else { return false; } case "iso-8859-4": if ( $input_charset == "iso-8859-13" || - $input_charset == "windows-1257" ) { + $input_charset == "windows-1257" ) { return true; } else { return false; } case "iso-8859-5": if ( $input_charset == "windows-1251" || - $input_charset == "koi8-r" || - $input_charset == "koi8-u" ) { + $input_charset == "koi8-r" || + $input_charset == "koi8-u" ) { return true; } else { return false; @@ -874,16 +1198,16 @@ case "iso-8859-13": } case "koi8-r": if ( $input_charset == "windows-1251" || - $input_charset == "iso-8859-5" || - $input_charset == "koi8-u" ) { + $input_charset == "iso-8859-5" || + $input_charset == "koi8-u" ) { return true; } else { return false; } case "koi8-u": if ( $input_charset == "windows-1251" || - $input_charset == "iso-8859-5" || - $input_charset == "koi8-r" ) { + $input_charset == "iso-8859-5" || + $input_charset == "koi8-r" ) { return true; } else { return false; @@ -892,4 +1216,4 @@ default: return false; endswitch; } -?> +?> \ No newline at end of file