X-Git-Url: https://vcs.fsf.org/?p=squirrelmail.git;a=blobdiff_plain;f=functions%2Fi18n.php;h=6836ac7533cac499c689b18524df76495cfaa705;hp=d4799d268b0eb8af7edd291a1668390372537950;hb=226a7b743417c982257640d765887f14856707af;hpb=b6c52e6192ab29a322f38006675318ec00a0724d diff --git a/functions/i18n.php b/functions/i18n.php index d4799d26..6836ac75 100644 --- a/functions/i18n.php +++ b/functions/i18n.php @@ -1,801 +1,14 @@ '),$string); - return $string; - } - } - - // iconv functions does not have html target and can be used only with utf-8 - if ( $use_php_iconv && $default_charset=='utf-8') { - $string = iconv($charset,$default_charset,$string); - return ($save_html ? $strings : htmlspecialchars($string)); - } - - // If we don't use recode and iconv, we'll do it old way. - - /* All HTML special characters are 7 bit and can be replaced first */ - if (! $save_html) $string = htmlspecialchars ($string); - - /* controls cpu and memory intensive decoding cycles */ - if (! isset($aggressive_decoding) || $aggressive_decoding=="" ) { - $aggressive_decoding=false; } - - $decode=fixcharset($charset); - $decodefile=SM_PATH . 'functions/decode/' . $decode . '.php'; - if (file_exists($decodefile)) { - include_once($decodefile); - // send $save_html argument to decoding function. needed for iso-2022-xx decoding. - $ret = call_user_func('charset_decode_'.$decode, $string, $save_html); - } else { - $ret = $string; - } - return( $ret ); -} - -/** - * Converts html string to given charset - * @since 1.5.1 and 1.4.4 - * @param string $string - * @param string $charset - * @param boolean $htmlencode keep htmlspecialchars encoding - * @param string - */ -function charset_encode($string,$charset,$htmlencode=true) { - global $default_charset; - - $encode=fixcharset($charset); - $encodefile=SM_PATH . 'functions/encode/' . $encode . '.php'; - if (file_exists($encodefile)) { - include_once($encodefile); - $ret = call_user_func('charset_encode_'.$encode, $string); - } elseif(file_exists(SM_PATH . 'functions/encode/us_ascii.php')) { - // function replaces all 8bit html entities with question marks. - // it is used when other encoding functions are unavailable - include_once(SM_PATH . 'functions/encode/us_ascii.php'); - $ret = charset_encode_us_ascii($string); - } else { - /** - * fix for yahoo users that remove all us-ascii related things - */ - $ret = $string; - } - - /** - * Undo html special chars, some places (like compose form) have - * own sanitizing functions and don't need html symbols. - * Undo chars only after encoding in order to prevent conversion of - * html entities in plain text emails. - */ - if (! $htmlencode ) { - $ret = str_replace(array('&','>','<','"'),array('&','>','<','"'),$ret); - } - return( $ret ); -} - -/** - * Combined decoding and encoding functions - * - * If conversion is done to charset different that utf-8, unsupported symbols - * will be replaced with question marks. - * @since 1.5.1 and 1.4.4 - * @param string $in_charset initial charset - * @param string $string string that has to be converted - * @param string $out_charset final charset - * @param boolean $htmlencode keep htmlspecialchars encoding - * @return string converted string - */ -function charset_convert($in_charset,$string,$out_charset,$htmlencode=true) { - $string=charset_decode($in_charset,$string,true); - $string=charset_encode($string,$out_charset,$htmlencode); - return $string; -} - -/** - * Makes charset name suitable for decoding cycles - * - * @since 1.5.0 and 1.4.4 - * @param string $charset Name of charset - * @return string $charset Adjusted name of charset */ -function fixcharset($charset) { - /* remove minus and characters that might be used in paths from charset - * name in order to be able to use it in function names and include calls. - */ - $charset=preg_replace("/[-:.\/\\\]/",'_',$charset); - - // windows-125x and cp125x charsets - $charset=str_replace('windows_','cp',$charset); - - // ibm > cp - $charset=str_replace('ibm','cp',$charset); - - // iso-8859-8-i -> iso-8859-8 - // use same cycle until I'll find differences - $charset=str_replace('iso_8859_8_i','iso_8859_8',$charset); - - return $charset; -} - -/** - * Set up the language to be output - * if $do_search is true, then scan the browser information - * for a possible language that we know - * - * Function sets system locale environment (LC_ALL, LANG, LANGUAGE), - * gettext translation bindings and html header information. - * - * Function returns error codes, if there is some fatal error. - * 0 = no error, - * 1 = mbstring support is not present, - * 2 = mbstring support is not present, user's translation reverted to en_US. - * - * @param string $sm_language translation used by user's interface - * @param bool $do_search use browser's preferred language detection functions. Defaults to false. - * @param bool $default set $sm_language to $squirrelmail_default_language if language detection fails or language is not set. Defaults to false. - * @return int function execution error codes. - */ -function set_up_language($sm_language, $do_search = false, $default = false) { - - static $SetupAlready = 0; - global $use_gettext, $languages, - $squirrelmail_language, $squirrelmail_default_language, $default_charset, - $sm_notAlias, $username, $data_dir; - - if ($SetupAlready) { - return; - } - - $SetupAlready = TRUE; - sqgetGlobalVar('HTTP_ACCEPT_LANGUAGE', $accept_lang, SQ_SERVER); - - /** - * If function is asked to detect preferred language - * OR squirrelmail default language is set to empty string - * AND - * squirrelmail language ($sm_language) is empty string - * (not set in user's prefs and no cookie with language info) - * AND - * browser provides list of preferred languages - * THEN - * get preferred language from HTTP_ACCEPT_LANGUAGE header - */ - if (($do_search || empty($squirrelmail_default_language)) && - ! $sm_language && - isset($accept_lang)) { - // TODO: use more than one language, if first language is not available - // FIXME: function assumes that string contains two or more characters. - // FIXME: some languages use 5 chars - $sm_language = substr($accept_lang, 0, 2); - } - - /** - * If language preference is not set OR script asks to use default language - * AND - * default squirrelmail language is not set to empty string - * THEN - * use default squirrelmail language value from configuration. - */ - if ((!$sm_language||$default) && - ! empty($squirrelmail_default_language)) { - $squirrelmail_language = $squirrelmail_default_language; - $sm_language = $squirrelmail_default_language; - } - - /** provide failsafe language when detection fails */ - if (! $sm_language) $sm_language='en_US'; - - $sm_notAlias = $sm_language; - - // Catching removed translation - // System reverts to English translation if user prefs contain translation - // that is not available in $languages array - if (!isset($languages[$sm_notAlias])) { - $sm_notAlias="en_US"; - } - - while (isset($languages[$sm_notAlias]['ALIAS'])) { - $sm_notAlias = $languages[$sm_notAlias]['ALIAS']; - } - - if ( isset($sm_language) && - $use_gettext && - $sm_language != '' && - isset($languages[$sm_notAlias]['CHARSET']) ) { - sq_bindtextdomain( 'squirrelmail', SM_PATH . 'locale/' ); - sq_textdomain( 'squirrelmail' ); - - // set codeset in order to avoid gettext charset conversions - if (function_exists('bind_textdomain_codeset')) { - // Japanese translation uses different internal charset - if ($sm_notAlias == 'ja_JP') { - bind_textdomain_codeset ('squirrelmail', 'EUC-JP'); - } else { - bind_textdomain_codeset ('squirrelmail', $languages[$sm_notAlias]['CHARSET'] ); - } - } - - // Use LOCALE key, if it is set. - if (isset($languages[$sm_notAlias]['LOCALE'])){ - $longlocale=$languages[$sm_notAlias]['LOCALE']; - } else { - $longlocale=$sm_notAlias; - } - - // try setting locale - $retlocale=sq_setlocale(LC_ALL, $longlocale); - - // check if locale is set and assign that locale to $longlocale - // in order to use it in putenv calls. - if (! is_bool($retlocale)) { - $longlocale=$retlocale; - } elseif (is_array($longlocale)) { - // setting of all locales failed. - // we need string instead of array used in LOCALE key. - $longlocale=$sm_notAlias; - } - - if ( !((bool)ini_get('safe_mode')) && - getenv( 'LC_ALL' ) != $longlocale ) { - putenv( "LC_ALL=$longlocale" ); - putenv( "LANG=$longlocale" ); - putenv( "LANGUAGE=$longlocale" ); - putenv( "LC_NUMERIC=C" ); - if ($sm_notAlias=='tr_TR') putenv( "LC_CTYPE=C" ); - } - // Workaround for plugins that use numbers with floating point - // It might be removed if plugins use correct decimal delimiters - // according to locale settings. - setlocale(LC_NUMERIC, 'C'); - // Workaround for specific Turkish strtolower/strtoupper rules. - // Many functions expect English conversion rules. - if ($sm_notAlias=='tr_TR') setlocale(LC_CTYPE,'C'); - - // Set text direction/alignment variables - // These don't appear to be used... are they safe to remove? - if (isset($languages[$sm_notAlias]['DIR']) && - $languages[$sm_notAlias]['DIR'] == 'rtl') { - /** - * Text direction - * @global string $text_direction - */ - $text_direction='rtl'; - /** - * Left alignment - * @global string $left_align - */ - $left_align='right'; - /** - * Right alignment - * @global string $right_align - */ - $right_align='left'; - } else { - $text_direction='ltr'; - $left_align='left'; - $right_align='right'; - } - - $squirrelmail_language = $sm_notAlias; - if ($squirrelmail_language == 'ja_JP') { - header ('Content-Type: text/html; charset=EUC-JP'); - if (!function_exists('mb_internal_encoding')) { - // Error messages can't be displayed here - $error = 1; - // Revert to English if possible. - if (function_exists('setPref') && $username!='' && $data_dir!="") { - setPref($data_dir, $username, 'language', "en_US"); - $error = 2; - } - // stop further execution in order not to get php errors on mb_internal_encoding(). - return $error; - } - if (function_exists('mb_language')) { - mb_language('Japanese'); - } - mb_internal_encoding('EUC-JP'); - mb_http_output('pass'); - } elseif ($squirrelmail_language == 'en_US') { - header( 'Content-Type: text/html; charset=' . $default_charset ); - } else { - header( 'Content-Type: text/html; charset=' . $languages[$sm_notAlias]['CHARSET'] ); - } - /** - * mbstring.func_overload fix (#929644). - * - * php mbstring extension can replace standard string functions with their multibyte - * equivalents. See http://www.php.net/ref.mbstring#mbstring.overload. This feature - * was added in php v.4.2.0 - * - * Some SquirrelMail functions work with 8bit strings in bytes. If interface is forced - * to use mbstring functions and mbstring internal encoding is set to multibyte charset, - * interface can't trust regular string functions. Due to mbstring overloading design - * limits php scripts can't control this setting. - * - * This hack should fix some issues related to 8bit strings in passwords. Correct fix is - * to disable mbstring overloading. Japanese translation uses different internal encoding. - */ - if ($squirrelmail_language != 'ja_JP' && - function_exists('mb_internal_encoding') && - check_php_version(4,2,0) && - (int)ini_get('mbstring.func_overload')!=0) { - mb_internal_encoding('pass'); - } - } - return 0; -} - -/** - * Sets default_charset variable according to the one that is used by user's translations. - * - * Function changes global $default_charset variable in order to be sure, that it - * contains charset used by user's translation. Sanity of $squirrelmail_language - * and $default_charset combination is also tested. - * - * There can be a $default_charset setting in the - * config.php file, but the user may have a different language - * selected for a user interface. This function checks the - * language selected by the user and tags the outgoing messages - * with the appropriate charset corresponding to the language - * selection. This is "more right" (tm), than just stamping the - * message blindly with the system-wide $default_charset. - */ -function set_my_charset(){ - global $data_dir, $username, $default_charset, $languages, $squirrelmail_language; - - $my_language = getPref($data_dir, $username, 'language'); - if (!$my_language) { - $my_language = $squirrelmail_language ; - } - // Catch removed translation - if (!isset($languages[$my_language])) { - $my_language="en_US"; - } - while (isset($languages[$my_language]['ALIAS'])) { - $my_language = $languages[$my_language]['ALIAS']; - } - $my_charset = $languages[$my_language]['CHARSET']; - if ($my_language!='en_US') { - $default_charset = $my_charset; - } -} - -/** - * Replaces non-braking spaces inserted by some browsers with regular space - * - * This function can be used to replace non-braking space symbols - * that are inserted in forms by some browsers instead of normal - * space symbol. - * - * @param string $string Text that needs to be cleaned - * @param string $charset Charset used in text - * @return string Cleaned text - */ -function cleanup_nbsp($string,$charset) { - - // reduce number of case statements - if (stristr('iso-8859-',substr($charset,0,9))){ - $output_charset="iso-8859-x"; - } - if (stristr('windows-125',substr($charset,0,11))){ - $output_charset="cp125x"; - } - if (stristr('koi8',substr($charset,0,4))){ - $output_charset="koi8-x"; - } - if (! isset($output_charset)){ - $output_charset=strtolower($charset); - } - -// where is non-braking space symbol -switch($output_charset): - case "iso-8859-x": - case "cp125x": - case "iso-2022-jp": - $nbsp="\xA0"; - break; - case "koi8-x": - $nbsp="\x9A"; - break; - case "utf-8": - $nbsp="\xC2\xA0"; - break; - default: - // don't change string if charset is unmatched - return $string; -endswitch; - -// return space instead of non-braking space. - return str_replace($nbsp,' ',$string); -} - -/** - * Function informs if it is safe to convert given charset to the one that is used by user. - * - * It is safe to use conversion only if user uses utf-8 encoding and when - * converted charset is similar to the one that is used by user. - * - * @param string $input_charset Charset of text that needs to be converted - * @return bool is it possible to convert to user's charset - */ -function is_conversion_safe($input_charset) { - global $languages, $sm_notAlias, $default_charset, $lossy_encoding; - - if (isset($lossy_encoding) && $lossy_encoding ) - return true; - - // convert to lower case - $input_charset = strtolower($input_charset); - - // Is user's locale Unicode based ? - if ( $default_charset == "utf-8" ) { - return true; - } - - // Charsets that are similar -switch ($default_charset): -case "windows-1251": - if ( $input_charset == "iso-8859-5" || - $input_charset == "koi8-r" || - $input_charset == "koi8-u" ) { - return true; - } else { - return false; - } -case "windows-1257": - if ( $input_charset == "iso-8859-13" || - $input_charset == "iso-8859-4" ) { - return true; - } else { - return false; - } -case "iso-8859-4": - if ( $input_charset == "iso-8859-13" || - $input_charset == "windows-1257" ) { - return true; - } else { - return false; - } -case "iso-8859-5": - if ( $input_charset == "windows-1251" || - $input_charset == "koi8-r" || - $input_charset == "koi8-u" ) { - return true; - } else { - return false; - } -case "iso-8859-13": - if ( $input_charset == "iso-8859-4" || - $input_charset == "windows-1257" ) { - return true; - } else { - return false; - } -case "koi8-r": - if ( $input_charset == "windows-1251" || - $input_charset == "iso-8859-5" || - $input_charset == "koi8-u" ) { - return true; - } else { - return false; - } -case "koi8-u": - if ( $input_charset == "windows-1251" || - $input_charset == "iso-8859-5" || - $input_charset == "koi8-r" ) { - return true; - } else { - return false; - } -default: - return false; -endswitch; -} - - -/* ------------------------------ main --------------------------- */ - -global $squirrelmail_language, $languages, $use_gettext; - -if (! sqgetGlobalVar('squirrelmail_language',$squirrelmail_language,SQ_COOKIE)) { - $squirrelmail_language = ''; -} - -/** - * Array specifies the available translations. - * - * Structure of array: - * $languages['language']['variable'] = 'value' - * - * Possible 'variable' names: - * NAME - Translation name in English - * CHARSET - Encoding used by translation - * ALIAS - used when 'language' is only short name and 'value' should provide long language name - * ALTNAME - Native translation name. Any 8bit symbols must be html encoded. - * LOCALE - Full locale name (in xx_XX.charset format). It can use array with more than one locale name since 1.4.5 and 1.5.1 - * DIR - Text direction. Used to define Right-to-Left languages. Possible values 'rtl' or 'ltr'. If undefined - defaults to 'ltr' - * XTRA_CODE - translation uses special functions. See doc/i18n.txt - * - * Each 'language' definition requires NAME+CHARSET or ALIAS variables. - * - * @name $languages - * @global array $languages - */ -$languages['en_US']['NAME'] = 'English'; -$languages['en_US']['CHARSET'] = 'iso-8859-1'; -$languages['en_US']['LOCALE'] = 'en_US.ISO8859-1'; -$languages['en']['ALIAS'] = 'en_US'; - -/** - * Automatic translation loading from setup.php files. - * Solution for bug. 1240889. - * setup.php file can contain $languages array entries and XTRA_CODE functions. - */ -if (is_dir(SM_PATH . 'locale') && - is_readable(SM_PATH . 'locale')) { - $localedir = dir(SM_PATH . 'locale'); - while($lang_dir=$localedir->read()) { - // remove trailing slash, if present - if (substr($lang_dir,-1)=='/') { - $lang_dir = substr($lang_dir,0,-1); - } - if ($lang_dir != '..' && $lang_dir != '.' && $lang_dir != 'CVS' && - is_dir(SM_PATH.'locale/'.$lang_dir) && - file_exists(SM_PATH.'locale/'.$lang_dir.'/setup.php')) { - include_once(SM_PATH.'locale/'.$lang_dir.'/setup.php'); - } - } - $localedir->close(); -} - -/* Detect whether gettext is installed. */ -$gettext_flags = 0; -if (function_exists('_')) { - $gettext_flags += 1; -} -if (function_exists('bindtextdomain')) { - $gettext_flags += 2; -} -if (function_exists('textdomain')) { - $gettext_flags += 4; -} -if (function_exists('ngettext')) { - $gettext_flags += 8; -} - -/* If gettext is fully loaded, cool */ -if ($gettext_flags == 15) { - $use_gettext = true; -} - -/* If ngettext support is missing, load it */ -elseif ($gettext_flags == 7) { - $use_gettext = true; - // load internal ngettext functions - include_once(SM_PATH . 'class/l10n.class.php'); - include_once(SM_PATH . 'functions/ngettext.php'); -} -/* If we can fake gettext, try that */ -elseif ($gettext_flags == 0) { - $use_gettext = true; - include_once(SM_PATH . 'functions/gettext.php'); -} else { - /* Uh-ho. A weird install */ - if (! $gettext_flags & 1) { - /** - * Function is used as replacement in broken installs - * @ignore - */ - function _($str) { - return $str; - } - } - if (! $gettext_flags & 2) { - /** - * Function is used as replacement in broken installs - * @ignore - */ - function bindtextdomain() { - return; - } - } - if (! $gettext_flags & 4) { - /** - * Function is used as replacemet in broken installs - * @ignore - */ - function textdomain() { - return; - } - } - if (! $gettext_flags & 8) { - /** - * Function is used as replacemet in broken installs - * @ignore - */ - function ngettext($str,$str2,$number) { - if ($number>1) { - return $str2; - } else { - return $str; - } - } - } - if (! function_exists('dgettext')) { - /** - * Replacement for broken setups. - * @ignore - */ - function dgettext($domain,$str) { - return $str; - } - } - if (! function_exists('dngettext')) { - /** - * Replacement for broken setups - * @ignore - */ - function dngettext($domain,$str1,$strn,$number) { - return ($number==1 ? $str1 : $strn); - } - } -} +/** break if somebody tries to load this file */ +die('Rewrite your code, functions/i18n.php file location is changed in 1.5.2.' + .' Direct loading of functions/i18n.php is deprecated.'); ?> \ No newline at end of file