Paul's changes

[squirrelmail.git] / functions / i18n.php
diff --git a/functions/i18n.php b/functions/i18n.php

index e4954114ef67af9cc44ce58e59deda79ea9570fd..f7ad4658d76398f62a3e47766275cefbc4c8baec 100644 (file)
--- a/functions/i18n.php
+++ b/functions/i18n.php
@@ -17,6 +17,12 @@
  
  /* Decodes a string to the internal encoding from the given charset */
  function charset_decode ($charset, $string) {
+    global $languages, $squirrelmail_language;
+
+    if (isset($languages[$squirrelmail_language]['XTRA_CODE']) &&
+        function_exists($languages[$squirrelmail_language]['XTRA_CODE'])) {
+        $string = $languages[$squirrelmail_language]['XTRA_CODE']('decode', $string);
+    }
  
      /* All HTML special characters are 7 bit and can be replaced first */
      $string = htmlspecialchars ($string);
@@ -435,11 +441,8 @@ function charset_decode_iso_8859_7 ($string) {
       * ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6)
       * These are Unicode 900-902
       */
-    while (ereg("([\264-\266])", $string, $res)) {
-        $replace = '&#' . (ord($res[1])+720) . ';';
-        $string = str_replace($res[1], $replace, $string);
-    }
-
+    $string = preg_replace("/([\264-\266])/","'&#' . (ord(\\1)+720)",$string);
+    
      /* 11/07 (0xB7) Middle dot is the same in iso-8859-1 */
      $string = str_replace("\267", '&#183;', $string);
  
@@ -447,10 +450,7 @@ function charset_decode_iso_8859_7 ($string) {
       * ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA)
       * These are Unicode 900-902
       */
-    while (ereg("([\270-\272])", $string, $res)) {
-        $replace = '&#' . (ord($res[1])+720) . ";";
-        $string = str_replace($res[1], $replace, $string);
-    }
+    $string = preg_replace("/([\270-\272])/","'&#' . (ord(\\1)+720)",$string);
  
      /*
       * 11/11 (0xBB) Right angle quotation mark is the same as in
@@ -459,10 +459,7 @@ function charset_decode_iso_8859_7 ($string) {
      $string = str_replace("\273", '&#187;', $string);
  
      /* And now the rest of the charset */
-    while (ereg("([\274-\376])", $string, $res)) {
-        $replace = '&#' . (ord($res[1])+720) . ';';
-        $string = str_replace($res[1], $replace, $string);
-    }
+    $string = preg_replace("/([\274-\376])/","'&#' . (ord(\\1)+720)",$string);
  
      return $string;
  }
@@ -475,7 +472,7 @@ function charset_decode_iso_8859_15 ($string) {
      // Euro sign
      $string = str_replace ("\244", '&#8364;', $string);
      // Latin capital letter S with caron
-    $string = str_replace ("\244", '&#352;', $string);
+    $string = str_replace ("\246", '&#352;', $string);
      // Latin small letter s with caron
      $string = str_replace ("\250", '&#353;', $string);
      // Latin capital letter Z with caron
@@ -492,7 +489,7 @@ function charset_decode_iso_8859_15 ($string) {
      return (charset_decode_iso_8859_1($string));
  }
  
-/* ISO-8859-15 is Cyrillic */
+/* ISO-8859-5 is Cyrillic */
  function charset_decode_iso_8859_5 ($string) {
      // Convert to KOI8-R, then return this decoded.
      $string = convert_cyr_string($string, 'i', 'k');
@@ -682,6 +679,63 @@ function charset_decode_koi8r ($string) {
      return $string;
  }
  
+
+/*
+ * Japanese charset extra function
+ *
+ */
+function japanese_charset_xtra() {
+    $ret = func_get_arg(1);  /* default return value */
+    if (function_exists('mb_detect_encoding')) {
+        switch (func_get_arg(0)) { /* action */
+        case 'decode':
+            $detect_encoding = mb_detect_encoding($ret);
+            if ($detect_encoding == 'JIS' ||
+                $detect_encoding == 'EUC-JP' ||
+                $detect_encoding == 'SJIS') {
+                
+                $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
+            }
+            break;
+        case 'encode':
+            $detect_encoding = mb_detect_encoding($ret);
+            if ($detect_encoding == 'JIS' ||
+                $detect_encoding == 'EUC-JP' ||
+                $detect_encoding == 'SJIS') {
+                
+                $ret = mb_convert_encoding($ret, 'JIS', 'AUTO');
+            }
+            break;
+        case 'strimwidth':
+            $width = func_get_arg(2);
+            $ret = mb_strimwidth($ret, 0, $width, '...'); 
+            break;
+        case 'encodeheader':
+            $ret = mb_encode_mimeheader($ret);
+            break;
+        case 'decodeheader':
+            $ret = str_replace("\t", "", $ret);
+            if (eregi('=\\?([^?]+)\\?(q|b)\\?([^?]+)\\?=', $ret))
+                $ret = mb_decode_mimeheader($ret);
+            $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
+            break;
+        case 'downloadfilename':
+            $useragent = func_get_arg(2);
+            if (strstr($useragent, 'Windows') !== false ||
+                strstr($useragent, 'Mac_') !== false) {
+                $ret = mb_convert_encoding($ret, 'SJIS', 'AUTO');
+            } else {
+                $ret = mb_convert_encoding($ret, 'EUC-JP', 'AUTO');
+}
+            break;
+        default:
+            break;
+        }
+    }
+    return $ret;
+}
+
+
  /*
   * Set up the language to be output
   * if $do_search is true, then scan the browser information
@@ -712,23 +766,32 @@ function set_up_language($sm_language, $do_search = false) {
          $sm_notAlias = $languages[$sm_notAlias]['ALIAS'];
      }
  
-    if ( isset($sm_language) && 
+    if ( isset($sm_language) &&
           $use_gettext &&
           $sm_language != '' &&
           isset($languages[$sm_notAlias]['CHARSET']) ) {
          bindtextdomain( 'squirrelmail', '../locale/' );
-        textdomain( 'squirrelmail' );         
-        if ( !ini_get('safe_mode') && 
+        textdomain( 'squirrelmail' );
+        if ( !ini_get('safe_mode') &&
               getenv( 'LC_ALL' ) != $sm_notAlias ) {
              putenv( "LC_ALL=$sm_notAlias" );
              putenv( "LANG=$sm_notAlias" );
              putenv( "LANGUAGE=$sm_notAlias" );
          }
-        setlocale('LC_ALL', $sm_notAlias);
+        setlocale(LC_ALL, $sm_notAlias);
          $squirrelmail_language = $sm_notAlias;
+        if ($squirrelmail_language == 'ja_JP' && function_exists('mb_detect_encoding') ) {
+            header ('Content-Type: text/html; charset=EUC-JP');
+            if (!function_exists('mb_internal_encoding')) {
+                echo _("You need to have php4 installed with the multibyte string function enabled (using configure option --with-mbstring).");
+            }
+            mb_internal_encoding('EUC-JP');
+            mb_http_output('pass');
+        } else {
          header( 'Content-Type: text/html; charset=' . $languages[$sm_notAlias]['CHARSET'] );
      }
  }
+}
  
  function set_my_charset(){
  
@@ -742,7 +805,7 @@ function set_my_charset(){
       * message blindly with the system-wide $default_charset.
       */
      global $data_dir, $username, $default_charset, $languages;
-    
+
      $my_language = getPref($data_dir, $username, 'language');
      if (!$my_language) {
          return;
@@ -829,6 +892,11 @@ $languages['it_IT']['NAME']    = 'Italian';
  $languages['it_IT']['CHARSET'] = 'iso-8859-1';
  $languages['it']['ALIAS'] = 'it_IT';
  
+$languages['ja_JP']['NAME']    = 'Japanese';
+$languages['ja_JP']['CHARSET'] = 'iso-2022-jp';
+$languages['ja_JP']['XTRA_CODE'] = 'japanese_charset_xtra';
+$languages['ja']['ALIAS'] = 'ja_JP';
+
  $languages['ko_KR']['NAME']    = 'Korean';
  $languages['ko_KR']['CHARSET'] = 'euc-KR';
  $languages['ko']['ALIAS'] = 'ko_KR';
@@ -840,8 +908,8 @@ $languages['nl']['ALIAS'] = 'nl_NL';
  $languages['no_NO']['NAME']    = 'Norwegian (Bokm&aring;l)';
  $languages['no_NO']['CHARSET'] = 'iso-8859-1';
  $languages['no']['ALIAS'] = 'no_NO';
-$languages['no_NO_ny']['NAME']    = 'Norwegian (Nynorsk)';
-$languages['no_NO_ny']['CHARSET'] = 'iso-8859-1';
+$languages['nn_NO']['NAME']    = 'Norwegian (Nynorsk)';
+$languages['nn_NO']['CHARSET'] = 'iso-8859-1';
  
  $languages['pl_PL']['NAME']    = 'Polish';
  $languages['pl_PL']['CHARSET'] = 'iso-8859-2';
@@ -857,9 +925,9 @@ $languages['ru_RU']['NAME']    = 'Russian';
  $languages['ru_RU']['CHARSET'] = 'koi8-r';
  $languages['ru']['ALIAS'] = 'ru_RU';
  
-$languages['sr']['NAME']    = 'Serbian';
-$languages['sr']['CHARSET'] = 'iso-8859-2';
-$languages['sr_YU']['ALIAS'] = 'sr';
+$languages['sr_YU']['NAME']    = 'Serbian';
+$languages['sr_YU']['CHARSET'] = 'iso-8859-2';
+$languages['sr']['ALIAS'] = 'sr_YU';
  
  $languages['sv_SE']['NAME']    = 'Swedish';
  $languages['sv_SE']['CHARSET'] = 'iso-8859-1';
@@ -869,12 +937,14 @@ $languages['tr_TR']['NAME']    = 'Turkish';
  $languages['tr_TR']['CHARSET'] = 'iso-8859-9';
  $languages['tr']['ALIAS'] = 'tr_TR';
  
-// it's zh_TW, actually.
-
  $languages['zh_TW']['NAME']    = 'Taiwan';
  $languages['zh_TW']['CHARSET'] = 'big5';
  $languages['tw']['ALIAS'] = 'zh_TW';
  
+$languages['zh_TW']['NAME']    = 'Chinese';
+$languages['zh_TW']['CHARSET'] = 'gb2312';
+$languages['tw']['ALIAS'] = 'zh_CN';
+
  $languages['sk_SK']['NAME']     = 'Slovak';
  $languages['sk_SK']['CHARSET']  = 'iso-8859-2';
  $languages['sk']['ALIAS']       = 'sk_SK';
@@ -899,6 +969,14 @@ $languages['bg_BG']['NAME']    = 'Bulgarian';
  $languages['bg_BG']['CHARSET'] = 'windows-1251';
  $languages['bg']['ALIAS'] = 'bg_BG';
  
+// Right to left languages
+
+$languages['he_HE']['NAME']    = 'Hebrew';
+$languages['he_HE']['CHARSET'] = 'windows-1255';
+$languages['he_HE']['DIR']     = 'rtl';
+$languages['he']['ALIAS']      = 'he_HE';
+
+
  /* Detect whether gettext is installed. */
  $gettext_flags = 0;
  if (function_exists('_')) {
@@ -938,4 +1016,4 @@ elseif ($gettext_flags == 0) {
      }
  }
  
-?>
-\ No newline at end of file
+?>