| 1 | <?php |
| 2 | |
| 3 | /** |
| 4 | ** i18n.php |
| 5 | ** |
| 6 | ** This file contains variuos functions that are needed to do |
| 7 | ** internationalization of SquirrelMail. |
| 8 | ** |
| 9 | ** Internally the output character set is used. Other characters are |
| 10 | ** encoded using Unicode entities according to HTML 4.0. |
| 11 | ** |
| 12 | **/ |
| 13 | |
| 14 | $i18n_php = true; |
| 15 | |
| 16 | // This array specifies the available languages. |
| 17 | $languages["en"]["NAME"] = "English"; |
| 18 | $languages["no"]["NAME"] = "Norsk"; |
| 19 | $languages["no"]["CHARSET"] = "iso-8859-1"; |
| 20 | $languages["de"]["NAME"] = "Deutsch"; |
| 21 | $languages["de"]["CHARSET"] = "iso-8859-1"; |
| 22 | $languages["ru"]["NAME"] = "Russian KOI8-R"; |
| 23 | $languages["ru"]["CHARSET"] = "koi8-r"; |
| 24 | $languages["pl"]["NAME"] = "Polish"; |
| 25 | $languages["pl"]["CHARSET"] = "iso-8859-2"; |
| 26 | |
| 27 | // Decodes a string to the internal encoding from the given charset |
| 28 | function charset_decode ($charset, $string) { |
| 29 | // All HTML special characters are 7 bit and can be replaced first |
| 30 | $string = htmlspecialchars ($string); |
| 31 | |
| 32 | $charset = strtolower($charset); |
| 33 | |
| 34 | if (ereg("iso-8859-(.*)", $charset, $res)) { |
| 35 | if ($res[1] == "1") |
| 36 | return charset_decode_iso_8859_1 ($string); |
| 37 | if ($res[1] == "7") |
| 38 | return charset_decode_iso_8859_7 ($string); |
| 39 | else if ($res[1] == "15") |
| 40 | return charset_decode_iso_8859_15 ($string); |
| 41 | else |
| 42 | return charset_decode_iso_8859_default ($string); |
| 43 | } else if ($charset == "ns_4551-1") { |
| 44 | return charset_decode_ns_4551_1 ($string); |
| 45 | } else if ($charset == "koi8-r") { |
| 46 | return charset_decode_koi8r ($string); |
| 47 | } else |
| 48 | return "$string"; |
| 49 | } |
| 50 | |
| 51 | // iso-8859-1 is the same as Latin 1 and is normally used |
| 52 | // in western europe. |
| 53 | function charset_decode_iso_8859_1 ($string) { |
| 54 | global $default_charset; |
| 55 | |
| 56 | if (strtolower($default_charset) == "iso-8859-1") { |
| 57 | return $string; |
| 58 | } else { |
| 59 | // Only do the slow convert if there are 8-bit characters |
| 60 | if (ereg("[\200-\377]", $string)) { |
| 61 | $string = str_replace("\201", "", $string); |
| 62 | $string = str_replace("\202", "‚", $string); |
| 63 | $string = str_replace("\203", "ƒ", $string); |
| 64 | $string = str_replace("\204", "„", $string); |
| 65 | $string = str_replace("\205", "…", $string); |
| 66 | $string = str_replace("\206", "†", $string); |
| 67 | $string = str_replace("\207", "‡", $string); |
| 68 | $string = str_replace("\210", "ˆ", $string); |
| 69 | $string = str_replace("\211", "‰", $string); |
| 70 | $string = str_replace("\212", "Š", $string); |
| 71 | $string = str_replace("\213", "‹", $string); |
| 72 | $string = str_replace("\214", "Œ", $string); |
| 73 | $string = str_replace("\215", "", $string); |
| 74 | $string = str_replace("\216", "Ž", $string); |
| 75 | $string = str_replace("\217", "", $string); |
| 76 | $string = str_replace("\220", "", $string); |
| 77 | $string = str_replace("\221", "‘", $string); |
| 78 | $string = str_replace("\222", "’", $string); |
| 79 | $string = str_replace("\223", "“", $string); |
| 80 | $string = str_replace("\224", "”", $string); |
| 81 | $string = str_replace("\225", "•", $string); |
| 82 | $string = str_replace("\226", "–", $string); |
| 83 | $string = str_replace("\227", "—", $string); |
| 84 | $string = str_replace("\230", "˜", $string); |
| 85 | $string = str_replace("\231", "™", $string); |
| 86 | $string = str_replace("\232", "š", $string); |
| 87 | $string = str_replace("\233", "›", $string); |
| 88 | $string = str_replace("\234", "œ", $string); |
| 89 | $string = str_replace("\235", "", $string); |
| 90 | $string = str_replace("\236", "ž", $string); |
| 91 | $string = str_replace("\237", "Ÿ", $string); |
| 92 | $string = str_replace("\240", " ", $string); |
| 93 | $string = str_replace("\241", "¡", $string); |
| 94 | $string = str_replace("\242", "¢", $string); |
| 95 | $string = str_replace("\243", "£", $string); |
| 96 | $string = str_replace("\244", "¤", $string); |
| 97 | $string = str_replace("\245", "¥", $string); |
| 98 | $string = str_replace("\246", "¦", $string); |
| 99 | $string = str_replace("\247", "§", $string); |
| 100 | $string = str_replace("\250", "¨", $string); |
| 101 | $string = str_replace("\251", "©", $string); |
| 102 | $string = str_replace("\252", "ª", $string); |
| 103 | $string = str_replace("\253", "«", $string); |
| 104 | $string = str_replace("\254", "¬", $string); |
| 105 | $string = str_replace("\255", "­", $string); |
| 106 | $string = str_replace("\256", "®", $string); |
| 107 | $string = str_replace("\257", "¯", $string); |
| 108 | $string = str_replace("\260", "°", $string); |
| 109 | $string = str_replace("\261", "±", $string); |
| 110 | $string = str_replace("\262", "²", $string); |
| 111 | $string = str_replace("\263", "³", $string); |
| 112 | $string = str_replace("\264", "´", $string); |
| 113 | $string = str_replace("\265", "µ", $string); |
| 114 | $string = str_replace("\266", "¶", $string); |
| 115 | $string = str_replace("\267", "·", $string); |
| 116 | $string = str_replace("\270", "¸", $string); |
| 117 | $string = str_replace("\271", "¹", $string); |
| 118 | $string = str_replace("\272", "º", $string); |
| 119 | $string = str_replace("\273", "»", $string); |
| 120 | $string = str_replace("\274", "¼", $string); |
| 121 | $string = str_replace("\275", "½", $string); |
| 122 | $string = str_replace("\276", "¾", $string); |
| 123 | $string = str_replace("\277", "¿", $string); |
| 124 | $string = str_replace("\300", "À", $string); |
| 125 | $string = str_replace("\301", "Á", $string); |
| 126 | $string = str_replace("\302", "Â", $string); |
| 127 | $string = str_replace("\303", "Ã", $string); |
| 128 | $string = str_replace("\304", "Ä", $string); |
| 129 | $string = str_replace("\305", "Å", $string); |
| 130 | $string = str_replace("\306", "Æ", $string); |
| 131 | $string = str_replace("\307", "Ç", $string); |
| 132 | $string = str_replace("\310", "È", $string); |
| 133 | $string = str_replace("\311", "É", $string); |
| 134 | $string = str_replace("\312", "Ê", $string); |
| 135 | $string = str_replace("\313", "Ë", $string); |
| 136 | $string = str_replace("\314", "Ì", $string); |
| 137 | $string = str_replace("\315", "Í", $string); |
| 138 | $string = str_replace("\316", "Î", $string); |
| 139 | $string = str_replace("\317", "Ï", $string); |
| 140 | $string = str_replace("\320", "Ð", $string); |
| 141 | $string = str_replace("\321", "Ñ", $string); |
| 142 | $string = str_replace("\322", "Ò", $string); |
| 143 | $string = str_replace("\323", "Ó", $string); |
| 144 | $string = str_replace("\324", "Ô", $string); |
| 145 | $string = str_replace("\325", "Õ", $string); |
| 146 | $string = str_replace("\326", "Ö", $string); |
| 147 | $string = str_replace("\327", "×", $string); |
| 148 | $string = str_replace("\330", "Ø", $string); |
| 149 | $string = str_replace("\331", "Ù", $string); |
| 150 | $string = str_replace("\332", "Ú", $string); |
| 151 | $string = str_replace("\333", "Û", $string); |
| 152 | $string = str_replace("\334", "Ü", $string); |
| 153 | $string = str_replace("\335", "Ý", $string); |
| 154 | $string = str_replace("\336", "Þ", $string); |
| 155 | $string = str_replace("\337", "ß", $string); |
| 156 | $string = str_replace("\340", "à", $string); |
| 157 | $string = str_replace("\341", "á", $string); |
| 158 | $string = str_replace("\342", "â", $string); |
| 159 | $string = str_replace("\343", "ã", $string); |
| 160 | $string = str_replace("\344", "ä", $string); |
| 161 | $string = str_replace("\345", "å", $string); |
| 162 | $string = str_replace("\346", "æ", $string); |
| 163 | $string = str_replace("\347", "ç", $string); |
| 164 | $string = str_replace("\350", "è", $string); |
| 165 | $string = str_replace("\351", "é", $string); |
| 166 | $string = str_replace("\352", "ê", $string); |
| 167 | $string = str_replace("\353", "ë", $string); |
| 168 | $string = str_replace("\354", "ì", $string); |
| 169 | $string = str_replace("\355", "í", $string); |
| 170 | $string = str_replace("\356", "î", $string); |
| 171 | $string = str_replace("\357", "ï", $string); |
| 172 | $string = str_replace("\360", "ð", $string); |
| 173 | $string = str_replace("\361", "ñ", $string); |
| 174 | $string = str_replace("\362", "ò", $string); |
| 175 | $string = str_replace("\363", "ó", $string); |
| 176 | $string = str_replace("\364", "ô", $string); |
| 177 | $string = str_replace("\365", "õ", $string); |
| 178 | $string = str_replace("\366", "ö", $string); |
| 179 | $string = str_replace("\367", "÷", $string); |
| 180 | $string = str_replace("\370", "ø", $string); |
| 181 | $string = str_replace("\371", "ù", $string); |
| 182 | $string = str_replace("\372", "ú", $string); |
| 183 | $string = str_replace("\373", "û", $string); |
| 184 | $string = str_replace("\374", "ü", $string); |
| 185 | $string = str_replace("\375", "ý", $string); |
| 186 | $string = str_replace("\376", "þ", $string); |
| 187 | $string = str_replace("\377", "ÿ", $string); |
| 188 | } |
| 189 | } |
| 190 | |
| 191 | return ($string); |
| 192 | } |
| 193 | |
| 194 | // iso-8859-7 is Greek. |
| 195 | function charset_decode_iso_8859_7 ($string) { |
| 196 | global $default_charset; |
| 197 | |
| 198 | if (strtolower($default_charset) == "iso-8859-7") { |
| 199 | return $string; |
| 200 | } else { |
| 201 | // Only do the slow convert if there are 8-bit characters |
| 202 | if (ereg("[\200-\377]", $string)) { |
| 203 | // Some diverse characters in the beginning |
| 204 | $string = str_replace("\240", " ", $string); |
| 205 | $string = str_replace("\241", "‘", $string); |
| 206 | $string = str_replace("\242", "’", $string); |
| 207 | $string = str_replace("\243", "£", $string); |
| 208 | $string = str_replace("\246", "¦", $string); |
| 209 | $string = str_replace("\247", "§", $string); |
| 210 | $string = str_replace("\250", "¨", $string); |
| 211 | $string = str_replace("\251", "©", $string); |
| 212 | $string = str_replace("\253", "«", $string); |
| 213 | $string = str_replace("\254", "¬", $string); |
| 214 | $string = str_replace("\255", "­", $string); |
| 215 | $string = str_replace("\257", "―", $string); |
| 216 | $string = str_replace("\260", "°", $string); |
| 217 | $string = str_replace("\261", "±", $string); |
| 218 | $string = str_replace("\262", "²", $string); |
| 219 | $string = str_replace("\263", "³", $string); |
| 220 | |
| 221 | // Horizontal bar (parentheki pavla) |
| 222 | $string = str_replace ("\257", "―", $string); |
| 223 | |
| 224 | // ISO-8859-7 characters from 11/04 (0xB4) to 11/06 (0xB6) |
| 225 | // These are Unicode 900-902 |
| 226 | while (ereg("([\264-\266])", $string, $res)) { |
| 227 | $replace = "&#" . (ord($res[1])+720) . ";"; |
| 228 | $string = str_replace($res[1], $replace, $string); |
| 229 | } |
| 230 | |
| 231 | // 11/07 (0xB7) Middle dot is the same in iso-8859-1 |
| 232 | $string = str_replace("\267", "·", $string); |
| 233 | |
| 234 | // ISO-8859-7 characters from 11/08 (0xB8) to 11/10 (0xBA) |
| 235 | // These are Unicode 900-902 |
| 236 | while (ereg("([\270-\272])", $string, $res)) { |
| 237 | $replace = "&#" . (ord($res[1])+720) . ";"; |
| 238 | $string = str_replace($res[1], $replace, $string); |
| 239 | } |
| 240 | |
| 241 | // 11/11 (0xBB) Right angle quotation mark is the same as in |
| 242 | // iso-8859-1 |
| 243 | $string = str_replace("\273", "»", $string); |
| 244 | |
| 245 | // And now the rest of the charset |
| 246 | while (ereg("([\274-\376])", $string, $res)) { |
| 247 | $replace = "&#" . (ord($res[1])+720) . ";"; |
| 248 | $string = str_replace($res[1], $replace, $string); |
| 249 | } |
| 250 | } |
| 251 | } |
| 252 | |
| 253 | return $string; |
| 254 | } |
| 255 | |
| 256 | // iso-8859-15 is Latin 15 and has very much the same use as Latin 1 |
| 257 | // but has the Euro symbol and some characters needed for French. |
| 258 | function charset_decode_iso_8859_15 ($string) { |
| 259 | // Euro sign |
| 260 | $string = str_replace ("\244", "€", $string); |
| 261 | // Latin capital letter S with caron |
| 262 | $string = str_replace ("\244", "Š", $string); |
| 263 | // Latin small letter s with caron |
| 264 | $string = str_replace ("\250", "š", $string); |
| 265 | // Latin capital letter Z with caron |
| 266 | $string = str_replace ("\264", "Ž", $string); |
| 267 | // Latin small letter z with caron |
| 268 | $string = str_replace ("\270", "ž", $string); |
| 269 | // Latin capital ligature OE |
| 270 | $string = str_replace ("\274", "Œ", $string); |
| 271 | // Latin small ligature oe |
| 272 | $string = str_replace ("\275", "œ", $string); |
| 273 | // Latin capital letter Y with diaeresis |
| 274 | $string = str_replace ("\276", "Ÿ", $string); |
| 275 | |
| 276 | return (charset_decode_iso_8859_1($string)); |
| 277 | } |
| 278 | |
| 279 | // ISO-8859-15 is Cyrillic |
| 280 | function charset_decode_iso_8859_5 ($string) { |
| 281 | // Convert to KOI8-R, then return this decoded. |
| 282 | $string = convert_cyr_string($string, "i", "k"); |
| 283 | return charset_decode_koi8r($string); |
| 284 | } |
| 285 | |
| 286 | // Remove all 8 bit characters from all other ISO-8859 character sets |
| 287 | function charset_decode_iso_8859_default ($string) { |
| 288 | return (strtr($string, "\240\241\242\243\244\245\246\247". |
| 289 | "\250\251\252\253\254\255\256\257". |
| 290 | "\260\261\262\263\264\265\266\267". |
| 291 | "\270\271\272\273\274\275\276\277". |
| 292 | "\300\301\302\303\304\305\306\307". |
| 293 | "\310\311\312\313\314\315\316\317". |
| 294 | "\320\321\322\323\324\325\326\327". |
| 295 | "\330\331\332\333\334\335\336\337". |
| 296 | "\340\341\342\343\344\345\346\347". |
| 297 | "\350\351\352\353\354\355\356\357". |
| 298 | "\360\361\362\363\364\365\366\367". |
| 299 | "\370\371\372\373\374\375\376\377", |
| 300 | "????????????????????????????????????????". |
| 301 | "????????????????????????????????????????". |
| 302 | "????????????????????????????????????????". |
| 303 | "????????")); |
| 304 | |
| 305 | } |
| 306 | |
| 307 | // This is the same as ISO-646-NO and is used by some |
| 308 | // Microsoft programs when sending Norwegian characters |
| 309 | function charset_decode_ns_4551_1 ($string) { |
| 310 | // These characters are: |
| 311 | // Latin capital letter AE |
| 312 | // Latin capital letter O with stroke |
| 313 | // Latin capital letter A with ring above |
| 314 | // and the same as small letters |
| 315 |